Hero scripts of machete.
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 

53 lines
1.4 KiB

import Hero from '@ulixee/hero';
import configs from '../config.mjs';
import HeroBot from './HeroBot.mjs';
class Xigua extends HeroBot {
async scrap(url) {
let data = {};
try {
let options = {};
if (this.heroServer) {
options.connectionToCore = this.heroServer;
}
const profile = await this.init('xigua');
if (profile) {
options.userProfile = profile;
}
const hero = new Hero(options);
await hero.goto(url, configs.heroBotOptions);
//等待所有内容加载完成
const tab = await hero.activeTab;
await tab.waitForLoad('AllContentLoaded', {timeoutMs: configs.heroTabOptions.timeoutMs});
//解析网页HTML数据
const elems = await hero.detach( hero.document.querySelectorAll('meta') );
let meta_name = '';
for (const elem of elems) {
meta_name = elem.getAttribute('name');
if (!meta_name) {continue;}
meta_name = meta_name.toLowerCase();
if (meta_name.indexOf('og:image') > -1) {
data.cover = elem.getAttribute('content');
}else if (meta_name.indexOf('og:title') > -1) {
data.title = elem.getAttribute('content');
}
}
await hero.close();
}catch(error) {
console.error("Error got when request %s via hero: %s", url, error);
};
return data;
}
}
export default Xigua;