web-spider
Version:
web-spider is a simple and fast web spider written in Node.js!
26 lines (24 loc) • 644 B
JavaScript
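/**
 * This is the simplest possible example.
 * It fetches the cnodejs home page; the cnodejs module under the web
 * directory describes the data to extract from it.
 */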
const cheerio = require('cheerio');
// Page fetched by this example.
const url = "https://cnodejs.org";

// Options object passed to the spider as `urlInfo`: the target URL plus a
// `proxy` entry (presumably the HTTP proxy the request is routed through —
// confirm against the spider implementation).
const urlInfo = {url: url, proxy: { host: '111.56.40.134', port: '8118', protocol: 'http' }};

// The package root exports the spider constructor.
const Spider = require('../');
const spider = new Spider({urlInfo: urlInfo});

/**
 * 'success' handler: logs the raw result, loads `data.data.content` into
 * cheerio, runs the cnodejs.org extractor on it and logs the extracted list.
 * Any failure while parsing or extracting is logged instead of being rethrown.
 */
spider.on('success', (data) => {
  try {
    console.log(data);
    const $ = cheerio.load(data.data.content);
    // Loaded inside the try block so that a module load failure is logged
    // by the catch below rather than aborting the script.
    const web = require('./web/cnodejs.org');
    web.run($);
    console.log(web.getList());
  } catch (e) {
    console.error(e);
  }
});

/**
 * 'error' handler: logs whatever error the spider reports.
 */
spider.on('error', (err) => {
  console.error(err);
});

// Start the spider only after both handlers are attached, so that an event
// emitted synchronously from start() is not missed (an 'error' event without
// a listener would be thrown if the spider is a Node EventEmitter).
spider.start();