![分享一个好用的Nodejs爬虫工具-crawler](https://pic.rmb.bdstatic.com/bjh/1c0800079c8df93ab778d86cbf131227.jpeg@s_0,w_2000)
在网上找到了一个用于网页爬取的库,挺好用,分享给大家。直接看代码:
这里的地址是随便找的一个网站,请勿非法使用!!!
const Crawler = require('crawler');

// Crawler instance used by this script: at most two concurrent connections,
// with the 'cheerio' option so each response exposes a selector function
// as `res.$`.
const c = new Crawler({
  maxConnections: 2,
  jQuery: 'cheerio',
});

const baseUrl = 'http://kaijiang.500.com/ssq.shtml';

/**
 * Collects the entries found directly under `.iSelectList`.
 *
 * @param {Function} $ - Selector function taken from the crawler response.
 * @returns {Array<Object>} One `{ [text]: href }` object per child element;
 *   `href` is `undefined` when the child has no such attribute.
 */
function collectOtherLinks($) {
  const others = [];
  // Iterate with the selection's own `.each()` so only matched elements are
  // visited. Object.values() on the selection would also walk its
  // non-element own properties (such as `length`).
  $('.iSelectList').children().each((i, element) => {
    const item = $(element);
    others.push({ [item.text()]: item.attr('href') });
  });
  return others;
}

c.queue({
  url: baseUrl,
  /**
   * Handles the fetched page: logs the red-ball texts, the
   * `[date, blue-ball text]` pair and the `.iSelectList` links.
   *
   * @param {Error|null} error - Request error, if any.
   * @param {Object} res - Crawler response; `res.$` is the selector function.
   * @param {Function} done - Must be called once this task is finished.
   */
  callback: (error, res, done) => {
    try {
      if (error) {
        console.log(error);
        return;
      }

      const $ = res.$;
      const dates = $('#change_date').text();

      const reds = [];
      $('.ball_box01').children().children().filter('.ball_red').each((i, element) => {
        reds.push($(element).text());
      });

      // Kept as in the original output: the date string followed by the
      // concatenated text of every `.ball_blue` element.
      const blues = [dates, $('.ball_box01').children().find('.ball_blue').text()];

      const others = collectOtherLinks($);

      console.log(reds, blues, others);
    } finally {
      // Always signal completion, including on the error path and when
      // parsing throws, so the crawler can release this task's slot.
      done();
    }
  },
});