Created by
zhao fuyun
last modified
| const puppeteer = require('puppeteer');
const fs = require('fs');
/**
 * Scrapes the paginated list at goldwind.com.cn (investors.do, action=financial)
 * and writes every collected entry to ./notice.json.
 *
 * Pages 1..totalPages are visited one after another with a single Puppeteer
 * page. For each page, every `li` under `#scroll_box ul.textList` becomes an
 * object of the form `{ text, href, datetime }`:
 *   - text:     textContent of the first `<a>` in the item
 *   - href:     the anchor's href passed through decodeURI (the raw href is
 *               kept when it is not decodable)
 *   - datetime: textContent of `span.time`, or null when that span is absent
 * Items that contain no `<a>` are skipped instead of aborting the run.
 *
 * The browser is always closed, even when navigation, extraction or the file
 * write fails. Any failure is logged and reported through a non-zero exit code.
 */
(async () => {
  const totalPages = 125;
  const browser = await puppeteer.launch();

  try {
    const page = await browser.newPage();
    const list = [];

    for (let i = 1; i <= totalPages; i++) {
      console.log(`${i}/${totalPages}`);
      const url = `http://www.goldwind.com.cn/web/investors.do?action=financial&cid=201004200356190000&page=${i}`;
      await page.goto(url);

      // This callback is serialized and executed inside the page, so it must
      // be self-contained: it cannot reference anything from the Node scope.
      const result = await page.$eval('#scroll_box ul.textList', (el) => {
        const entries = [];
        for (const li of el.querySelectorAll('li')) {
          const link = li.querySelector('a');
          if (link === null) {
            // No anchor means nothing to record for this item.
            continue;
          }
          const time = li.querySelector('span.time');

          let href = link.href;
          try {
            href = decodeURI(href);
          } catch (err) {
            // decodeURI throws URIError on malformed escapes; keep the raw
            // href in that case and rethrow anything unexpected.
            if (!(err instanceof URIError)) {
              throw err;
            }
          }

          entries.push({
            text: link.textContent,
            href,
            datetime: time === null ? null : time.textContent,
          });
        }
        return entries;
      });

      list.push(...result);
    }

    console.log('done!');
    fs.writeFileSync('./notice.json', JSON.stringify(list, null, 4));
  } finally {
    // Release the browser process on both success and failure.
    await browser.close();
  }
})().catch((err) => {
  // Do not leave the top-level promise floating: report and flag the failure.
  console.error(err);
  process.exitCode = 1;
});
|