Skip to content

Instantly share code, notes, and snippets.

@Tirael
Last active November 24, 2016 21:15
Show Gist options
  • Save Tirael/0f9a88a41d73e0f575287733271c50f3 to your computer and use it in GitHub Desktop.
Save Tirael/0f9a88a41d73e0f575287733271c50f3 to your computer and use it in GitHub Desktop.
Dynamic paging with Nightmare / Electron (page scrape)
var Nightmare = require('nightmare');
var vo = require('vo');
vo(run)(function(err, result) {
if (err) throw err;
});
function* run() {
var nightmare = Nightmare({ show: true }),
MAX_PAGE = 100,
currentPage = 0,
nextExists = true,
links = [];
yield nightmare
.goto('http://www.google.com')
.wait('input[name="q"]')
.click('input[name="q"]')
.type('input[name="q"]', 'Anequim Project')
.click('input[name="btnK"]')
.wait(2000)
nextExists = yield nightmare.visible('#pnnext');
while (nextExists && currentPage < MAX_PAGE) {
links.push(yield nightmare
.evaluate(function() {
var linkArray = [];
var links = document.querySelectorAll('h3.r a');
return links[0].href;
}));
yield nightmare
.click('#pnnext')
.wait(2000)
currentPage++;
nextExists = yield nightmare.visible('#pnnext');
}
console.dir(links);
yield nightmare.end();
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment