Noun. Aranea - a genus of orb-weaving spiders including common garden spiders and barn spiders
Aranea is a Node.js-powered web spider; I made it to learn the ropes. At the moment it only pulls back all the links on the first page. Not very useful, huh?
// Basic usage: create a spider, subscribe to its 'pageFinished' event,
// and start crawling from a single URL.
var Aranea = require('./lib/aranea');

var spider = new Aranea();

// The handler is passed the page object that has just finished.
spider.on('pageFinished', function (page) {
  // Do something with each page!
});

spider.crawl("http://google.com");
// Selecting links by class: set `linkSelector` before crawling and print
// the links reported for each finished page.
var Aranea = require('./lib/aranea');

var spider = new Aranea();

// Judging by the sample output below, only anchors matching this
// selector end up in `page.links`.
spider.linkSelector = 'a.gb1';

spider.on('pageFinished', function (page) {
  // console.log replaces the removed sys.puts; both write one line to stdout.
  console.log(JSON.stringify(page.links));
});

spider.crawl("http://google.com");

// Sample output:
// ["http://www.google.com/imghp?hl=en&tab=wi"
// ,"http://video.google.com/?hl=en&tab=wv"
// ,"http://maps.google.com/maps?hl=en&tab=wl"
// ,"http://news.google.com/nwshp?hl=en&tab=wn"
// ,"http://www.google.com/prdhp?hl=en&tab=wf"
// ,"http://mail.google.com/mail/?hl=en&tab=wm"]
// Selecting links by attribute: `linkSelector` here uses an attribute
// prefix selector so that only hrefs starting with "http://mail." match.
var Aranea = require('./lib/aranea');

var spider = new Aranea();

spider.linkSelector = 'a[href^="http://mail."]';

spider.on('pageFinished', function (page) {
  // console.log replaces the removed sys.puts; both write one line to stdout.
  console.log(JSON.stringify(page.links));
});

spider.crawl("http://google.com");

// Sample output:
// ["http://mail.google.com/mail/?hl=en&tab=wm"]