mns
My News Scraper - Scrape sites for groups of articles
Example of usage
var mns = require( 'mns' );
var scraper = mns({
url : "http://news.ycombinator.com/news",
type : "text/html",
selectors : {
list : "td:not([align]).title",
article : {
url : {
selector : "a",
attr : "href"
},
src : "span",
title : "a"
}
}
});
scraper.execute(function( err, items ) {
if ( err ) {
return console.log( err );
}
});
Some website configurations are available in test/files/sitesToScrape.json.
Disclaimer
This is still a work in progress, under active development. At the moment, the library is in the alpha stage and provides only very basic functionality. If you have any questions, feel free to open an issue on this repository.