Ported from mono0x/extractcontent.
npm install extract-main-text
// Usage example: analyze a page and print the extracted title and main text.
var BodyExtractor = require('extract-main-text');

// The extractor is configured with the URL of the page to analyze.
var extractor = new BodyExtractor({
  url: 'http://***.com/'
});

// analyze() returns a promise; once it resolves, the results are read
// from the extractor instance itself.
extractor.analyze()
  .then(function () {
    console.log(extractor.title);
    console.log(extractor.mainText);
  })
  .catch(function (err) {
    // Report failures instead of leaving the rejection unhandled.
    console.error(err);
  });
Released under the BSD license.