simplecrawler
Advanced tools
Comparing version 0.0.8 to 0.0.9
10
index.js
@@ -282,3 +282,3 @@ // Simplecrawler | ||
cleanAndQueue(resourceText.match(/^javascript\:[a-z0-9]+\(['"][^'"\s]+/ig)); | ||
return resources; | ||
@@ -352,3 +352,9 @@ } | ||
function queueLinkedItems(resourceData,queueItem) { | ||
discoverResources(resourceData,queueItem).forEach(function(url){ queueURL(url,queueItem); }); | ||
var resources = discoverResources(resourceData,queueItem); | ||
// Emit discovered resources (e.g. this might be useful for building a graph
// of page relationships).
crawler.emit("discoverycomplete",queueItem,resources); | ||
resources.forEach(function(url){ queueURL(url,queueItem); }); | ||
} | ||
@@ -355,0 +361,0 @@ |
{ | ||
"name": "simplecrawler", | ||
"description": "Very straightforward web crawler. Uses EventEmitter. Generates queue statistics and has a basic cache mechanism with extensible backend.",
"version": "0.0.8", | ||
"version": "0.0.9", | ||
"homepage": "http://github.com/cgiffard/node-simplecrawler", | ||
@@ -6,0 +6,0 @@ "author": "Christopher Giffard <christopher.giffard@cgiffard.com>", |
Sorry, the diff of this file is not supported yet
53589
986
272