simplecrawler
Advanced tools
+8
-2
@@ -282,3 +282,3 @@ // Simplecrawler | ||
| cleanAndQueue(resourceText.match(/^javascript\:[a-z0-9]+\(['"][^'"\s]+/ig)); | ||
| return resources; | ||
@@ -352,3 +352,9 @@ } | ||
| function queueLinkedItems(resourceData,queueItem) { | ||
| discoverResources(resourceData,queueItem).forEach(function(url){ queueURL(url,queueItem); }); | ||
| var resources = discoverResources(resourceData,queueItem); | ||
| // Emit discovered resources. ie: might be useful in building a graph of | ||
| // page relationships. | ||
| crawler.emit("discoverycomplete",queueItem,resources); | ||
| resources.forEach(function(url){ queueURL(url,queueItem); }); | ||
| } | ||
@@ -355,0 +361,0 @@ |
+1
-1
| { | ||
| "name": "simplecrawler", | ||
| "description": "Very straigntforward web crawler. Uses EventEmitter. Generates queue statistics and has a basic cache mechanism with extensible backend.", | ||
| "version": "0.0.8", | ||
| "version": "0.0.9", | ||
| "homepage": "http://github.com/cgiffard/node-simplecrawler", | ||
@@ -6,0 +6,0 @@ "author": "Christopher Giffard <christopher.giffard@cgiffard.com>", |
Sorry, the diff of this file is not supported yet
Network access
Supply chain risk: This module accesses the network.
Found 3 instances in 1 package
Filesystem access
Supply chain risk: Accesses the file system, and could potentially read sensitive data.
Found 1 instance in 1 package
Long strings
Supply chain risk: Contains long string literals, which may be a sign of obfuscated or packed code.
Found 1 instance in 1 package
Network access
Supply chain risk: This module accesses the network.
Found 3 instances in 1 package
Filesystem access
Supply chain risk: Accesses the file system, and could potentially read sensitive data.
Found 1 instance in 1 package
Long strings
Supply chain risk: Contains long string literals, which may be a sign of obfuscated or packed code.
Found 1 instance in 1 package
53589
0.86%986
0.41%272
1.87%9
12.5%