Crawlab Node.js SDK
用于在 Crawlab 的 Node.js 爬虫任务中把爬取到的内容写入结果集。兼容 Crawlab 0.6.0 版本。
安装
npm i crawlab-node-sdk
pnpm add crawlab-node-sdk
使用
const { getCollection } = require('crawlab-node-sdk')
/**
 * Usage example: builds five sample records (pages 1-5 of one book), passes
 * them to `addDataList` on the collection obtained from `getCollection()`,
 * and logs whatever that call resolves with.
 *
 * @returns {Promise<void>} Resolves once the result has been logged.
 */
async function test() {
  const BOOK_ID = 556677;
  const PAGE_COUNT = 5;

  // Sample rows: one record per page, numbered from 1.
  const rows = Array.from({ length: PAGE_COUNT }, (_, index) => ({
    book: BOOK_ID,
    page: index + 1,
  }));

  const resultCollection = await getCollection();
  const inserted = await resultCollection.addDataList(rows);
  console.log('Inserted documents =>', inserted);
}
// Run the example. Exit explicitly with 0 on success; on failure, log the
// error and exit with a non-zero code instead of leaving the rejection
// unhandled.
test()
  .then(() => {
    process.exit(0);
  })
  .catch((err) => {
    console.error(err);
    process.exit(1);
  });
对应环境的docker-compose.yml
# Compose file with two services: a Crawlab master node and the MongoDB
# instance it is configured to connect to.
version: '3.3'
services:
  master:
    image: easonxie/crawlab-nodejs
    container_name: crawlab_master
    restart: always
    environment:
      CRAWLAB_NODE_MASTER: "Y"
      # "mongo" is the name of the MongoDB service defined below.
      CRAWLAB_MONGO_HOST: "mongo"
      CRAWLAB_MONGO_PORT: "27017"
      CRAWLAB_MONGO_DB: "crawlab"
      # Placeholder credentials; same values as MONGO_INITDB_ROOT_* below.
      CRAWLAB_MONGO_USERNAME: "username"
      CRAWLAB_MONGO_PASSWORD: "password"
      CRAWLAB_MONGO_AUTHSOURCE: "admin"
    volumes:
      - "/opt/crawlab/master:/data"
    ports:
      # host port 7878 -> container port 8080
      - "7878:8080"
    depends_on:
      - mongo
  mongo:
    image: mongo:4.2
    restart: always
    environment:
      # Placeholder root credentials; replace before real use.
      MONGO_INITDB_ROOT_USERNAME: "username"
      MONGO_INITDB_ROOT_PASSWORD: "password"
    volumes:
      - "/opt/crawlab/mongo/data/db:/data/db"
    ports:
      - "27017:27017"
ChangeLog
- 0.0.1 初始化
- 0.0.5 添加readme说明