Huge News!Announcing our $40M Series B led by Abstract Ventures.Learn More
Socket
Sign inDemoInstall
Socket

scrapq

Package Overview
Dependencies
Maintainers
1
Versions
17
Alerts
File Explorer

Advanced tools

Socket logo

Install Socket

Detect and block malicious and high-risk dependencies

Install

scrapq - npm Package Compare versions

Comparing version 2.0.1 to 2.1.0

.gitlab-ci.yml

5

CHANGELOG.md

@@ -9,2 +9,7 @@ # Changelog

## [2.1.0] - 2020-18-04
- Added support for `exist` selector
- Rename `GeType` to `TypeOfQuery`
## [2.0.0] - 2020-13-02

@@ -11,0 +16,0 @@

4

dist/browser/scrapq.min.js

@@ -1,2 +0,2 @@

var scrapq=function(t){var e={};function r(n){if(e[n])return e[n].exports;var u=e[n]={i:n,l:!1,exports:{}};return t[n].call(u.exports,u,u.exports,r),u.l=!0,u.exports}return r.m=t,r.c=e,r.d=function(t,e,n){r.o(t,e)||Object.defineProperty(t,e,{enumerable:!0,get:n})},r.r=function(t){"undefined"!=typeof Symbol&&Symbol.toStringTag&&Object.defineProperty(t,Symbol.toStringTag,{value:"Module"}),Object.defineProperty(t,"__esModule",{value:!0})},r.t=function(t,e){if(1&e&&(t=r(t)),8&e)return t;if(4&e&&"object"==typeof t&&t&&t.__esModule)return t;var n=Object.create(null);if(r.r(n),Object.defineProperty(n,"default",{enumerable:!0,value:t}),2&e&&"string"!=typeof t)for(var u in t)r.d(n,u,function(e){return t[e]}.bind(null,u));return n},r.n=function(t){var e=t&&t.__esModule?function(){return t.default}:function(){return t};return r.d(e,"a",e),e},r.o=function(t,e){return Object.prototype.hasOwnProperty.call(t,e)},r.p="",r(r.s=0)}([function(t,e,r){"use strict";Object.defineProperty(e,"__esModule",{value:!0});var n=r(1),u=r(2),o=r(3);function c(t){return"type"in t&&"select"in t}function i(t,e,r){switch(r.type){case"text":var n=""===r.select?t(e).text():t(r.select,e).text();return n||n.trim();case"attr":return(f=""===r.select?e:t(r.select,e)).attr(r.attr);case"count":return(o=t(r.select,e)).length;case"list":for(var u=[],o=t(r.select,e),s=0;s<o.length;s++){var f=o.eq(s),a=c(r.query)?i(t,f,r.query):l(t,f,r.query,{});u.push(a)}return u;case"html":if(""===r.select)return t(e).html();var p=(f=t(r.select,e)).html();return"string"==typeof p?p.trim():p;default:throw new Error('Undefined selector "'+JSON.stringify(r)+'"')}}function l(t,e,r,n){return Object.keys(r).forEach((function(u){var o=r[u];c(o)?n[u]=i(t,e,o):n[u]=l(t,e,o,{})})),n}e.scrap=function(t,e){var r=n.load(t),u=r.root();return c(e)?i(r,u,e):l(r,u,e,{})},e.$={attr:u.attr,text:u.text,count:u.count,list:o.list,html:u.html}},function(t,e){t.exports=cheerio},function(t,e,r){"use strict";Object.defineProperty(e,"__esModule",{value:!0}),e.attr=function(t,e){return{type:"attr",select:t,attr:e}},e.text=function(t){return{type:"text",select:t}},e.count=function(t){return{type:"count",select:t}},e.html=function(t){return{type:"html",select:t}}},function(t,e,r){"use strict";Object.defineProperty(e,"__esModule",{value:!0}),e.list=function(t,e){return{type:"list",select:t,query:e}}}]);
//# sourceMappingURL=data:application/json;charset=utf-8;base64,{"version":3,"sources":["webpack://scrapq/webpack/bootstrap","webpack://scrapq/./lib/index.ts","webpack://scrapq/external \"cheerio\"","webpack://scrapq/./lib/selectors.ts","webpack://scrapq/./lib/controls.ts"],"names":["installedModules","__webpack_require__","moduleId","exports","module","i","l","modules","call","m","c","d","name","getter","o","Object","defineProperty","enumerable","get","r","Symbol","toStringTag","value","t","mode","__esModule","ns","create","key","bind","n","object","property","prototype","hasOwnProperty","p","s","isSelectorOrControl","test","scrapSelector","$","context","selector","type","select","text","trim","el","attr","els","length","result","eq","scrapedEl","query","scrapQuery","push","html","Error","JSON","stringify","ref","keys","forEach","prop","val","load","root","count","list","cheerio","attribute"],"mappings":"uBACE,IAAIA,EAAmB,GAGvB,SAASC,EAAoBC,GAG5B,GAAGF,EAAiBE,GACnB,OAAOF,EAAiBE,GAAUC,QAGnC,IAAIC,EAASJ,EAAiBE,GAAY,CACzCG,EAAGH,EACHI,GAAG,EACHH,QAAS,IAUV,OANAI,EAAQL,GAAUM,KAAKJ,EAAOD,QAASC,EAAQA,EAAOD,QAASF,GAG/DG,EAAOE,GAAI,EAGJF,EAAOD,QA0Df,OArDAF,EAAoBQ,EAAIF,EAGxBN,EAAoBS,EAAIV,EAGxBC,EAAoBU,EAAI,SAASR,EAASS,EAAMC,GAC3CZ,EAAoBa,EAAEX,EAASS,IAClCG,OAAOC,eAAeb,EAASS,EAAM,CAAEK,YAAY,EAAMC,IAAKL,KAKhEZ,EAAoBkB,EAAI,SAAShB,GACX,oBAAXiB,QAA0BA,OAAOC,aAC1CN,OAAOC,eAAeb,EAASiB,OAAOC,YAAa,CAAEC,MAAO,WAE7DP,OAAOC,eAAeb,EAAS,aAAc,CAAEmB,OAAO,KAQvDrB,EAAoBsB,EAAI,SAASD,EAAOE,GAEvC,GADU,EAAPA,IAAUF,EAAQrB,EAAoBqB,IAC/B,EAAPE,EAAU,OAAOF,EACpB,GAAW,EAAPE,GAA8B,iBAAVF,GAAsBA,GAASA,EAAMG,WAAY,OAAOH,EAChF,IAAII,EAAKX,OAAOY,OAAO,MAGvB,GAFA1B,EAAoBkB,EAAEO,GACtBX,OAAOC,eAAeU,EAAI,UAAW,CAAET,YAAY,EAAMK,MAAOA,IACtD,EAAPE,GAA4B,iBAATF,EAAmB,IAAI,IAAIM,KAAON,EAAOrB,EAAoBU,EAAEe,EAAIE,EAAK,SAASA,GAAO,OAAON,EAAMM,IAAQC,KAAK,KAAMD,IAC9I,OAAOF,GAIRzB,EAAoB6B,EAAI,SAAS1B,GAChC,IAAIS,EAAST,GAAUA,EAAOqB,WAC7B,WAAwB,OAAOrB,EAAgB,SAC/C,WAA8B,OAAOA,GAEtC,OADAH,EAAoBU,EAAEE,EAAQ,IAAKA,GAC5BA,GAIRZ,EAAoBa,EAAI,SAASiB,EAAQC,GAAY,OAAOjB,OAAOkB,UAAUC,eAAe1B,KAAKuB,EAAQC,IAGzG/B,EAAoBkC,EAAI,GAIjBlC,EAAoBA,EAAoBmC,EAAI,G,gFClFrD,WACA,OAEA,OAEA,SAASC,EAAoBC,GACzB,MAAK,SAAUA,GAAU,WAAYA,EAMzC,SAASC,EAAcC,EAAkBC,EAAkBC,GACvD,OAAQA,EAASC,MACb,IAAK,OACD,IAAM,EAA4B,KAApBD,EAASE,OACjBJ,EAAEC,GAASI,OACXL,EAAEE,EAASE,OAAQH,GAASI,OAClC,OAAO,GAAQ,EAAKC,OAExB,IAAK,OAKD,OAJMC,EAA0B,KAApBL,EAASE,OACfH,EACAD,EAAEE,EAASE,OAAQH,IACTO,KAAKN,EAASM,MAGlC,IAAK,QAGD,OAFMC,EAAMT,EAAEE,EAASE,OAAQH,IACbS,OAGtB,IAAK,OAGD,IAFA,IAAMC,EAAgB,GAChBF,EAAMT,EAAEE,EAASE,OAAQH,GACtBpC,EAAI,EAAGA,EAAI4C,EAAIC,OAAQ7C,IAAK,CACjC,IAAM0C,EAAKE,EAAIG,GAAG/C,GACZgD,EAAYhB,EAAoBK,EAASY,OACzCf,EAAcC,EAAGO,EAAIL,EAASY,OAC9BC,EAAWf,EAAGO,EAAIL,EAASY,MAAO,IACxCH,EAAOK,KAAKH,GAEhB,OAAOF,EAEX,IAAK,OACD,GAAwB,KAApBT,EAASE,OAET,OADaJ,EAAEC,GAASgB,OAGxB,IACM,GADAV,EAAKP,EAAEE,EAASE,OAAQH,IACdgB,OAChB,MAAwB,iBAAT,EACT,EAAKX,OACL,EAGd,QACI,MAAM,IAAIY,MAAM,uBAAuBC,KAAKC,UAAUlB,GAAS,MAK3E,SAASa,EAA4Bf,EAAkBC,EAAkBa,EAAUO,GASlF,OARG9C,OAAO+C,KAAKR,GAAOS,SAAQ,SAAAC,GACvB,IAAMC,EAAMX,EAAMU,GACpB3B,EAAoB4B,GACvBJ,EAAIG,GAAQzB,EAAcC,EAAGC,EAASwB,GAEtCJ,EAAIG,GAAQT,EAAWf,EAAGC,EAASwB,EAAK,OAGnCJ,EAKR,iBACIJ,EACAH,GAEA,IAAMd,EAAI,EAAA0B,KAAKT,GACTU,EAAO3B,EAAE2B,OACf,OAAI9B,EAAoBiB,GACbf,EAAcC,EAAG2B,EAAMb,GAEvBC,EAAWf,EAAG2B,EAAMb,EAAgB,KAItC,EAAAd,EAAI,CACbQ,KAAI,OACJH,KAAI,OACJuB,MAAK,QACLC,KAAI,OACJZ,KAAI,S,cC9FRrD,EAAOD,QAAUmE,S,8ECkCjB,gBAAqB5B,EAAkB6B,GACnC,MAAO,CACH5B,KAAM,OACNC,OAAQF,EACRM,KAAMuB,IAId,gBAAqB7B,GACjB,MAAO,CACHC,KAAM,OACNC,OAAQF,IAIhB,iBAAsBA,GAClB,MAAO,CACHC,KAAM,QACNC,OAAQF,IAIhB,gBAAqBA,GACjB,MAAO,CACHC,KAAM,OACNC,OAAQF,K,8ECxChB,gBAAiEA,EAAkBY,GAC/E,MAAO,CACHX,KAAM,OACNC,OAAQF,EACRY,MAAK","file":"scrapq.min.js","sourcesContent":[" \t// The module cache\n \tvar installedModules = {};\n\n \t// The require function\n \tfunction __webpack_require__(moduleId) {\n\n \t\t// Check if module is in cache\n \t\tif(installedModules[moduleId]) {\n \t\t\treturn installedModules[moduleId].exports;\n \t\t}\n \t\t// Create a new module (and put it into the cache)\n \t\tvar module = installedModules[moduleId] = {\n \t\t\ti: moduleId,\n \t\t\tl: false,\n \t\t\texports: {}\n \t\t};\n\n \t\t// Execute the module function\n \t\tmodules[moduleId].call(module.exports, module, module.exports, __webpack_require__);\n\n \t\t// Flag the module as loaded\n \t\tmodule.l = true;\n\n \t\t// Return the exports of the module\n \t\treturn module.exports;\n \t}\n\n\n \t// expose the modules object (__webpack_modules__)\n \t__webpack_require__.m = modules;\n\n \t// expose the module cache\n \t__webpack_require__.c = installedModules;\n\n \t// define getter function for harmony exports\n \t__webpack_require__.d = function(exports, name, getter) {\n \t\tif(!__webpack_require__.o(exports, name)) {\n \t\t\tObject.defineProperty(exports, name, { enumerable: true, get: getter });\n \t\t}\n \t};\n\n \t// define __esModule on exports\n \t__webpack_require__.r = function(exports) {\n \t\tif(typeof Symbol !== 'undefined' && Symbol.toStringTag) {\n \t\t\tObject.defineProperty(exports, Symbol.toStringTag, { value: 'Module' });\n \t\t}\n \t\tObject.defineProperty(exports, '__esModule', { value: true });\n \t};\n\n \t// create a fake namespace object\n \t// mode & 1: value is a module id, require it\n \t// mode & 2: merge all properties of value into the ns\n \t// mode & 4: return value when already ns object\n \t// mode & 8|1: behave like require\n \t__webpack_require__.t = function(value, mode) {\n \t\tif(mode & 1) value = __webpack_require__(value);\n \t\tif(mode & 8) return value;\n \t\tif((mode & 4) && typeof value === 'object' && value && value.__esModule) return value;\n \t\tvar ns = Object.create(null);\n \t\t__webpack_require__.r(ns);\n \t\tObject.defineProperty(ns, 'default', { enumerable: true, value: value });\n \t\tif(mode & 2 && typeof value != 'string') for(var key in value) __webpack_require__.d(ns, key, function(key) { return value[key]; }.bind(null, key));\n \t\treturn ns;\n \t};\n\n \t// getDefaultExport function for compatibility with non-harmony modules\n \t__webpack_require__.n = function(module) {\n \t\tvar getter = module && module.__esModule ?\n \t\t\tfunction getDefault() { return module['default']; } :\n \t\t\tfunction getModuleExports() { return module; };\n \t\t__webpack_require__.d(getter, 'a', getter);\n \t\treturn getter;\n \t};\n\n \t// Object.prototype.hasOwnProperty.call\n \t__webpack_require__.o = function(object, property) { return Object.prototype.hasOwnProperty.call(object, property); };\n\n \t// __webpack_public_path__\n \t__webpack_require__.p = \"\";\n\n\n \t// Load entry module and return exports\n \treturn __webpack_require__(__webpack_require__.s = 0);\n","import { load } from \"cheerio\";\nimport { AnySelector, text, count, attr, html } from \"./selectors\";\nimport { Query, GetResult } from \"./helpers\";\nimport { AnyControl, list } from \"./controls\";\n\nfunction isSelectorOrControl(test: any): test is (AnySelector | AnyControl) {\n    if ((\"type\" in test) && (\"select\" in test)) {\n        return true;\n    }\n    return false;\n}\n\nfunction scrapSelector($: CheerioStatic, context: Cheerio, selector: AnySelector | AnyControl) {\n    switch (selector.type) {\n        case \"text\": {\n            const text = (selector.select === \"\")\n                ? $(context).text()\n                : $(selector.select, context).text();\n            return text || text.trim();\n        }\n        case \"attr\": {\n            const el = (selector.select === \"\")\n                ? context\n                : $(selector.select, context);\n            const attr = el.attr(selector.attr);\n            return attr;\n        }\n        case \"count\": {\n            const els = $(selector.select, context);\n            const count = els.length;\n            return count;\n        }\n        case \"list\": {\n            const result: any[] = [];\n            const els = $(selector.select, context);\n            for (let i = 0; i < els.length; i++) {\n                const el = els.eq(i);\n                const scrapedEl = isSelectorOrControl(selector.query)\n                    ? scrapSelector($, el, selector.query)\n                    : scrapQuery($, el, selector.query, {});\n                result.push(scrapedEl);\n            }\n            return result;\n        }\n        case \"html\": {\n            if (selector.select === \"\") {\n                const html = $(context).html();\n                return html;\n            } else {\n                const el = $(selector.select, context);\n                const html = el.html();\n                return (typeof html === \"string\")\n                    ? html.trim()\n                    : html;\n            }\n        }\n        default: {\n            throw new Error(`Undefined selector \"${JSON.stringify(selector)}\"`);\n        }\n    }\n}\n\nfunction scrapQuery<Q extends Query>($: CheerioStatic, context: Cheerio, query: Q, ref: any): GetResult<Q> {\n    Object.keys(query).forEach(prop => {\n        const val = query[prop];\n\t\tif (isSelectorOrControl(val)) {\n\t\t\tref[prop] = scrapSelector($, context, val);\n\t\t} else {\n\t\t\tref[prop] = scrapQuery($, context, val, {});\n\t\t}\n\t});\n\treturn ref;\n}\n\n\n\nexport function scrap<Q extends Query | AnyControl | AnySelector>(\n    html: string,\n    query: Q\n): GetResult<Q> {\n    const $ = load(html);\n    const root = $.root();\n    if (isSelectorOrControl(query)) {\n        return scrapSelector($, root, query) as any;\n    } else {\n        return scrapQuery($, root, query as Query, {}) as any;\n    }\n}\n\nexport const $ = {\n    attr,\n    text,\n    count,\n    list,\n    html\n};\n","module.exports = cheerio;","interface CountType {\n    type: \"count\";\n    select: string;\n}\n\ninterface TextType {\n    type: \"text\";\n    select: string;\n}\n\ninterface AttrType {\n    type: \"attr\";\n    select: string;\n    attr: string;\n}\n\ninterface HtmlType {\n    type: \"html\";\n    select: string;\n}\n\n// EXPORTS\n\nexport interface SelectorTypes {\n    text: string;\n    attr: string;\n    count: number;\n    html: string;\n}\n\nexport type AnySelector = TextType | AttrType | CountType | HtmlType;\n\n// DSL\n\nexport function attr(selector: string, attribute: string): AttrType {\n    return {\n        type: \"attr\",\n        select: selector,\n        attr: attribute\n    }\n}\n\nexport function text(selector: string): TextType {\n    return {\n        type: \"text\",\n        select: selector\n    };\n}\n\nexport function count(selector: string): CountType {\n    return {\n        type: \"count\",\n        select: selector\n    };\n}\n\nexport function html(selector: string): HtmlType {\n    return {\n        type: \"html\",\n        select: selector\n    }\n}\n","import { AnySelector } from \"./selectors\";\nimport { Query } from \"./helpers\";\n\nexport interface ControlTypes<Q> {\n    list: Array<Q>;\n}\n\n// EXPORTS\n\nexport interface ListType<Q extends AnySelector | AnyControl | Query> {\n    type: \"list\";\n    select: string;\n    query: Q;\n}\n\nexport type AnyControl = ListType<any>;\n\n// DSL\n\nexport function list<Q extends Query | AnyControl | AnySelector>(selector: string, query: Q): ListType<Q> {\n    return {\n        type: \"list\",\n        select: selector,\n        query\n    };\n}\n"],"sourceRoot":""}
var scrapq=function(t){var e={};function r(n){if(e[n])return e[n].exports;var u=e[n]={i:n,l:!1,exports:{}};return t[n].call(u.exports,u,u.exports,r),u.l=!0,u.exports}return r.m=t,r.c=e,r.d=function(t,e,n){r.o(t,e)||Object.defineProperty(t,e,{enumerable:!0,get:n})},r.r=function(t){"undefined"!=typeof Symbol&&Symbol.toStringTag&&Object.defineProperty(t,Symbol.toStringTag,{value:"Module"}),Object.defineProperty(t,"__esModule",{value:!0})},r.t=function(t,e){if(1&e&&(t=r(t)),8&e)return t;if(4&e&&"object"==typeof t&&t&&t.__esModule)return t;var n=Object.create(null);if(r.r(n),Object.defineProperty(n,"default",{enumerable:!0,value:t}),2&e&&"string"!=typeof t)for(var u in t)r.d(n,u,function(e){return t[e]}.bind(null,u));return n},r.n=function(t){var e=t&&t.__esModule?function(){return t.default}:function(){return t};return r.d(e,"a",e),e},r.o=function(t,e){return Object.prototype.hasOwnProperty.call(t,e)},r.p="",r(r.s=0)}([function(t,e,r){"use strict";Object.defineProperty(e,"__esModule",{value:!0});var n=r(1),u=r(2),c=r(3);function o(t){return"type"in t&&"select"in t}function i(t,e,r){switch(r.type){case"text":var n=""===r.select?t(e).text():t(r.select,e).text();return n&&n.trim();case"attr":return(f=""===r.select?e:t(r.select,e)).attr(r.attr);case"count":return(c=t(r.select,e)).length;case"exists":return!!(c=t(r.select,e)).length;case"list":for(var u=[],c=t(r.select,e),l=0;l<c.length;l++){var f=c.eq(l),a=o(r.query)?i(t,f,r.query):s(t,f,r.query,{});u.push(a)}return u;case"html":if(""===r.select)return t(e).html();var p=(f=t(r.select,e)).html();return"string"==typeof p?p.trim():p;default:throw new Error('Undefined selector "'+JSON.stringify(r)+'"')}}function s(t,e,r,n){return Object.keys(r).forEach((function(u){var c=r[u];o(c)?n[u]=i(t,e,c):n[u]=s(t,e,c,{})})),n}e.scrap=function(t,e){var r=n.load(t),u=r.root();return o(e)?i(r,u,e):s(r,u,e,{})},e.$={attr:u.attr,text:u.text,count:u.count,list:c.list,html:u.html,exists:u.exists}},function(t,e){t.exports=cheerio},function(t,e,r){"use strict";Object.defineProperty(e,"__esModule",{value:!0}),e.attr=function(t,e){return{type:"attr",select:t,attr:e}},e.text=function(t){return{type:"text",select:t}},e.count=function(t){return{type:"count",select:t}},e.html=function(t){return{type:"html",select:t}},e.exists=function(t){return{type:"exists",select:t}}},function(t,e,r){"use strict";Object.defineProperty(e,"__esModule",{value:!0}),e.list=function(t,e){return{type:"list",select:t,query:e}}}]);
//# sourceMappingURL=data:application/json;charset=utf-8;base64,{"version":3,"sources":["webpack://scrapq/webpack/bootstrap","webpack://scrapq/./lib/index.ts","webpack://scrapq/external \"cheerio\"","webpack://scrapq/./lib/selectors.ts","webpack://scrapq/./lib/controls.ts"],"names":["installedModules","__webpack_require__","moduleId","exports","module","i","l","modules","call","m","c","d","name","getter","o","Object","defineProperty","enumerable","get","r","Symbol","toStringTag","value","t","mode","__esModule","ns","create","key","bind","n","object","property","prototype","hasOwnProperty","p","s","isSelectorOrControl","test","scrapSelector","$","context","selector","type","select","text","trim","el","attr","els","length","result","eq","scrapedEl","query","scrapQuery","push","html","Error","JSON","stringify","ref","keys","forEach","prop","val","load","root","count","list","exists","cheerio","attribute"],"mappings":"uBACE,IAAIA,EAAmB,GAGvB,SAASC,EAAoBC,GAG5B,GAAGF,EAAiBE,GACnB,OAAOF,EAAiBE,GAAUC,QAGnC,IAAIC,EAASJ,EAAiBE,GAAY,CACzCG,EAAGH,EACHI,GAAG,EACHH,QAAS,IAUV,OANAI,EAAQL,GAAUM,KAAKJ,EAAOD,QAASC,EAAQA,EAAOD,QAASF,GAG/DG,EAAOE,GAAI,EAGJF,EAAOD,QA0Df,OArDAF,EAAoBQ,EAAIF,EAGxBN,EAAoBS,EAAIV,EAGxBC,EAAoBU,EAAI,SAASR,EAASS,EAAMC,GAC3CZ,EAAoBa,EAAEX,EAASS,IAClCG,OAAOC,eAAeb,EAASS,EAAM,CAAEK,YAAY,EAAMC,IAAKL,KAKhEZ,EAAoBkB,EAAI,SAAShB,GACX,oBAAXiB,QAA0BA,OAAOC,aAC1CN,OAAOC,eAAeb,EAASiB,OAAOC,YAAa,CAAEC,MAAO,WAE7DP,OAAOC,eAAeb,EAAS,aAAc,CAAEmB,OAAO,KAQvDrB,EAAoBsB,EAAI,SAASD,EAAOE,GAEvC,GADU,EAAPA,IAAUF,EAAQrB,EAAoBqB,IAC/B,EAAPE,EAAU,OAAOF,EACpB,GAAW,EAAPE,GAA8B,iBAAVF,GAAsBA,GAASA,EAAMG,WAAY,OAAOH,EAChF,IAAII,EAAKX,OAAOY,OAAO,MAGvB,GAFA1B,EAAoBkB,EAAEO,GACtBX,OAAOC,eAAeU,EAAI,UAAW,CAAET,YAAY,EAAMK,MAAOA,IACtD,EAAPE,GAA4B,iBAATF,EAAmB,IAAI,IAAIM,KAAON,EAAOrB,EAAoBU,EAAEe,EAAIE,EAAK,SAASA,GAAO,OAAON,EAAMM,IAAQC,KAAK,KAAMD,IAC9I,OAAOF,GAIRzB,EAAoB6B,EAAI,SAAS1B,GAChC,IAAIS,EAAST,GAAUA,EAAOqB,WAC7B,WAAwB,OAAOrB,EAAgB,SAC/C,WAA8B,OAAOA,GAEtC,OADAH,EAAoBU,EAAEE,EAAQ,IAAKA,GAC5BA,GAIRZ,EAAoBa,EAAI,SAASiB,EAAQC,GAAY,OAAOjB,OAAOkB,UAAUC,eAAe1B,KAAKuB,EAAQC,IAGzG/B,EAAoBkC,EAAI,GAIjBlC,EAAoBA,EAAoBmC,EAAI,G,gFClFrD,WACA,OAEA,OAEA,SAASC,EAAoBC,GACzB,MAAK,SAAUA,GAAU,WAAYA,EAMzC,SAASC,EAAcC,EAAkBC,EAAkBC,GACvD,OAAQA,EAASC,MACb,IAAK,OACD,IAAM,EAA4B,KAApBD,EAASE,OACjBJ,EAAEC,GAASI,OACXL,EAAEE,EAASE,OAAQH,GAASI,OAClC,OAAO,GAAQ,EAAKC,OAExB,IAAK,OAKD,OAJMC,EAA0B,KAApBL,EAASE,OACfH,EACAD,EAAEE,EAASE,OAAQH,IACTO,KAAKN,EAASM,MAGlC,IAAK,QAGD,OAFMC,EAAMT,EAAEE,EAASE,OAAQH,IACbS,OAGtB,IAAK,SAGD,SAFMD,EAAMT,EAAEE,EAASE,OAAQH,IACZS,OAGvB,IAAK,OAGD,IAFA,IAAMC,EAAgB,GAChBF,EAAMT,EAAEE,EAASE,OAAQH,GACtBpC,EAAI,EAAGA,EAAI4C,EAAIC,OAAQ7C,IAAK,CACjC,IAAM0C,EAAKE,EAAIG,GAAG/C,GACZgD,EAAYhB,EAAoBK,EAASY,OACzCf,EAAcC,EAAGO,EAAIL,EAASY,OAC9BC,EAAWf,EAAGO,EAAIL,EAASY,MAAO,IACxCH,EAAOK,KAAKH,GAEhB,OAAOF,EAEX,IAAK,OACD,GAAwB,KAApBT,EAASE,OAET,OADaJ,EAAEC,GAASgB,OAGxB,IACM,GADAV,EAAKP,EAAEE,EAASE,OAAQH,IACdgB,OAChB,MAAwB,iBAAT,EACT,EAAKX,OACL,EAGd,QACI,MAAM,IAAIY,MAAM,uBAAuBC,KAAKC,UAAUlB,GAAS,MAK3E,SAASa,EAA4Bf,EAAkBC,EAAkBa,EAAUO,GASlF,OARG9C,OAAO+C,KAAKR,GAAOS,SAAQ,SAAAC,GACvB,IAAMC,EAAMX,EAAMU,GACpB3B,EAAoB4B,GACvBJ,EAAIG,GAAQzB,EAAcC,EAAGC,EAASwB,GAEtCJ,EAAIG,GAAQT,EAAWf,EAAGC,EAASwB,EAAK,OAGnCJ,EAGR,iBACIJ,EACAH,GAEA,IAAMd,EAAI,EAAA0B,KAAKT,GACTU,EAAO3B,EAAE2B,OACf,OAAI9B,EAAoBiB,GACbf,EAAcC,EAAG2B,EAAMb,GAEvBC,EAAWf,EAAG2B,EAAMb,EAAgB,KAItC,EAAAd,EAAI,CACbQ,KAAI,OACJH,KAAI,OACJuB,MAAK,QACLC,KAAI,OACJZ,KAAI,OACJa,OAAM,W,cClGVlE,EAAOD,QAAUoE,S,8ECgCjB,gBAAqB7B,EAAkB8B,GACnC,MAAO,CACH7B,KAAM,OACNC,OAAQF,EACRM,KAAMwB,IAId,gBAAqB9B,GACjB,MAAO,CACHC,KAAM,OACNC,OAAQF,IAIhB,iBAAsBA,GAClB,MAAO,CACHC,KAAM,QACNC,OAAQF,IAIhB,gBAAqBA,GACjB,MAAO,CACHC,KAAM,OACNC,OAAQF,IAIhB,kBAAuBA,GACnB,MAAO,CACHC,KAAM,SACNC,OAAQF,K,8EC7ChB,gBAAiEA,EAAkBY,GAC/E,MAAO,CACHX,KAAM,OACNC,OAAQF,EACRY,MAAK","file":"scrapq.min.js","sourcesContent":[" \t// The module cache\n \tvar installedModules = {};\n\n \t// The require function\n \tfunction __webpack_require__(moduleId) {\n\n \t\t// Check if module is in cache\n \t\tif(installedModules[moduleId]) {\n \t\t\treturn installedModules[moduleId].exports;\n \t\t}\n \t\t// Create a new module (and put it into the cache)\n \t\tvar module = installedModules[moduleId] = {\n \t\t\ti: moduleId,\n \t\t\tl: false,\n \t\t\texports: {}\n \t\t};\n\n \t\t// Execute the module function\n \t\tmodules[moduleId].call(module.exports, module, module.exports, __webpack_require__);\n\n \t\t// Flag the module as loaded\n \t\tmodule.l = true;\n\n \t\t// Return the exports of the module\n \t\treturn module.exports;\n \t}\n\n\n \t// expose the modules object (__webpack_modules__)\n \t__webpack_require__.m = modules;\n\n \t// expose the module cache\n \t__webpack_require__.c = installedModules;\n\n \t// define getter function for harmony exports\n \t__webpack_require__.d = function(exports, name, getter) {\n \t\tif(!__webpack_require__.o(exports, name)) {\n \t\t\tObject.defineProperty(exports, name, { enumerable: true, get: getter });\n \t\t}\n \t};\n\n \t// define __esModule on exports\n \t__webpack_require__.r = function(exports) {\n \t\tif(typeof Symbol !== 'undefined' && Symbol.toStringTag) {\n \t\t\tObject.defineProperty(exports, Symbol.toStringTag, { value: 'Module' });\n \t\t}\n \t\tObject.defineProperty(exports, '__esModule', { value: true });\n \t};\n\n \t// create a fake namespace object\n \t// mode & 1: value is a module id, require it\n \t// mode & 2: merge all properties of value into the ns\n \t// mode & 4: return value when already ns object\n \t// mode & 8|1: behave like require\n \t__webpack_require__.t = function(value, mode) {\n \t\tif(mode & 1) value = __webpack_require__(value);\n \t\tif(mode & 8) return value;\n \t\tif((mode & 4) && typeof value === 'object' && value && value.__esModule) return value;\n \t\tvar ns = Object.create(null);\n \t\t__webpack_require__.r(ns);\n \t\tObject.defineProperty(ns, 'default', { enumerable: true, value: value });\n \t\tif(mode & 2 && typeof value != 'string') for(var key in value) __webpack_require__.d(ns, key, function(key) { return value[key]; }.bind(null, key));\n \t\treturn ns;\n \t};\n\n \t// getDefaultExport function for compatibility with non-harmony modules\n \t__webpack_require__.n = function(module) {\n \t\tvar getter = module && module.__esModule ?\n \t\t\tfunction getDefault() { return module['default']; } :\n \t\t\tfunction getModuleExports() { return module; };\n \t\t__webpack_require__.d(getter, 'a', getter);\n \t\treturn getter;\n \t};\n\n \t// Object.prototype.hasOwnProperty.call\n \t__webpack_require__.o = function(object, property) { return Object.prototype.hasOwnProperty.call(object, property); };\n\n \t// __webpack_public_path__\n \t__webpack_require__.p = \"\";\n\n\n \t// Load entry module and return exports\n \treturn __webpack_require__(__webpack_require__.s = 0);\n","import { load } from \"cheerio\";\nimport { AnySelector, text, count, attr, html, exists } from \"./selectors\";\nimport { Query, TypeOfQuery } from \"./helpers\";\nimport { AnyControl, list } from \"./controls\";\n\nfunction isSelectorOrControl(test: any): test is (AnySelector | AnyControl) {\n    if ((\"type\" in test) && (\"select\" in test)) {\n        return true;\n    }\n    return false;\n}\n\nfunction scrapSelector($: CheerioStatic, context: Cheerio, selector: AnySelector | AnyControl) {\n    switch (selector.type) {\n        case \"text\": {\n            const text = (selector.select === \"\")\n                ? $(context).text()\n                : $(selector.select, context).text();\n            return text && text.trim();\n        }\n        case \"attr\": {\n            const el = (selector.select === \"\")\n                ? context\n                : $(selector.select, context);\n            const attr = el.attr(selector.attr);\n            return attr;\n        }\n        case \"count\": {\n            const els = $(selector.select, context);\n            const count = els.length;\n            return count;\n        }\n        case \"exists\": {\n            const els = $(selector.select, context);\n            const exists = els.length ? true : false;\n            return exists;\n        }\n        case \"list\": {\n            const result: any[] = [];\n            const els = $(selector.select, context);\n            for (let i = 0; i < els.length; i++) {\n                const el = els.eq(i);\n                const scrapedEl = isSelectorOrControl(selector.query)\n                    ? scrapSelector($, el, selector.query)\n                    : scrapQuery($, el, selector.query, {});\n                result.push(scrapedEl);\n            }\n            return result;\n        }\n        case \"html\": {\n            if (selector.select === \"\") {\n                const html = $(context).html();\n                return html;\n            } else {\n                const el = $(selector.select, context);\n                const html = el.html();\n                return (typeof html === \"string\")\n                    ? html.trim()\n                    : html;\n            }\n        }\n        default: {\n            throw new Error(`Undefined selector \"${JSON.stringify(selector)}\"`);\n        }\n    }\n}\n\nfunction scrapQuery<Q extends Query>($: CheerioStatic, context: Cheerio, query: Q, ref: any): TypeOfQuery<Q> {\n    Object.keys(query).forEach(prop => {\n        const val = query[prop];\n\t\tif (isSelectorOrControl(val)) {\n\t\t\tref[prop] = scrapSelector($, context, val);\n\t\t} else {\n\t\t\tref[prop] = scrapQuery($, context, val, {});\n\t\t}\n\t});\n\treturn ref;\n}\n\nexport function scrap<Q extends Query | AnyControl | AnySelector>(\n    html: string,\n    query: Q\n): TypeOfQuery<Q> {\n    const $ = load(html);\n    const root = $.root();\n    if (isSelectorOrControl(query)) {\n        return scrapSelector($, root, query) as any;\n    } else {\n        return scrapQuery($, root, query as Query, {}) as any;\n    }\n}\n\nexport const $ = {\n    attr,\n    text,\n    count,\n    list,\n    html,\n    exists,\n};\n","module.exports = cheerio;","interface CountType {\n    type: \"count\";\n    select: string;\n}\n\ninterface TextType {\n    type: \"text\";\n    select: string;\n}\n\ninterface AttrType {\n    type: \"attr\";\n    select: string;\n    attr: string;\n}\n\ninterface HtmlType {\n    type: \"html\";\n    select: string;\n}\n\ninterface ExistsType {\n    type: \"exists\",\n    select: string;\n}\n\n// EXPORTS\n\nexport type AnySelector = TextType | AttrType | CountType | HtmlType | ExistsType;\n\n// DSL\n\nexport function attr(selector: string, attribute: string): AttrType {\n    return {\n        type: \"attr\",\n        select: selector,\n        attr: attribute\n    }\n}\n\nexport function text(selector: string): TextType {\n    return {\n        type: \"text\",\n        select: selector\n    };\n}\n\nexport function count(selector: string): CountType {\n    return {\n        type: \"count\",\n        select: selector\n    };\n}\n\nexport function html(selector: string): HtmlType {\n    return {\n        type: \"html\",\n        select: selector\n    };\n}\n\nexport function exists(selector: string): ExistsType {\n    return {\n        type: \"exists\",\n        select: selector\n    };\n}\n","import { AnySelector } from \"./selectors\";\nimport { Query } from \"./helpers\";\n\nexport interface ControlTypes<Q> {\n    list: Array<Q>;\n}\n\n// EXPORTS\n\nexport interface ListType<Q extends AnySelector | AnyControl | Query> {\n    type: \"list\";\n    select: string;\n    query: Q;\n}\n\nexport type AnyControl = ListType<any>;\n\n// DSL\n\nexport function list<Q extends Query | AnyControl | AnySelector>(selector: string, query: Q): ListType<Q> {\n    return {\n        type: \"list\",\n        select: selector,\n        query\n    };\n}\n"],"sourceRoot":""}

@@ -1,2 +0,2 @@

import { AnySelector, SelectorTypes } from "./selectors";
import { AnySelector } from "./selectors";
import { ListType, AnyControl } from "./controls";

@@ -6,8 +6,15 @@ export interface Query {

}
export declare type GetResult<Q extends AnySelector | ListType<any> | Query> = {
0: Q extends AnySelector ? SelectorTypes[Q["type"]] : never;
1: Q extends ListType<infer T> ? GetResult<T>[] : never;
export interface SelectorResultType {
text: string;
attr: string;
count: number;
html: string;
exists: boolean;
}
export declare type TypeOfQuery<Q extends AnySelector | ListType<any> | Query> = {
0: Q extends AnySelector ? SelectorResultType[Q["type"]] : never;
1: Q extends ListType<infer T> ? TypeOfQuery<T>[] : never;
2: Q extends Query ? {
[prop in keyof Q]: GetResult<Q[prop]>;
[prop in keyof Q]: TypeOfQuery<Q[prop]>;
} : never;
}[Q extends AnySelector ? 0 : Q extends ListType<any> ? 1 : Q extends Query ? 2 : boolean];

@@ -1,5 +0,5 @@

import { AnySelector, text, count, attr, html } from "./selectors";
import { Query, GetResult } from "./helpers";
import { AnySelector, text, count, attr, html, exists } from "./selectors";
import { Query, TypeOfQuery } from "./helpers";
import { AnyControl, list } from "./controls";
export declare function scrap<Q extends Query | AnyControl | AnySelector>(html: string, query: Q): GetResult<Q>;
export declare function scrap<Q extends Query | AnyControl | AnySelector>(html: string, query: Q): TypeOfQuery<Q>;
export declare const $: {

@@ -11,2 +11,3 @@ attr: typeof attr;

html: typeof html;
exists: typeof exists;
};

@@ -18,3 +18,3 @@ "use strict";

: $(selector.select, context).text();
return text_1 || text_1.trim();
return text_1 && text_1.trim();
}

@@ -33,2 +33,7 @@ case "attr": {

}
case "exists": {
var els = $(selector.select, context);
var exists_1 = els.length ? true : false;
return exists_1;
}
case "list": {

@@ -92,4 +97,5 @@ var result = [];

list: controls_1.list,
html: selectors_1.html
html: selectors_1.html,
exists: selectors_1.exists,
};
//# sourceMappingURL=index.js.map
// Generated by dts-bundle v0.7.3
declare module 'scrapq' {
import { AnySelector, text, count, attr, html } from "scrapq/selectors";
import { Query, GetResult } from "scrapq/helpers";
import { AnySelector, text, count, attr, html, exists } from "scrapq/selectors";
import { Query, TypeOfQuery } from "scrapq/helpers";
import { AnyControl, list } from "scrapq/controls";
export function scrap<Q extends Query | AnyControl | AnySelector>(html: string, query: Q): GetResult<Q>;
export function scrap<Q extends Query | AnyControl | AnySelector>(html: string, query: Q): TypeOfQuery<Q>;
export const $: {

@@ -14,2 +14,3 @@ attr: typeof attr;

html: typeof html;
exists: typeof exists;
};

@@ -36,9 +37,7 @@ }

}
export interface SelectorTypes {
text: string;
attr: string;
count: number;
html: string;
interface ExistsType {
type: "exists";
select: string;
}
export type AnySelector = TextType | AttrType | CountType | HtmlType;
export type AnySelector = TextType | AttrType | CountType | HtmlType | ExistsType;
export function attr(selector: string, attribute: string): AttrType;

@@ -48,2 +47,3 @@ export function text(selector: string): TextType;

export function html(selector: string): HtmlType;
export function exists(selector: string): ExistsType;
export {};

@@ -53,3 +53,3 @@ }

declare module 'scrapq/helpers' {
import { AnySelector, SelectorTypes } from "scrapq/selectors";
import { AnySelector } from "scrapq/selectors";
import { ListType, AnyControl } from "scrapq/controls";

@@ -59,7 +59,14 @@ export interface Query {

}
export type GetResult<Q extends AnySelector | ListType<any> | Query> = {
0: Q extends AnySelector ? SelectorTypes[Q["type"]] : never;
1: Q extends ListType<infer T> ? GetResult<T>[] : never;
export interface SelectorResultType {
text: string;
attr: string;
count: number;
html: string;
exists: boolean;
}
export type TypeOfQuery<Q extends AnySelector | ListType<any> | Query> = {
0: Q extends AnySelector ? SelectorResultType[Q["type"]] : never;
1: Q extends ListType<infer T> ? TypeOfQuery<T>[] : never;
2: Q extends Query ? {
[prop in keyof Q]: GetResult<Q[prop]>;
[prop in keyof Q]: TypeOfQuery<Q[prop]>;
} : never;

@@ -66,0 +73,0 @@ }[Q extends AnySelector ? 0 : Q extends ListType<any> ? 1 : Q extends Query ? 2 : boolean];

@@ -18,9 +18,7 @@ interface CountType {

}
export interface SelectorTypes {
text: string;
attr: string;
count: number;
html: string;
interface ExistsType {
type: "exists";
select: string;
}
export declare type AnySelector = TextType | AttrType | CountType | HtmlType;
export declare type AnySelector = TextType | AttrType | CountType | HtmlType | ExistsType;
export declare function attr(selector: string, attribute: string): AttrType;

@@ -30,2 +28,3 @@ export declare function text(selector: string): TextType;

export declare function html(selector: string): HtmlType;
export declare function exists(selector: string): ExistsType;
export {};

@@ -33,2 +33,9 @@ "use strict";

exports.html = html;
function exists(selector) {
return {
type: "exists",
select: selector
};
}
exports.exists = exists;
//# sourceMappingURL=selectors.js.map

@@ -1,2 +0,2 @@

import { AnySelector, SelectorTypes } from "./selectors";
import { AnySelector } from "./selectors";
import { ListType, AnyControl } from "./controls";

@@ -8,7 +8,15 @@

export type GetResult<Q extends AnySelector | ListType<any> | Query> = {
0: Q extends AnySelector ? SelectorTypes[Q["type"]] : never;
1: Q extends ListType<infer T> ? GetResult<T>[] : never;
export interface SelectorResultType {
text: string;
attr: string;
count: number;
html: string;
exist: boolean;
}
export type TypeOfQuery<Q extends AnySelector | ListType<any> | Query> = {
0: Q extends AnySelector ? SelectorResultType[Q["type"]] : never;
1: Q extends ListType<infer T> ? TypeOfQuery<T>[] : never;
2: Q extends Query ? {
[prop in keyof Q]: GetResult<Q[prop]>
[prop in keyof Q]: TypeOfQuery<Q[prop]>
}: never;

@@ -15,0 +23,0 @@ }[Q extends AnySelector ? 0

import { load } from "cheerio";
import { AnySelector, text, count, attr, html } from "./selectors";
import { Query, GetResult } from "./helpers";
import { AnySelector, text, count, attr, html, exist } from "./selectors";
import { Query, TypeOfQuery } from "./helpers";
import { AnyControl, list } from "./controls";

@@ -19,3 +19,3 @@

: $(selector.select, context).text();
return text || text.trim();
return text && text.trim();
}

@@ -34,2 +34,7 @@ case "attr": {

}
case "exist": {
const els = $(selector.select, context);
const exist = els.length ? true : false;
return exist;
}
case "list": {

@@ -65,3 +70,3 @@ const result: any[] = [];

function scrapQuery<Q extends Query>($: CheerioStatic, context: Cheerio, query: Q, ref: any): GetResult<Q> {
function scrapQuery<Q extends Query>($: CheerioStatic, context: Cheerio, query: Q, ref: any): TypeOfQuery<Q> {
Object.keys(query).forEach(prop => {

@@ -78,8 +83,6 @@ const val = query[prop];

export function scrap<Q extends Query | AnyControl | AnySelector>(
html: string,
query: Q
): GetResult<Q> {
): TypeOfQuery<Q> {
const $ = load(html);

@@ -99,3 +102,4 @@ const root = $.root();

list,
html
html,
exist,
};

@@ -22,13 +22,11 @@ interface CountType {

interface ExistType {
type: "exist",
select: string;
}
// EXPORTS
export interface SelectorTypes {
text: string;
attr: string;
count: number;
html: string;
}
export type AnySelector = TextType | AttrType | CountType | HtmlType | ExistType;
export type AnySelector = TextType | AttrType | CountType | HtmlType;
// DSL

@@ -62,3 +60,10 @@

select: selector
}
};
}
export function exist(selector: string): ExistType {
return {
type: "exist",
select: selector
};
}
{
"name": "scrapq",
"version": "2.0.1",
"version": "2.1.0",
"description": "Lightweight Typescript library for scrapping html",

@@ -9,5 +9,3 @@ "main": "./dist/index.js",

"scripts": {
"test": "npm run test:basic && npm run test:exhaustive",
"test:basic": "jasmine-ts ./test/basic.test.ts",
"test:exhaustive": "jasmine-ts ./test/**/*.ts",
"test": "ts-node node_modules/tape/bin/tape test/**/*.ts",
"dist": "npm run test; npm run build; npm run build:web",

@@ -31,7 +29,6 @@ "build": "npm run build:node && npm run build:web && npm run build:dts",

"devDependencies": {
"@types/jasmine": "^2.8.16",
"@types/node": "^10.17.15",
"jasmine": "^3.5.0",
"jasmine-ts": "^0.2.1",
"ts-loader": "^5.4.5",
"@types/tape": "^4.2.34",
"tape": "^4.13.2",
"ts-loader": "^7.0.0",
"ts-node": "^8.8.2",
"typescript": "^3.7.5",

@@ -38,0 +35,0 @@ "webpack": "^4.41.6",

@@ -104,22 +104,26 @@ # ScrapQ

`Q.text(selector: string): string`
`$.text(selector: string): string`
get text from an element
`Q.attr(selector: string, htmlAttribute: string): string`
`$.attr(selector: string, htmlAttribute: string): string`
get attribute from an element
`Q.html(selector: string): string`
`$.html(selector: string): string`
get html
`Q.count(selector: string): number`
`$.count(selector: string): number`
get elements count
`$.exist(selector: string): boolean`
check if element exists
### Controls
`Q.List(selector: string, query: Query | QueryType, predicate?): Array<query>`
`$.list(selector: string, query: Query | QueryType, predicate?): Array<query>`
get list of items

@@ -0,1 +1,2 @@

import test from "tape";
import { scrap, $ } from '../lib';

@@ -13,19 +14,21 @@

describe('Basic', () => {
test('Basic', (main) => {
it('should scrap <h1/> text from string', () => {
test('should scrap <h1/> text from string', (t) => {
const result = scrap(STR_TO_SCRAP, {
title: $.text('h1.title')
});
expect(result).toEqual({ title: 'Hello'});
t.equal(result, { title: 'Hello'});
t.end();
});
it('should scrap attributes from <h1/>', () => {
test('should scrap attributes from <h1/>', (t) => {
const result = scrap(STR_TO_SCRAP, {
title: $.attr('h1.title', 'class')
});
expect(result).toEqual({ title: 'title'});
t.equal(result, { title: 'title'});
t.end();
});
it('should scrap items from <span/>', () => {
test('should scrap items from <span/>', (t) => {
const result = scrap(STR_TO_SCRAP, {

@@ -36,7 +39,8 @@ items: $.list('li', {

});
expect(result.items.length).toBe(3);
expect(result.items[2].text).toBe('Bonjour')
t.equal(result.items.length, 3);
t.equal(result.items[2].text, 'Bonjour');
t.end();
});
it('should scrap text from <li><span/>', () => {
test('should scrap text from <li><span/>', (t) => {
const result = scrap(STR_TO_SCRAP, {

@@ -47,7 +51,8 @@ items: $.list('li', {

});
expect(result.items.length).toBe(3);
expect(result.items[2].text).toBe('Bonjour')
t.equal(result.items.length, 3);
t.equal(result.items[2].text, 'Bonjour');
t.end();
});
it('should scrap text from <span/> by omitting <li/>', () => {
test('should scrap text from <span/> by omitting <li/>', (t) => {
const result = scrap(STR_TO_SCRAP, {

@@ -58,11 +63,12 @@ items: $.list('span', {

});
expect(result.items.length).toBe(3);
expect(result.items[2].text).toBe('Bonjour')
t.equal(result.items.length, 3);
t.equal(result.items[2].text, 'Bonjour');
t.end();
});
it('should get list of texts', () => {
test('should get list of texts', (t) => {
const result = scrap(STR_TO_SCRAP, {
texts: $.list('li', $.text('span'))
});
expect(result.texts).toEqual([
t.equals(result.texts, [
'Guten Tag',

@@ -72,5 +78,6 @@ 'Ciao',

]);
t.end();
});
it('should user deep query', () => {
test('should user deep query', (t) => {
const result = scrap(STR_TO_SCRAP, {

@@ -82,31 +89,36 @@ title: $.text('.title'),

});
expect(result.title).toBe('Hello');
expect(result.data.msg).toBe('Ciao');
t.equal(result.title, 'Hello');
t.equal(result.data.msg, 'Ciao');
t.end();
});
it('should count <span/> elements', () => {
test('should count <span/> elements', (t) => {
const result = scrap(STR_TO_SCRAP, {
spanCount: $.count('span')
});
expect(result.spanCount).toBe(3);
t.equal(result.spanCount, 3);
t.end();
});
it('should count not exists element', () => {
test('should count not exists element', (t) => {
const result = scrap(STR_TO_SCRAP, {
spanCount: $.count('table')
});
expect(result.spanCount).toBe(0);
t.equal(result.spanCount, 0);
t.end();
});
it('should use only selector to scrap title', () => {
test('should use only selector to scrap title', (t) => {
const title = scrap(STR_TO_SCRAP, $.text('.title'));
expect(title).toBe('Hello');
t.equal(title, 'Hello');
});
it('should use only selector to scrap <span/>', () => {
test('should use only selector to scrap <span/>', (t) => {
const spans = scrap(STR_TO_SCRAP, $.list('span', $.text('')));
expect(spans.length).toBe(3);
expect(spans[0]).toBe('Guten Tag');
t.equal(spans.length, 3);
t.equal(spans[0], 'Guten Tag');
t.end();
});
main.end();
});

@@ -0,12 +1,15 @@

import test from "tape";
import { scrap, $ } from "../../lib";
import { html } from "../data";
describe("select", () => {
it("should scrap items from <span/>", () => {
test("select", (main) => {
test("should scrap items from <span/>", (t) => {
const spans = scrap(html, $.list("span", $.text("")));
expect(spans.length).toBe(3);
expect(spans[0]).toBe("Guten Tag");
t.equal(spans.length, 3);
t.equal(spans[0], "Guten Tag");
t.end();
});
it("should scrap items from <span/> using query", () => {
test("should scrap items from <span/> using query", (t) => {
const result = scrap(html, {

@@ -17,5 +20,8 @@ items: $.list("li", {

});
expect(result.items.length).toBe(3);
expect(result.items[2].text).toBe("Bonjour");
t.equal(result.items.length, 3);
t.equal(result.items[2].text, "Bonjour");
t.end();
});
main.end();
});

@@ -0,1 +1,2 @@

import test from "tape";
import { readFileSync } from "fs";

@@ -6,4 +7,5 @@ import { scrap, $ } from "../../lib";

describe("agescx documentation", () => {
it("should get all navigation items from agescx", () => {
test("agescx documentation", (main) => {
test("should get all navigation items from agescx", (t) => {
const result = scrap(shtml, {

@@ -22,8 +24,11 @@ navs: $.list("ul.navbar-nav>li:not(.disabled)", {

expect(result.navs.length).toBe(9);
expect(result.navs[2].submenu.length).toBe(2);
expect(result.navs[2].submenu[0].text).toBe("Adding new unit");
expect(result.content.length).toBeGreaterThan(30);
expect(result.title).toBe("Agescx Documentation");
t.equal(result.navs.length, 9);
t.equal(result.navs[2].submenu.length, 2);
t.equal(result.navs[2].submenu[0].text, "Adding new unit");
t.equal(result.content.length, 1114);
t.equal(result.title, "Agescx Documentation");
t.end();
});
main.end();
});

@@ -0,21 +1,28 @@

import test from "tape";
import { scrap, $ } from "../../lib";
import { html } from "../data";
describe("attr", () => {
it("should scrap href attr from an <a/>", () => {
test("attr", (main) => {
test("should scrap href attr from an <a/>", (t) => {
const result = scrap(html, $.attr("a", "href"));
expect(result).toBe("/read-more");
t.equal(result, "/read-more");
t.end();
});
it("should scrap data-extra from <div/>", () => {
test("should scrap data-extra from <div/>", (t) => {
const result = scrap(html, $.attr(".footer", "data-extra"));
expect(result).toBe("footer");
t.equal(result, "footer");
t.end();
});
it("should scrap data using query", () => {
test("should scrap data using query", (t) => {
const result = scrap(html, {
footer: $.attr(".footer", "data-extra")
});
expect(result.footer).toBe("footer");
t.equal(result.footer, "footer");
t.end();
});
main.end();
});

@@ -0,26 +1,34 @@

import test from "tape";
import { scrap, $ } from "../../lib";
import { html } from "../data";
describe("count", () => {
it("should count <li/> elements", () => {
test("count", (main) => {
test("should count <li/> elements", (t) => {
const result = scrap(html, $.count("li"));
expect(result).toBe(3);
t.equal(result, 3);
t.end();
});
it("should count <h1/>", () => {
test("should count <h1/>", (t) => {
const result = scrap(html, $.count("h1"));
expect(result).toBe(1);
t.equal(result, 1);
t.end();
});
it("should count non-existing element", () => {
test("should count non-existing element", (t) => {
const result = scrap(html, $.count("h3"));
expect(result).toBe(0);
t.equal(result, 0);
t.end();
});
it("should count using query", () => {
test("should count using query", (t) => {
const result = scrap(html, {
liCounts: $.count("li")
});
expect(result.liCounts).toBe(3);
t.equal(result.liCounts, 3);
t.end();
});
main.end();
});

@@ -0,16 +1,22 @@

import test from "tape";
import { scrap, $ } from "../../lib";
import { html } from "../data";
describe("html", () => {
it("should get html from <ul/>", () => {
test("html", (main) => {
test("should get html from <ul/>", (t) => {
const result = scrap(html, $.html("ul>li:first-child"));
expect(result).toBe(`<span>Guten Tag</span>`);
t.equal(result, `<span>Guten Tag</span>`);
t.end();
});
it("should count using query", () => {
test("should count using query", (t) => {
const result = scrap(html, {
footer: $.html("ul>li:last-child")
});
expect(result.footer).toBe(`<span>Bonjour</span>`);
t.equal(result.footer, `<span>Bonjour</span>`);
t.end();
});
main.end();
});

@@ -0,21 +1,28 @@

import test from "tape";
import { scrap, $ } from "../../lib";
import { html } from "../data";
describe("text", () => {
it("should get text from .msg", () => {
test("text", (main) => {
test("should get text from .msg", (t) => {
const result = scrap(html, $.text(".msg"));
expect(result).toBe("Ciao");
t.equal(result, "Ciao");
t.end();
});
it("should not get text from non existing element", () => {
test("should not get text from non existing element", (t) => {
const result = scrap(html, $.text("h3"));
expect(result).toBe("");
t.equal(result, "");
t.end();
});
it("should count using query", () => {
test("should count using query", (t) => {
const result = scrap(html, {
link: $.text("a")
});
expect(result.link).toBe("read more ...");
t.equal(result.link, "read more ...");
t.end();
});
main.end();
});
# TODO
- [ ] add strict mode for parsing
- [x] add if control
- [ ] add if control
- [ ] better context passing (if)

@@ -9,2 +9,1 @@ - [ ] fix test for non existing elements

- [x] test nested lists
- [x] callback function to convert selector output

Sorry, the diff of this file is not supported yet

Sorry, the diff of this file is not supported yet

SocketSocket SOC 2 Logo

Product

  • Package Alerts
  • Integrations
  • Docs
  • Pricing
  • FAQ
  • Roadmap
  • Changelog

Packages

npm

Stay in touch

Get open source security insights delivered straight into your inbox.


  • Terms
  • Privacy
  • Security

Made with ⚡️ by Socket Inc