@jocmp/mercury-parser 2.2.3-dev → 2.2.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +13 -10
- package/dist/generate-custom-parser.js +122 -61
- package/dist/generate-custom-parser.js.map +1 -1
- package/dist/mercury.js +148 -50
- package/dist/mercury.js.map +1 -1
- package/dist/mercury.web.js +1 -1
- package/dist/mercury.web.js.map +1 -1
- package/node_modules/browser-request/.gitignore +3 -0
- package/node_modules/browser-request/.npmignore +3 -0
- package/node_modules/browser-request/AUTHORS +3 -0
- package/node_modules/browser-request/LICENSE +202 -0
- package/node_modules/browser-request/README.md +107 -0
- package/node_modules/browser-request/index.js +476 -0
- package/node_modules/browser-request/package.json +48 -0
- package/node_modules/browser-request/test.js +20 -0
- package/node_modules/http-headers/.travis.yml +10 -0
- package/node_modules/http-headers/LICENSE +21 -0
- package/node_modules/http-headers/README.md +205 -0
- package/node_modules/http-headers/index.js +137 -0
- package/node_modules/http-headers/package.json +41 -0
- package/node_modules/http-headers/test.js +163 -0
- package/node_modules/jquery/AUTHORS.txt +331 -0
- package/node_modules/jquery/LICENSE.txt +20 -0
- package/node_modules/jquery/README.md +62 -0
- package/node_modules/jquery/bower.json +14 -0
- package/node_modules/jquery/dist/jquery.js +10881 -0
- package/node_modules/jquery/dist/jquery.min.js +2 -0
- package/node_modules/jquery/dist/jquery.min.map +1 -0
- package/node_modules/jquery/dist/jquery.slim.js +8782 -0
- package/node_modules/jquery/dist/jquery.slim.min.js +2 -0
- package/node_modules/jquery/dist/jquery.slim.min.map +1 -0
- package/node_modules/jquery/external/sizzle/LICENSE.txt +36 -0
- package/node_modules/jquery/external/sizzle/dist/sizzle.js +2478 -0
- package/node_modules/jquery/external/sizzle/dist/sizzle.min.js +3 -0
- package/node_modules/jquery/external/sizzle/dist/sizzle.min.map +1 -0
- package/node_modules/jquery/package.json +116 -0
- package/node_modules/jquery/src/ajax/jsonp.js +103 -0
- package/node_modules/jquery/src/ajax/load.js +77 -0
- package/node_modules/jquery/src/ajax/script.js +74 -0
- package/node_modules/jquery/src/ajax/var/location.js +5 -0
- package/node_modules/jquery/src/ajax/var/nonce.js +5 -0
- package/node_modules/jquery/src/ajax/var/rquery.js +5 -0
- package/node_modules/jquery/src/ajax/xhr.js +170 -0
- package/node_modules/jquery/src/ajax.js +876 -0
- package/node_modules/jquery/src/attributes/attr.js +141 -0
- package/node_modules/jquery/src/attributes/classes.js +186 -0
- package/node_modules/jquery/src/attributes/prop.js +143 -0
- package/node_modules/jquery/src/attributes/support.js +33 -0
- package/node_modules/jquery/src/attributes/val.js +191 -0
- package/node_modules/jquery/src/attributes.js +13 -0
- package/node_modules/jquery/src/callbacks.js +236 -0
- package/node_modules/jquery/src/core/DOMEval.js +43 -0
- package/node_modules/jquery/src/core/access.js +72 -0
- package/node_modules/jquery/src/core/camelCase.js +23 -0
- package/node_modules/jquery/src/core/init.js +129 -0
- package/node_modules/jquery/src/core/isAttached.js +26 -0
- package/node_modules/jquery/src/core/nodeName.js +13 -0
- package/node_modules/jquery/src/core/parseHTML.js +65 -0
- package/node_modules/jquery/src/core/parseXML.js +35 -0
- package/node_modules/jquery/src/core/ready-no-deferred.js +97 -0
- package/node_modules/jquery/src/core/ready.js +86 -0
- package/node_modules/jquery/src/core/readyException.js +13 -0
- package/node_modules/jquery/src/core/stripAndCollapse.js +14 -0
- package/node_modules/jquery/src/core/support.js +20 -0
- package/node_modules/jquery/src/core/toType.js +20 -0
- package/node_modules/jquery/src/core/var/rsingleTag.js +7 -0
- package/node_modules/jquery/src/core.js +400 -0
- package/node_modules/jquery/src/css/addGetHookIf.js +26 -0
- package/node_modules/jquery/src/css/adjustCSS.js +74 -0
- package/node_modules/jquery/src/css/curCSS.js +65 -0
- package/node_modules/jquery/src/css/finalPropName.js +42 -0
- package/node_modules/jquery/src/css/hiddenVisibleSelectors.js +15 -0
- package/node_modules/jquery/src/css/showHide.js +105 -0
- package/node_modules/jquery/src/css/support.js +152 -0
- package/node_modules/jquery/src/css/var/cssExpand.js +5 -0
- package/node_modules/jquery/src/css/var/getStyles.js +17 -0
- package/node_modules/jquery/src/css/var/isHiddenWithinTree.js +34 -0
- package/node_modules/jquery/src/css/var/rboxStyle.js +7 -0
- package/node_modules/jquery/src/css/var/rnumnonpx.js +7 -0
- package/node_modules/jquery/src/css/var/swap.js +26 -0
- package/node_modules/jquery/src/css.js +494 -0
- package/node_modules/jquery/src/data/Data.js +162 -0
- package/node_modules/jquery/src/data/var/acceptData.js +19 -0
- package/node_modules/jquery/src/data/var/dataPriv.js +7 -0
- package/node_modules/jquery/src/data/var/dataUser.js +7 -0
- package/node_modules/jquery/src/data.js +180 -0
- package/node_modules/jquery/src/deferred/exceptionHook.js +21 -0
- package/node_modules/jquery/src/deferred.js +399 -0
- package/node_modules/jquery/src/deprecated/ajax-event-alias.js +22 -0
- package/node_modules/jquery/src/deprecated/event.js +50 -0
- package/node_modules/jquery/src/deprecated.js +87 -0
- package/node_modules/jquery/src/dimensions.js +60 -0
- package/node_modules/jquery/src/effects/Tween.js +125 -0
- package/node_modules/jquery/src/effects/animatedSelector.js +15 -0
- package/node_modules/jquery/src/effects.js +702 -0
- package/node_modules/jquery/src/event/focusin.js +58 -0
- package/node_modules/jquery/src/event/support.js +11 -0
- package/node_modules/jquery/src/event/trigger.js +199 -0
- package/node_modules/jquery/src/event.js +874 -0
- package/node_modules/jquery/src/exports/amd.js +26 -0
- package/node_modules/jquery/src/exports/global.js +34 -0
- package/node_modules/jquery/src/jquery.js +41 -0
- package/node_modules/jquery/src/manipulation/_evalUrl.js +32 -0
- package/node_modules/jquery/src/manipulation/buildFragment.js +106 -0
- package/node_modules/jquery/src/manipulation/getAll.js +32 -0
- package/node_modules/jquery/src/manipulation/setGlobalEval.js +22 -0
- package/node_modules/jquery/src/manipulation/support.js +41 -0
- package/node_modules/jquery/src/manipulation/var/rscriptType.js +5 -0
- package/node_modules/jquery/src/manipulation/var/rtagName.js +8 -0
- package/node_modules/jquery/src/manipulation/wrapMap.js +30 -0
- package/node_modules/jquery/src/manipulation.js +480 -0
- package/node_modules/jquery/src/offset.js +232 -0
- package/node_modules/jquery/src/queue/delay.js +24 -0
- package/node_modules/jquery/src/queue.js +145 -0
- package/node_modules/jquery/src/selector-native.js +241 -0
- package/node_modules/jquery/src/selector-sizzle.js +19 -0
- package/node_modules/jquery/src/selector.js +3 -0
- package/node_modules/jquery/src/serialize.js +134 -0
- package/node_modules/jquery/src/traversing/findFilter.js +97 -0
- package/node_modules/jquery/src/traversing/var/dir.js +22 -0
- package/node_modules/jquery/src/traversing/var/rneedsContext.js +8 -0
- package/node_modules/jquery/src/traversing/var/siblings.js +17 -0
- package/node_modules/jquery/src/traversing.js +198 -0
- package/node_modules/jquery/src/var/ObjectFunctionString.js +7 -0
- package/node_modules/jquery/src/var/arr.js +5 -0
- package/node_modules/jquery/src/var/class2type.js +6 -0
- package/node_modules/jquery/src/var/document.js +5 -0
- package/node_modules/jquery/src/var/documentElement.js +7 -0
- package/node_modules/jquery/src/var/flat.js +16 -0
- package/node_modules/jquery/src/var/fnToString.js +7 -0
- package/node_modules/jquery/src/var/getProto.js +5 -0
- package/node_modules/jquery/src/var/hasOwn.js +7 -0
- package/node_modules/jquery/src/var/indexOf.js +7 -0
- package/node_modules/jquery/src/var/isFunction.js +17 -0
- package/node_modules/jquery/src/var/isWindow.js +8 -0
- package/node_modules/jquery/src/var/pnum.js +5 -0
- package/node_modules/jquery/src/var/push.js +7 -0
- package/node_modules/jquery/src/var/rcheckableType.js +5 -0
- package/node_modules/jquery/src/var/rcssNum.js +9 -0
- package/node_modules/jquery/src/var/rnothtmlwhite.js +8 -0
- package/node_modules/jquery/src/var/slice.js +7 -0
- package/node_modules/jquery/src/var/support.js +6 -0
- package/node_modules/jquery/src/var/toString.js +7 -0
- package/node_modules/jquery/src/wrap.js +78 -0
- package/node_modules/moment/CHANGELOG.md +996 -0
- package/node_modules/moment/LICENSE +22 -0
- package/node_modules/moment/README.md +55 -0
- package/node_modules/moment/dist/locale/af.js +71 -0
- package/node_modules/moment/dist/locale/ar-dz.js +156 -0
- package/node_modules/moment/dist/locale/ar-kw.js +55 -0
- package/node_modules/moment/dist/locale/ar-ly.js +171 -0
- package/node_modules/moment/dist/locale/ar-ma.js +56 -0
- package/node_modules/moment/dist/locale/ar-ps.js +112 -0
- package/node_modules/moment/dist/locale/ar-sa.js +105 -0
- package/node_modules/moment/dist/locale/ar-tn.js +55 -0
- package/node_modules/moment/dist/locale/ar.js +189 -0
- package/node_modules/moment/dist/locale/az.js +102 -0
- package/node_modules/moment/dist/locale/be.js +142 -0
- package/node_modules/moment/dist/locale/bg.js +87 -0
- package/node_modules/moment/dist/locale/bm.js +52 -0
- package/node_modules/moment/dist/locale/bn-bd.js +129 -0
- package/node_modules/moment/dist/locale/bn.js +119 -0
- package/node_modules/moment/dist/locale/bo.js +124 -0
- package/node_modules/moment/dist/locale/br.js +168 -0
- package/node_modules/moment/dist/locale/bs.js +160 -0
- package/node_modules/moment/dist/locale/ca.js +100 -0
- package/node_modules/moment/dist/locale/cs.js +181 -0
- package/node_modules/moment/dist/locale/cv.js +63 -0
- package/node_modules/moment/dist/locale/cy.js +98 -0
- package/node_modules/moment/dist/locale/da.js +53 -0
- package/node_modules/moment/dist/locale/de-at.js +79 -0
- package/node_modules/moment/dist/locale/de-ch.js +78 -0
- package/node_modules/moment/dist/locale/de.js +78 -0
- package/node_modules/moment/dist/locale/dv.js +90 -0
- package/node_modules/moment/dist/locale/el.js +106 -0
- package/node_modules/moment/dist/locale/en-au.js +68 -0
- package/node_modules/moment/dist/locale/en-ca.js +64 -0
- package/node_modules/moment/dist/locale/en-gb.js +68 -0
- package/node_modules/moment/dist/locale/en-ie.js +68 -0
- package/node_modules/moment/dist/locale/en-il.js +64 -0
- package/node_modules/moment/dist/locale/en-in.js +68 -0
- package/node_modules/moment/dist/locale/en-nz.js +68 -0
- package/node_modules/moment/dist/locale/en-sg.js +68 -0
- package/node_modules/moment/dist/locale/eo.js +68 -0
- package/node_modules/moment/dist/locale/es-do.js +108 -0
- package/node_modules/moment/dist/locale/es-mx.js +110 -0
- package/node_modules/moment/dist/locale/es-us.js +110 -0
- package/node_modules/moment/dist/locale/es.js +110 -0
- package/node_modules/moment/dist/locale/et.js +78 -0
- package/node_modules/moment/dist/locale/eu.js +65 -0
- package/node_modules/moment/dist/locale/fa.js +113 -0
- package/node_modules/moment/dist/locale/fi.js +124 -0
- package/node_modules/moment/dist/locale/fil.js +58 -0
- package/node_modules/moment/dist/locale/fo.js +57 -0
- package/node_modules/moment/dist/locale/fr-ca.js +70 -0
- package/node_modules/moment/dist/locale/fr-ch.js +74 -0
- package/node_modules/moment/dist/locale/fr.js +108 -0
- package/node_modules/moment/dist/locale/fy.js +75 -0
- package/node_modules/moment/dist/locale/ga.js +95 -0
- package/node_modules/moment/dist/locale/gd.js +95 -0
- package/node_modules/moment/dist/locale/gl.js +75 -0
- package/node_modules/moment/dist/locale/gom-deva.js +126 -0
- package/node_modules/moment/dist/locale/gom-latn.js +124 -0
- package/node_modules/moment/dist/locale/gu.js +122 -0
- package/node_modules/moment/dist/locale/he.js +94 -0
- package/node_modules/moment/dist/locale/hi.js +168 -0
- package/node_modules/moment/dist/locale/hr.js +156 -0
- package/node_modules/moment/dist/locale/hu.js +118 -0
- package/node_modules/moment/dist/locale/hy-am.js +94 -0
- package/node_modules/moment/dist/locale/id.js +76 -0
- package/node_modules/moment/dist/locale/is.js +140 -0
- package/node_modules/moment/dist/locale/it-ch.js +64 -0
- package/node_modules/moment/dist/locale/it.js +106 -0
- package/node_modules/moment/dist/locale/ja.js +148 -0
- package/node_modules/moment/dist/locale/jv.js +76 -0
- package/node_modules/moment/dist/locale/ka.js +92 -0
- package/node_modules/moment/dist/locale/kk.js +82 -0
- package/node_modules/moment/dist/locale/km.js +103 -0
- package/node_modules/moment/dist/locale/kn.js +124 -0
- package/node_modules/moment/dist/locale/ko.js +75 -0
- package/node_modules/moment/dist/locale/ku-kmr.js +121 -0
- package/node_modules/moment/dist/locale/ku.js +118 -0
- package/node_modules/moment/dist/locale/ky.js +84 -0
- package/node_modules/moment/dist/locale/lb.js +137 -0
- package/node_modules/moment/dist/locale/lo.js +66 -0
- package/node_modules/moment/dist/locale/lt.js +125 -0
- package/node_modules/moment/dist/locale/lv.js +94 -0
- package/node_modules/moment/dist/locale/me.js +117 -0
- package/node_modules/moment/dist/locale/mi.js +60 -0
- package/node_modules/moment/dist/locale/mk.js +85 -0
- package/node_modules/moment/dist/locale/ml.js +82 -0
- package/node_modules/moment/dist/locale/mn.js +100 -0
- package/node_modules/moment/dist/locale/mr.js +203 -0
- package/node_modules/moment/dist/locale/ms-my.js +76 -0
- package/node_modules/moment/dist/locale/ms.js +75 -0
- package/node_modules/moment/dist/locale/mt.js +56 -0
- package/node_modules/moment/dist/locale/my.js +91 -0
- package/node_modules/moment/dist/locale/nb.js +60 -0
- package/node_modules/moment/dist/locale/ne.js +121 -0
- package/node_modules/moment/dist/locale/nl-be.js +102 -0
- package/node_modules/moment/dist/locale/nl.js +104 -0
- package/node_modules/moment/dist/locale/nn.js +59 -0
- package/node_modules/moment/dist/locale/oc-lnc.js +85 -0
- package/node_modules/moment/dist/locale/pa-in.js +122 -0
- package/node_modules/moment/dist/locale/pl.js +140 -0
- package/node_modules/moment/dist/locale/pt-br.js +58 -0
- package/node_modules/moment/dist/locale/pt.js +63 -0
- package/node_modules/moment/dist/locale/ro.js +76 -0
- package/node_modules/moment/dist/locale/ru.js +213 -0
- package/node_modules/moment/dist/locale/sd.js +81 -0
- package/node_modules/moment/dist/locale/se.js +57 -0
- package/node_modules/moment/dist/locale/si.js +69 -0
- package/node_modules/moment/dist/locale/sk.js +145 -0
- package/node_modules/moment/dist/locale/sl.js +171 -0
- package/node_modules/moment/dist/locale/sq.js +65 -0
- package/node_modules/moment/dist/locale/sr-cyrl.js +127 -0
- package/node_modules/moment/dist/locale/sr.js +129 -0
- package/node_modules/moment/dist/locale/ss.js +84 -0
- package/node_modules/moment/dist/locale/sv.js +68 -0
- package/node_modules/moment/dist/locale/sw.js +55 -0
- package/node_modules/moment/dist/locale/ta.js +131 -0
- package/node_modules/moment/dist/locale/te.js +88 -0
- package/node_modules/moment/dist/locale/tet.js +68 -0
- package/node_modules/moment/dist/locale/tg.js +117 -0
- package/node_modules/moment/dist/locale/th.js +65 -0
- package/node_modules/moment/dist/locale/tk.js +91 -0
- package/node_modules/moment/dist/locale/tl-ph.js +57 -0
- package/node_modules/moment/dist/locale/tlh.js +124 -0
- package/node_modules/moment/dist/locale/tr.js +106 -0
- package/node_modules/moment/dist/locale/tzl.js +89 -0
- package/node_modules/moment/dist/locale/tzm-latn.js +54 -0
- package/node_modules/moment/dist/locale/tzm.js +54 -0
- package/node_modules/moment/dist/locale/ug-cn.js +111 -0
- package/node_modules/moment/dist/locale/uk.js +167 -0
- package/node_modules/moment/dist/locale/ur.js +82 -0
- package/node_modules/moment/dist/locale/uz-latn.js +54 -0
- package/node_modules/moment/dist/locale/uz.js +51 -0
- package/node_modules/moment/dist/locale/vi.js +80 -0
- package/node_modules/moment/dist/locale/x-pseudo.js +73 -0
- package/node_modules/moment/dist/locale/yo.js +53 -0
- package/node_modules/moment/dist/locale/zh-cn.js +120 -0
- package/node_modules/moment/dist/locale/zh-hk.js +101 -0
- package/node_modules/moment/dist/locale/zh-mo.js +100 -0
- package/node_modules/moment/dist/locale/zh-tw.js +99 -0
- package/node_modules/moment/dist/moment.js +5680 -0
- package/node_modules/moment/ender.js +1 -0
- package/node_modules/moment/locale/af.js +82 -0
- package/node_modules/moment/locale/ar-dz.js +167 -0
- package/node_modules/moment/locale/ar-kw.js +66 -0
- package/node_modules/moment/locale/ar-ly.js +182 -0
- package/node_modules/moment/locale/ar-ma.js +67 -0
- package/node_modules/moment/locale/ar-ps.js +123 -0
- package/node_modules/moment/locale/ar-sa.js +116 -0
- package/node_modules/moment/locale/ar-tn.js +66 -0
- package/node_modules/moment/locale/ar.js +200 -0
- package/node_modules/moment/locale/az.js +113 -0
- package/node_modules/moment/locale/be.js +153 -0
- package/node_modules/moment/locale/bg.js +98 -0
- package/node_modules/moment/locale/bm.js +62 -0
- package/node_modules/moment/locale/bn-bd.js +140 -0
- package/node_modules/moment/locale/bn.js +130 -0
- package/node_modules/moment/locale/bo.js +135 -0
- package/node_modules/moment/locale/br.js +179 -0
- package/node_modules/moment/locale/bs.js +171 -0
- package/node_modules/moment/locale/ca.js +111 -0
- package/node_modules/moment/locale/cs.js +192 -0
- package/node_modules/moment/locale/cv.js +74 -0
- package/node_modules/moment/locale/cy.js +109 -0
- package/node_modules/moment/locale/da.js +64 -0
- package/node_modules/moment/locale/de-at.js +90 -0
- package/node_modules/moment/locale/de-ch.js +87 -0
- package/node_modules/moment/locale/de.js +89 -0
- package/node_modules/moment/locale/dv.js +101 -0
- package/node_modules/moment/locale/el.js +117 -0
- package/node_modules/moment/locale/en-au.js +79 -0
- package/node_modules/moment/locale/en-ca.js +75 -0
- package/node_modules/moment/locale/en-gb.js +79 -0
- package/node_modules/moment/locale/en-ie.js +79 -0
- package/node_modules/moment/locale/en-il.js +75 -0
- package/node_modules/moment/locale/en-in.js +79 -0
- package/node_modules/moment/locale/en-nz.js +79 -0
- package/node_modules/moment/locale/en-sg.js +79 -0
- package/node_modules/moment/locale/eo.js +79 -0
- package/node_modules/moment/locale/es-do.js +119 -0
- package/node_modules/moment/locale/es-mx.js +121 -0
- package/node_modules/moment/locale/es-us.js +121 -0
- package/node_modules/moment/locale/es.js +121 -0
- package/node_modules/moment/locale/et.js +89 -0
- package/node_modules/moment/locale/eu.js +76 -0
- package/node_modules/moment/locale/fa.js +124 -0
- package/node_modules/moment/locale/fi.js +135 -0
- package/node_modules/moment/locale/fil.js +69 -0
- package/node_modules/moment/locale/fo.js +68 -0
- package/node_modules/moment/locale/fr-ca.js +81 -0
- package/node_modules/moment/locale/fr-ch.js +85 -0
- package/node_modules/moment/locale/fr.js +119 -0
- package/node_modules/moment/locale/fy.js +86 -0
- package/node_modules/moment/locale/ga.js +106 -0
- package/node_modules/moment/locale/gd.js +106 -0
- package/node_modules/moment/locale/gl.js +86 -0
- package/node_modules/moment/locale/gom-deva.js +137 -0
- package/node_modules/moment/locale/gom-latn.js +135 -0
- package/node_modules/moment/locale/gu.js +133 -0
- package/node_modules/moment/locale/he.js +105 -0
- package/node_modules/moment/locale/hi.js +179 -0
- package/node_modules/moment/locale/hr.js +167 -0
- package/node_modules/moment/locale/hu.js +129 -0
- package/node_modules/moment/locale/hy-am.js +105 -0
- package/node_modules/moment/locale/id.js +87 -0
- package/node_modules/moment/locale/is.js +151 -0
- package/node_modules/moment/locale/it-ch.js +75 -0
- package/node_modules/moment/locale/it.js +117 -0
- package/node_modules/moment/locale/ja.js +159 -0
- package/node_modules/moment/locale/jv.js +87 -0
- package/node_modules/moment/locale/ka.js +103 -0
- package/node_modules/moment/locale/kk.js +93 -0
- package/node_modules/moment/locale/km.js +114 -0
- package/node_modules/moment/locale/kn.js +135 -0
- package/node_modules/moment/locale/ko.js +86 -0
- package/node_modules/moment/locale/ku-kmr.js +125 -0
- package/node_modules/moment/locale/ku.js +129 -0
- package/node_modules/moment/locale/ky.js +95 -0
- package/node_modules/moment/locale/lb.js +148 -0
- package/node_modules/moment/locale/lo.js +77 -0
- package/node_modules/moment/locale/lt.js +136 -0
- package/node_modules/moment/locale/lv.js +105 -0
- package/node_modules/moment/locale/me.js +128 -0
- package/node_modules/moment/locale/mi.js +71 -0
- package/node_modules/moment/locale/mk.js +97 -0
- package/node_modules/moment/locale/ml.js +93 -0
- package/node_modules/moment/locale/mn.js +111 -0
- package/node_modules/moment/locale/mr.js +214 -0
- package/node_modules/moment/locale/ms-my.js +87 -0
- package/node_modules/moment/locale/ms.js +86 -0
- package/node_modules/moment/locale/mt.js +67 -0
- package/node_modules/moment/locale/my.js +102 -0
- package/node_modules/moment/locale/nb.js +71 -0
- package/node_modules/moment/locale/ne.js +132 -0
- package/node_modules/moment/locale/nl-be.js +113 -0
- package/node_modules/moment/locale/nl.js +115 -0
- package/node_modules/moment/locale/nn.js +70 -0
- package/node_modules/moment/locale/oc-lnc.js +96 -0
- package/node_modules/moment/locale/pa-in.js +133 -0
- package/node_modules/moment/locale/pl.js +151 -0
- package/node_modules/moment/locale/pt-br.js +69 -0
- package/node_modules/moment/locale/pt.js +74 -0
- package/node_modules/moment/locale/ro.js +87 -0
- package/node_modules/moment/locale/ru.js +224 -0
- package/node_modules/moment/locale/sd.js +92 -0
- package/node_modules/moment/locale/se.js +68 -0
- package/node_modules/moment/locale/si.js +80 -0
- package/node_modules/moment/locale/sk.js +156 -0
- package/node_modules/moment/locale/sl.js +182 -0
- package/node_modules/moment/locale/sq.js +76 -0
- package/node_modules/moment/locale/sr-cyrl.js +138 -0
- package/node_modules/moment/locale/sr.js +140 -0
- package/node_modules/moment/locale/ss.js +95 -0
- package/node_modules/moment/locale/sv.js +79 -0
- package/node_modules/moment/locale/sw.js +66 -0
- package/node_modules/moment/locale/ta.js +142 -0
- package/node_modules/moment/locale/te.js +99 -0
- package/node_modules/moment/locale/tet.js +79 -0
- package/node_modules/moment/locale/tg.js +128 -0
- package/node_modules/moment/locale/th.js +76 -0
- package/node_modules/moment/locale/tk.js +102 -0
- package/node_modules/moment/locale/tl-ph.js +68 -0
- package/node_modules/moment/locale/tlh.js +135 -0
- package/node_modules/moment/locale/tr.js +117 -0
- package/node_modules/moment/locale/tzl.js +100 -0
- package/node_modules/moment/locale/tzm-latn.js +65 -0
- package/node_modules/moment/locale/tzm.js +65 -0
- package/node_modules/moment/locale/ug-cn.js +122 -0
- package/node_modules/moment/locale/uk.js +178 -0
- package/node_modules/moment/locale/ur.js +93 -0
- package/node_modules/moment/locale/uz-latn.js +65 -0
- package/node_modules/moment/locale/uz.js +62 -0
- package/node_modules/moment/locale/vi.js +91 -0
- package/node_modules/moment/locale/x-pseudo.js +84 -0
- package/node_modules/moment/locale/yo.js +64 -0
- package/node_modules/moment/locale/zh-cn.js +131 -0
- package/node_modules/moment/locale/zh-hk.js +112 -0
- package/node_modules/moment/locale/zh-mo.js +111 -0
- package/node_modules/moment/locale/zh-tw.js +110 -0
- package/node_modules/moment/min/locales.js +12800 -0
- package/node_modules/moment/min/locales.min.js +2 -0
- package/node_modules/moment/min/locales.min.js.map +1 -0
- package/node_modules/moment/min/moment-with-locales.js +18472 -0
- package/node_modules/moment/min/moment-with-locales.min.js +2 -0
- package/node_modules/moment/min/moment-with-locales.min.js.map +1 -0
- package/node_modules/moment/min/moment.min.js +2 -0
- package/node_modules/moment/min/moment.min.js.map +1 -0
- package/node_modules/moment/moment.d.ts +796 -0
- package/node_modules/moment/moment.js +5688 -0
- package/node_modules/moment/package.js +11 -0
- package/node_modules/moment/package.json +116 -0
- package/node_modules/moment/src/lib/create/check-overflow.js +57 -0
- package/node_modules/moment/src/lib/create/date-from-array.js +35 -0
- package/node_modules/moment/src/lib/create/from-anything.js +117 -0
- package/node_modules/moment/src/lib/create/from-array.js +187 -0
- package/node_modules/moment/src/lib/create/from-object.js +20 -0
- package/node_modules/moment/src/lib/create/from-string-and-array.js +67 -0
- package/node_modules/moment/src/lib/create/from-string-and-format.js +135 -0
- package/node_modules/moment/src/lib/create/from-string.js +258 -0
- package/node_modules/moment/src/lib/create/local.js +5 -0
- package/node_modules/moment/src/lib/create/parsing-flags.js +28 -0
- package/node_modules/moment/src/lib/create/utc.js +5 -0
- package/node_modules/moment/src/lib/create/valid.js +51 -0
- package/node_modules/moment/src/lib/duration/abs.js +18 -0
- package/node_modules/moment/src/lib/duration/add-subtract.js +21 -0
- package/node_modules/moment/src/lib/duration/as.js +76 -0
- package/node_modules/moment/src/lib/duration/bubble.js +68 -0
- package/node_modules/moment/src/lib/duration/clone.js +5 -0
- package/node_modules/moment/src/lib/duration/constructor.js +42 -0
- package/node_modules/moment/src/lib/duration/create.js +133 -0
- package/node_modules/moment/src/lib/duration/duration.js +16 -0
- package/node_modules/moment/src/lib/duration/get.js +27 -0
- package/node_modules/moment/src/lib/duration/humanize.js +114 -0
- package/node_modules/moment/src/lib/duration/iso-string.js +68 -0
- package/node_modules/moment/src/lib/duration/prototype.js +78 -0
- package/node_modules/moment/src/lib/duration/valid.js +55 -0
- package/node_modules/moment/src/lib/format/format.js +104 -0
- package/node_modules/moment/src/lib/locale/base-config.js +41 -0
- package/node_modules/moment/src/lib/locale/calendar.js +15 -0
- package/node_modules/moment/src/lib/locale/constructor.js +5 -0
- package/node_modules/moment/src/lib/locale/en.js +39 -0
- package/node_modules/moment/src/lib/locale/formats.js +36 -0
- package/node_modules/moment/src/lib/locale/invalid.js +5 -0
- package/node_modules/moment/src/lib/locale/lists.js +93 -0
- package/node_modules/moment/src/lib/locale/locale.js +45 -0
- package/node_modules/moment/src/lib/locale/locales.js +249 -0
- package/node_modules/moment/src/lib/locale/ordinal.js +8 -0
- package/node_modules/moment/src/lib/locale/pre-post-format.js +3 -0
- package/node_modules/moment/src/lib/locale/prototype.js +88 -0
- package/node_modules/moment/src/lib/locale/relative.js +32 -0
- package/node_modules/moment/src/lib/locale/set.js +56 -0
- package/node_modules/moment/src/lib/moment/add-subtract.js +61 -0
- package/node_modules/moment/src/lib/moment/calendar.js +53 -0
- package/node_modules/moment/src/lib/moment/clone.js +5 -0
- package/node_modules/moment/src/lib/moment/compare.js +72 -0
- package/node_modules/moment/src/lib/moment/constructor.js +80 -0
- package/node_modules/moment/src/lib/moment/creation-data.js +9 -0
- package/node_modules/moment/src/lib/moment/diff.js +79 -0
- package/node_modules/moment/src/lib/moment/format.js +78 -0
- package/node_modules/moment/src/lib/moment/from.js +20 -0
- package/node_modules/moment/src/lib/moment/get-set.js +117 -0
- package/node_modules/moment/src/lib/moment/locale.js +34 -0
- package/node_modules/moment/src/lib/moment/min-max.js +62 -0
- package/node_modules/moment/src/lib/moment/moment.js +28 -0
- package/node_modules/moment/src/lib/moment/now.js +3 -0
- package/node_modules/moment/src/lib/moment/prototype.js +197 -0
- package/node_modules/moment/src/lib/moment/start-end-of.js +164 -0
- package/node_modules/moment/src/lib/moment/to-type.js +42 -0
- package/node_modules/moment/src/lib/moment/to.js +20 -0
- package/node_modules/moment/src/lib/moment/valid.js +15 -0
- package/node_modules/moment/src/lib/parse/regex.js +84 -0
- package/node_modules/moment/src/lib/parse/token.js +36 -0
- package/node_modules/moment/src/lib/units/aliases.js +75 -0
- package/node_modules/moment/src/lib/units/constants.js +9 -0
- package/node_modules/moment/src/lib/units/day-of-month.js +35 -0
- package/node_modules/moment/src/lib/units/day-of-week.js +432 -0
- package/node_modules/moment/src/lib/units/day-of-year.js +28 -0
- package/node_modules/moment/src/lib/units/era.js +293 -0
- package/node_modules/moment/src/lib/units/hour.js +152 -0
- package/node_modules/moment/src/lib/units/millisecond.js +66 -0
- package/node_modules/moment/src/lib/units/minute.js +24 -0
- package/node_modules/moment/src/lib/units/month.js +340 -0
- package/node_modules/moment/src/lib/units/offset.js +249 -0
- package/node_modules/moment/src/lib/units/priorities.js +34 -0
- package/node_modules/moment/src/lib/units/quarter.js +24 -0
- package/node_modules/moment/src/lib/units/second.js +24 -0
- package/node_modules/moment/src/lib/units/timestamp.js +20 -0
- package/node_modules/moment/src/lib/units/timezone.js +16 -0
- package/node_modules/moment/src/lib/units/units.js +20 -0
- package/node_modules/moment/src/lib/units/week-calendar-utils.js +66 -0
- package/node_modules/moment/src/lib/units/week-year.js +128 -0
- package/node_modules/moment/src/lib/units/week.js +62 -0
- package/node_modules/moment/src/lib/units/year.js +75 -0
- package/node_modules/moment/src/lib/utils/abs-ceil.js +7 -0
- package/node_modules/moment/src/lib/utils/abs-floor.js +8 -0
- package/node_modules/moment/src/lib/utils/abs-round.js +7 -0
- package/node_modules/moment/src/lib/utils/compare-arrays.js +18 -0
- package/node_modules/moment/src/lib/utils/defaults.js +10 -0
- package/node_modules/moment/src/lib/utils/deprecate.js +69 -0
- package/node_modules/moment/src/lib/utils/extend.js +19 -0
- package/node_modules/moment/src/lib/utils/has-own-prop.js +3 -0
- package/node_modules/moment/src/lib/utils/hooks.js +13 -0
- package/node_modules/moment/src/lib/utils/index-of.js +18 -0
- package/node_modules/moment/src/lib/utils/is-array.js +6 -0
- package/node_modules/moment/src/lib/utils/is-calendar-spec.js +25 -0
- package/node_modules/moment/src/lib/utils/is-date.js +6 -0
- package/node_modules/moment/src/lib/utils/is-function.js +6 -0
- package/node_modules/moment/src/lib/utils/is-leap-year.js +3 -0
- package/node_modules/moment/src/lib/utils/is-moment-input.js +75 -0
- package/node_modules/moment/src/lib/utils/is-number.js +6 -0
- package/node_modules/moment/src/lib/utils/is-object-empty.js +15 -0
- package/node_modules/moment/src/lib/utils/is-object.js +8 -0
- package/node_modules/moment/src/lib/utils/is-string.js +3 -0
- package/node_modules/moment/src/lib/utils/is-undefined.js +3 -0
- package/node_modules/moment/src/lib/utils/keys.js +20 -0
- package/node_modules/moment/src/lib/utils/map.js +9 -0
- package/node_modules/moment/src/lib/utils/mod.js +3 -0
- package/node_modules/moment/src/lib/utils/some.js +20 -0
- package/node_modules/moment/src/lib/utils/to-int.js +12 -0
- package/node_modules/moment/src/lib/utils/zero-fill.js +10 -0
- package/node_modules/moment/src/locale/af.js +71 -0
- package/node_modules/moment/src/locale/ar-dz.js +156 -0
- package/node_modules/moment/src/locale/ar-kw.js +55 -0
- package/node_modules/moment/src/locale/ar-ly.js +171 -0
- package/node_modules/moment/src/locale/ar-ma.js +56 -0
- package/node_modules/moment/src/locale/ar-ps.js +112 -0
- package/node_modules/moment/src/locale/ar-sa.js +105 -0
- package/node_modules/moment/src/locale/ar-tn.js +55 -0
- package/node_modules/moment/src/locale/ar.js +189 -0
- package/node_modules/moment/src/locale/az.js +102 -0
- package/node_modules/moment/src/locale/be.js +142 -0
- package/node_modules/moment/src/locale/bg.js +87 -0
- package/node_modules/moment/src/locale/bm.js +52 -0
- package/node_modules/moment/src/locale/bn-bd.js +129 -0
- package/node_modules/moment/src/locale/bn.js +119 -0
- package/node_modules/moment/src/locale/bo.js +124 -0
- package/node_modules/moment/src/locale/br.js +168 -0
- package/node_modules/moment/src/locale/bs.js +160 -0
- package/node_modules/moment/src/locale/ca.js +100 -0
- package/node_modules/moment/src/locale/cs.js +181 -0
- package/node_modules/moment/src/locale/cv.js +63 -0
- package/node_modules/moment/src/locale/cy.js +98 -0
- package/node_modules/moment/src/locale/da.js +53 -0
- package/node_modules/moment/src/locale/de-at.js +79 -0
- package/node_modules/moment/src/locale/de-ch.js +78 -0
- package/node_modules/moment/src/locale/de.js +78 -0
- package/node_modules/moment/src/locale/dv.js +90 -0
- package/node_modules/moment/src/locale/el.js +106 -0
- package/node_modules/moment/src/locale/en-au.js +68 -0
- package/node_modules/moment/src/locale/en-ca.js +64 -0
- package/node_modules/moment/src/locale/en-gb.js +68 -0
- package/node_modules/moment/src/locale/en-ie.js +68 -0
- package/node_modules/moment/src/locale/en-il.js +64 -0
- package/node_modules/moment/src/locale/en-in.js +68 -0
- package/node_modules/moment/src/locale/en-nz.js +68 -0
- package/node_modules/moment/src/locale/en-sg.js +68 -0
- package/node_modules/moment/src/locale/eo.js +68 -0
- package/node_modules/moment/src/locale/es-do.js +108 -0
- package/node_modules/moment/src/locale/es-mx.js +110 -0
- package/node_modules/moment/src/locale/es-us.js +110 -0
- package/node_modules/moment/src/locale/es.js +110 -0
- package/node_modules/moment/src/locale/et.js +78 -0
- package/node_modules/moment/src/locale/eu.js +65 -0
- package/node_modules/moment/src/locale/fa.js +113 -0
- package/node_modules/moment/src/locale/fi.js +124 -0
- package/node_modules/moment/src/locale/fil.js +58 -0
- package/node_modules/moment/src/locale/fo.js +57 -0
- package/node_modules/moment/src/locale/fr-ca.js +70 -0
- package/node_modules/moment/src/locale/fr-ch.js +74 -0
- package/node_modules/moment/src/locale/fr.js +108 -0
- package/node_modules/moment/src/locale/fy.js +75 -0
- package/node_modules/moment/src/locale/ga.js +95 -0
- package/node_modules/moment/src/locale/gd.js +95 -0
- package/node_modules/moment/src/locale/gl.js +75 -0
- package/node_modules/moment/src/locale/gom-deva.js +126 -0
- package/node_modules/moment/src/locale/gom-latn.js +124 -0
- package/node_modules/moment/src/locale/gu.js +122 -0
- package/node_modules/moment/src/locale/he.js +94 -0
- package/node_modules/moment/src/locale/hi.js +168 -0
- package/node_modules/moment/src/locale/hr.js +156 -0
- package/node_modules/moment/src/locale/hu.js +118 -0
- package/node_modules/moment/src/locale/hy-am.js +94 -0
- package/node_modules/moment/src/locale/id.js +76 -0
- package/node_modules/moment/src/locale/is.js +140 -0
- package/node_modules/moment/src/locale/it-ch.js +64 -0
- package/node_modules/moment/src/locale/it.js +106 -0
- package/node_modules/moment/src/locale/ja.js +148 -0
- package/node_modules/moment/src/locale/jv.js +76 -0
- package/node_modules/moment/src/locale/ka.js +92 -0
- package/node_modules/moment/src/locale/kk.js +82 -0
- package/node_modules/moment/src/locale/km.js +103 -0
- package/node_modules/moment/src/locale/kn.js +124 -0
- package/node_modules/moment/src/locale/ko.js +75 -0
- package/node_modules/moment/src/locale/ku-kmr.js +121 -0
- package/node_modules/moment/src/locale/ku.js +118 -0
- package/node_modules/moment/src/locale/ky.js +84 -0
- package/node_modules/moment/src/locale/lb.js +137 -0
- package/node_modules/moment/src/locale/lo.js +66 -0
- package/node_modules/moment/src/locale/lt.js +125 -0
- package/node_modules/moment/src/locale/lv.js +94 -0
- package/node_modules/moment/src/locale/me.js +117 -0
- package/node_modules/moment/src/locale/mi.js +60 -0
- package/node_modules/moment/src/locale/mk.js +85 -0
- package/node_modules/moment/src/locale/ml.js +82 -0
- package/node_modules/moment/src/locale/mn.js +100 -0
- package/node_modules/moment/src/locale/mr.js +203 -0
- package/node_modules/moment/src/locale/ms-my.js +76 -0
- package/node_modules/moment/src/locale/ms.js +75 -0
- package/node_modules/moment/src/locale/mt.js +56 -0
- package/node_modules/moment/src/locale/my.js +91 -0
- package/node_modules/moment/src/locale/nb.js +60 -0
- package/node_modules/moment/src/locale/ne.js +121 -0
- package/node_modules/moment/src/locale/nl-be.js +102 -0
- package/node_modules/moment/src/locale/nl.js +104 -0
- package/node_modules/moment/src/locale/nn.js +59 -0
- package/node_modules/moment/src/locale/oc-lnc.js +85 -0
- package/node_modules/moment/src/locale/pa-in.js +122 -0
- package/node_modules/moment/src/locale/pl.js +140 -0
- package/node_modules/moment/src/locale/pt-br.js +58 -0
- package/node_modules/moment/src/locale/pt.js +63 -0
- package/node_modules/moment/src/locale/ro.js +76 -0
- package/node_modules/moment/src/locale/ru.js +213 -0
- package/node_modules/moment/src/locale/sd.js +81 -0
- package/node_modules/moment/src/locale/se.js +57 -0
- package/node_modules/moment/src/locale/si.js +69 -0
- package/node_modules/moment/src/locale/sk.js +145 -0
- package/node_modules/moment/src/locale/sl.js +171 -0
- package/node_modules/moment/src/locale/sq.js +65 -0
- package/node_modules/moment/src/locale/sr-cyrl.js +127 -0
- package/node_modules/moment/src/locale/sr.js +129 -0
- package/node_modules/moment/src/locale/ss.js +84 -0
- package/node_modules/moment/src/locale/sv.js +68 -0
- package/node_modules/moment/src/locale/sw.js +55 -0
- package/node_modules/moment/src/locale/ta.js +131 -0
- package/node_modules/moment/src/locale/te.js +88 -0
- package/node_modules/moment/src/locale/tet.js +68 -0
- package/node_modules/moment/src/locale/tg.js +117 -0
- package/node_modules/moment/src/locale/th.js +65 -0
- package/node_modules/moment/src/locale/tk.js +91 -0
- package/node_modules/moment/src/locale/tl-ph.js +57 -0
- package/node_modules/moment/src/locale/tlh.js +124 -0
- package/node_modules/moment/src/locale/tr.js +106 -0
- package/node_modules/moment/src/locale/tzl.js +89 -0
- package/node_modules/moment/src/locale/tzm-latn.js +54 -0
- package/node_modules/moment/src/locale/tzm.js +54 -0
- package/node_modules/moment/src/locale/ug-cn.js +111 -0
- package/node_modules/moment/src/locale/uk.js +167 -0
- package/node_modules/moment/src/locale/ur.js +82 -0
- package/node_modules/moment/src/locale/uz-latn.js +54 -0
- package/node_modules/moment/src/locale/uz.js +51 -0
- package/node_modules/moment/src/locale/vi.js +80 -0
- package/node_modules/moment/src/locale/x-pseudo.js +73 -0
- package/node_modules/moment/src/locale/yo.js +53 -0
- package/node_modules/moment/src/locale/zh-cn.js +120 -0
- package/node_modules/moment/src/locale/zh-hk.js +101 -0
- package/node_modules/moment/src/locale/zh-mo.js +100 -0
- package/node_modules/moment/src/locale/zh-tw.js +99 -0
- package/node_modules/moment/src/moment.js +93 -0
- package/node_modules/moment/ts3.1-typings/moment.d.ts +785 -0
- package/node_modules/moment-timezone/.editorconfig +22 -0
- package/node_modules/moment-timezone/LICENSE +20 -0
- package/node_modules/moment-timezone/README.md +64 -0
- package/node_modules/moment-timezone/builds/moment-timezone-with-data-10-year-range.js +1581 -0
- package/node_modules/moment-timezone/builds/moment-timezone-with-data-10-year-range.min.js +1 -0
- package/node_modules/moment-timezone/builds/moment-timezone-with-data-1970-2030.js +1581 -0
- package/node_modules/moment-timezone/builds/moment-timezone-with-data-1970-2030.min.js +1 -0
- package/node_modules/moment-timezone/builds/moment-timezone-with-data-2012-2022.js +1593 -0
- package/node_modules/moment-timezone/builds/moment-timezone-with-data-2012-2022.min.js +1 -0
- package/node_modules/moment-timezone/builds/moment-timezone-with-data.js +1581 -0
- package/node_modules/moment-timezone/builds/moment-timezone-with-data.min.js +1 -0
- package/node_modules/moment-timezone/builds/moment-timezone.min.js +1 -0
- package/node_modules/moment-timezone/changelog.md +277 -0
- package/node_modules/moment-timezone/composer.json +43 -0
- package/node_modules/moment-timezone/data/meta/latest.json +5877 -0
- package/node_modules/moment-timezone/data/packed/latest.json +852 -0
- package/node_modules/moment-timezone/index.d.ts +78 -0
- package/node_modules/moment-timezone/index.js +2 -0
- package/node_modules/moment-timezone/moment-timezone-utils.d.ts +70 -0
- package/node_modules/moment-timezone/moment-timezone-utils.js +339 -0
- package/node_modules/moment-timezone/moment-timezone.js +729 -0
- package/node_modules/moment-timezone/package.json +55 -0
- package/node_modules/next-line/.npmignore +1 -0
- package/node_modules/next-line/.travis.yml +8 -0
- package/node_modules/next-line/LICENSE +21 -0
- package/node_modules/next-line/README.md +30 -0
- package/node_modules/next-line/index.js +38 -0
- package/node_modules/next-line/package.json +38 -0
- package/node_modules/next-line/test.js +40 -0
- package/package.json +8 -9
package/README.md
CHANGED
|
@@ -1,5 +1,12 @@
|
|
|
1
1
|
# Mercury Parser - Extracting content from chaos
|
|
2
2
|
|
|
3
|
+
<a href="https://www.npmjs.com/package/@jocmp/mercury-parser">
|
|
4
|
+
<img src="https://img.shields.io/npm/v/@jocmp/mercury-parser.svg" alt="npm version">
|
|
5
|
+
</a>
|
|
6
|
+
<a href="https://github.com/jocmp/mercury-parser/actions/workflows/ci.yml">
|
|
7
|
+
<img src="https://github.com/jocmp/mercury-parser/actions/workflows/ci.yml/badge.svg" alt="CI">
|
|
8
|
+
</a>
|
|
9
|
+
|
|
3
10
|
Mercury Parser extracts the bits that humans care about from any URL you give it. That includes article content, titles, authors, published dates, excerpts, lead images, and more.
|
|
4
11
|
|
|
5
12
|
Mercury Parser allows you to easily create custom parsers using simple JavaScript and CSS selectors. This allows you to proactively manage parsing and migration edge cases. There are [many examples available](https://github.com/jocmp/mercury-parser/tree/master/src/extractors/custom) along with [documentation](https://github.com/jocmp/mercury-parser/blob/master/src/extractors/custom/README.md).
|
|
@@ -54,7 +61,7 @@ If Parser is unable to find a field, that field will return `null`.
|
|
|
54
61
|
|
|
55
62
|
##### Content Formats
|
|
56
63
|
|
|
57
|
-
By default,
|
|
64
|
+
By default, Mercury Parser returns the `content` field as HTML. However, you can override this behavior by passing in options to the `parse` function, specifying whether or not to scrape all pages of an article, and what type of output to return (valid values are `'html'`, `'markdown'`, and `'text'`). For example:
|
|
58
65
|
|
|
59
66
|
```javascript
|
|
60
67
|
Parser.parse(url, { contentType: 'markdown' }).then(result =>
|
|
@@ -84,7 +91,7 @@ Parser.parse(url, {
|
|
|
84
91
|
|
|
85
92
|
##### Pre-fetched HTML
|
|
86
93
|
|
|
87
|
-
You can use
|
|
94
|
+
You can use Mercury Parser to parse custom or pre-fetched HTML by passing an HTML string to the `parse` function as follows:
|
|
88
95
|
|
|
89
96
|
```javascript
|
|
90
97
|
Parser.parse(url, {
|
|
@@ -97,12 +104,12 @@ Note that the URL argument is still supplied, in order to identify the web site
|
|
|
97
104
|
|
|
98
105
|
#### The command-line parser
|
|
99
106
|
|
|
100
|
-
|
|
107
|
+
Mercury Parser also ships with a CLI, meaning you can use it from your command line like so:
|
|
101
108
|
|
|
102
|
-

|
|
103
110
|
|
|
104
111
|
```bash
|
|
105
|
-
# Install
|
|
112
|
+
# Install Mercury Parser globally
|
|
106
113
|
yarn global add @jocmp/mercury-parser
|
|
107
114
|
# or
|
|
108
115
|
npm -g install @jocmp/mercury-parser
|
|
@@ -140,10 +147,6 @@ Licensed under either of the below, at your preference:
|
|
|
140
147
|
|
|
141
148
|
## Contributing
|
|
142
149
|
|
|
143
|
-
For details on how to contribute to
|
|
150
|
+
For details on how to contribute to Mercury Parser, including how to write a custom content extractor for any site, see [CONTRIBUTING.md](./CONTRIBUTING.md)
|
|
144
151
|
|
|
145
152
|
Unless it is explicitly stated otherwise, any contribution intentionally submitted for inclusion in the work, as defined in the Apache-2.0 license, shall be dual licensed as above without any additional terms or conditions.
|
|
146
|
-
|
|
147
|
-
---
|
|
148
|
-
|
|
149
|
-
🔬 A Labs project from your friends at [Postlight](https://postlight.com). Happy coding!
|
|
@@ -5,7 +5,7 @@ function _interopDefault (ex) { return (ex && (typeof ex === 'object') && 'defau
|
|
|
5
5
|
var _slicedToArray = _interopDefault(require('@babel/runtime-corejs2/helpers/slicedToArray'));
|
|
6
6
|
var _toConsumableArray = _interopDefault(require('@babel/runtime-corejs2/helpers/toConsumableArray'));
|
|
7
7
|
var fs = _interopDefault(require('fs'));
|
|
8
|
-
var URL = _interopDefault(require('url'));
|
|
8
|
+
var URL$1 = _interopDefault(require('url'));
|
|
9
9
|
var inquirer = _interopDefault(require('inquirer'));
|
|
10
10
|
var ora = _interopDefault(require('ora'));
|
|
11
11
|
var child_process = require('child_process');
|
|
@@ -29,7 +29,6 @@ var postmanRequest = _interopDefault(require('postman-request'));
|
|
|
29
29
|
var assign = _interopDefault(require('@babel/runtime-corejs2/core-js/object/assign'));
|
|
30
30
|
var keys = _interopDefault(require('@babel/runtime-corejs2/core-js/object/keys'));
|
|
31
31
|
var stringDirection = _interopDefault(require('string-direction'));
|
|
32
|
-
var validUrl = _interopDefault(require('valid-url'));
|
|
33
32
|
var momentTimezone = _interopDefault(require('moment-timezone'));
|
|
34
33
|
var momentParseformat = _interopDefault(require('moment-parseformat'));
|
|
35
34
|
var wuzzy = _interopDefault(require('wuzzy'));
|
|
@@ -77,7 +76,7 @@ function absolutize($, rootUrl, attr) {
|
|
|
77
76
|
var attrs = getAttrs(node);
|
|
78
77
|
var url = attrs[attr];
|
|
79
78
|
if (!url) return;
|
|
80
|
-
var absoluteUrl = URL.resolve(baseUrl || rootUrl, url);
|
|
79
|
+
var absoluteUrl = URL$1.resolve(baseUrl || rootUrl, url);
|
|
81
80
|
setAttr(node, attr, absoluteUrl);
|
|
82
81
|
});
|
|
83
82
|
}
|
|
@@ -97,7 +96,7 @@ function absolutizeSet($, rootUrl, $content) {
|
|
|
97
96
|
// a candidate URL cannot start or end with a comma
|
|
98
97
|
// descriptors are separated from the URLs by unescaped whitespace
|
|
99
98
|
var parts = candidate.trim().replace(/,$/, '').split(/\s+/);
|
|
100
|
-
parts[0] = URL.resolve(rootUrl, parts[0]);
|
|
99
|
+
parts[0] = URL$1.resolve(rootUrl, parts[0]);
|
|
101
100
|
return parts.join(' ');
|
|
102
101
|
});
|
|
103
102
|
|
|
@@ -162,7 +161,7 @@ var _objectWithoutProperties = _interopDefault$1(objectWithoutProperties);
|
|
|
162
161
|
|
|
163
162
|
var _asyncToGenerator = _interopDefault$1(asyncToGenerator);
|
|
164
163
|
|
|
165
|
-
var URL$1 = _interopDefault$1(URL);
|
|
164
|
+
var URL$1$1 = _interopDefault$1(URL$1);
|
|
166
165
|
|
|
167
166
|
var cheerio$1 = _interopDefault$1(cheerio);
|
|
168
167
|
|
|
@@ -198,8 +197,6 @@ var _Object$keys = _interopDefault$1(keys);
|
|
|
198
197
|
|
|
199
198
|
var stringDirection$1 = _interopDefault$1(stringDirection);
|
|
200
199
|
|
|
201
|
-
var validUrl$1 = _interopDefault$1(validUrl);
|
|
202
|
-
|
|
203
200
|
var moment = _interopDefault$1(momentTimezone);
|
|
204
201
|
|
|
205
202
|
var parseFormat = _interopDefault$1(momentParseformat);
|
|
@@ -302,7 +299,7 @@ function isGoodSegment$1(segment, index, firstSegmentHasLetters) {
|
|
|
302
299
|
|
|
303
300
|
|
|
304
301
|
function articleBaseUrl$1(url, parsed) {
|
|
305
|
-
var parsedUrl = parsed || URL$1.parse(url);
|
|
302
|
+
var parsedUrl = parsed || URL$1$1.parse(url);
|
|
306
303
|
var protocol = parsedUrl.protocol,
|
|
307
304
|
host = parsedUrl.host,
|
|
308
305
|
path = parsedUrl.path;
|
|
@@ -455,7 +452,7 @@ function _fetchResource() {
|
|
|
455
452
|
_regeneratorRuntime.mark(function _callee(url, parsedUrl) {
|
|
456
453
|
var headers,
|
|
457
454
|
options,
|
|
458
|
-
|
|
455
|
+
_yield$get,
|
|
459
456
|
response,
|
|
460
457
|
body,
|
|
461
458
|
_args = arguments;
|
|
@@ -465,7 +462,7 @@ function _fetchResource() {
|
|
|
465
462
|
switch (_context.prev = _context.next) {
|
|
466
463
|
case 0:
|
|
467
464
|
headers = _args.length > 2 && _args[2] !== undefined ? _args[2] : {};
|
|
468
|
-
parsedUrl = parsedUrl || URL$1.parse(encodeURI(url));
|
|
465
|
+
parsedUrl = parsedUrl || URL$1$1.parse(encodeURI(url));
|
|
469
466
|
options = _objectSpread({
|
|
470
467
|
url: parsedUrl.href,
|
|
471
468
|
headers: _objectSpread({}, REQUEST_HEADERS, headers),
|
|
@@ -487,9 +484,9 @@ function _fetchResource() {
|
|
|
487
484
|
return get(options);
|
|
488
485
|
|
|
489
486
|
case 5:
|
|
490
|
-
|
|
491
|
-
response =
|
|
492
|
-
body =
|
|
487
|
+
_yield$get = _context.sent;
|
|
488
|
+
response = _yield$get.response;
|
|
489
|
+
body = _yield$get.body;
|
|
493
490
|
_context.prev = 8;
|
|
494
491
|
validateResponse(response);
|
|
495
492
|
return _context.abrupt("return", {
|
|
@@ -818,7 +815,7 @@ function markToKeep$1(article, $, url) {
|
|
|
818
815
|
}
|
|
819
816
|
|
|
820
817
|
if (url) {
|
|
821
|
-
var _URL$parse = URL$1.parse(url),
|
|
818
|
+
var _URL$parse = URL$1$1.parse(url),
|
|
822
819
|
protocol = _URL$parse.protocol,
|
|
823
820
|
hostname = _URL$parse.hostname;
|
|
824
821
|
|
|
@@ -1424,7 +1421,7 @@ function absolutize$1($, rootUrl, attr) {
|
|
|
1424
1421
|
var attrs = getAttrs$1(node);
|
|
1425
1422
|
var url = attrs[attr];
|
|
1426
1423
|
if (!url) return;
|
|
1427
|
-
var absoluteUrl = URL$1.resolve(baseUrl || rootUrl, url);
|
|
1424
|
+
var absoluteUrl = URL$1$1.resolve(baseUrl || rootUrl, url);
|
|
1428
1425
|
setAttr$1(node, attr, absoluteUrl);
|
|
1429
1426
|
});
|
|
1430
1427
|
}
|
|
@@ -1444,7 +1441,7 @@ function absolutizeSet$1($, rootUrl, $content) {
|
|
|
1444
1441
|
// a candidate URL cannot start or end with a comma
|
|
1445
1442
|
// descriptors are separated from the URLs by unescaped whitespace
|
|
1446
1443
|
var parts = candidate.trim().replace(/,$/, '').split(/\s+/);
|
|
1447
|
-
parts[0] = URL$1.resolve(rootUrl, parts[0]);
|
|
1444
|
+
parts[0] = URL$1$1.resolve(rootUrl, parts[0]);
|
|
1448
1445
|
return parts.join(' ');
|
|
1449
1446
|
});
|
|
1450
1447
|
|
|
@@ -2189,13 +2186,16 @@ var NewYorkerExtractor = {
|
|
|
2189
2186
|
var WiredExtractor = {
|
|
2190
2187
|
domain: 'www.wired.com',
|
|
2191
2188
|
title: {
|
|
2192
|
-
selectors: ['h1[data-testId="ContentHeaderHed"]'
|
|
2189
|
+
selectors: ['h1[data-testId="ContentHeaderHed"]' // enter title selectors
|
|
2190
|
+
]
|
|
2193
2191
|
},
|
|
2194
2192
|
author: {
|
|
2195
|
-
selectors: [['meta[name="article:author"]', 'value'], 'a[rel="author"]'
|
|
2193
|
+
selectors: [['meta[name="article:author"]', 'value'], 'a[rel="author"]' // enter author selectors
|
|
2194
|
+
]
|
|
2196
2195
|
},
|
|
2197
2196
|
content: {
|
|
2198
|
-
selectors: ['article.article.main-content', 'article.content'
|
|
2197
|
+
selectors: ['article.article.main-content', 'article.content' // enter content selectors
|
|
2198
|
+
],
|
|
2199
2199
|
// Is there anything in the content you selected that needs transformed
|
|
2200
2200
|
// before it's consumable content? E.g., unusual lazy loaded images
|
|
2201
2201
|
transforms: [],
|
|
@@ -2222,13 +2222,16 @@ var WiredExtractor = {
|
|
|
2222
2222
|
var MSNExtractor = {
|
|
2223
2223
|
domain: 'www.msn.com',
|
|
2224
2224
|
title: {
|
|
2225
|
-
selectors: ['h1'
|
|
2225
|
+
selectors: ['h1' // enter title selectors
|
|
2226
|
+
]
|
|
2226
2227
|
},
|
|
2227
2228
|
author: {
|
|
2228
|
-
selectors: ['span.authorname-txt'
|
|
2229
|
+
selectors: ['span.authorname-txt' // enter author selectors
|
|
2230
|
+
]
|
|
2229
2231
|
},
|
|
2230
2232
|
content: {
|
|
2231
|
-
selectors: ['div.richtext'
|
|
2233
|
+
selectors: ['div.richtext' // enter content selectors
|
|
2234
|
+
],
|
|
2232
2235
|
// Is there anything in the content you selected that needs transformed
|
|
2233
2236
|
// before it's consumable content? E.g., unusual lazy loaded images
|
|
2234
2237
|
transforms: [],
|
|
@@ -2255,10 +2258,12 @@ var MSNExtractor = {
|
|
|
2255
2258
|
var YahooExtractor = {
|
|
2256
2259
|
domain: 'www.yahoo.com',
|
|
2257
2260
|
title: {
|
|
2258
|
-
selectors: ['header.canvas-header'
|
|
2261
|
+
selectors: ['header.canvas-header' // enter title selectors
|
|
2262
|
+
]
|
|
2259
2263
|
},
|
|
2260
2264
|
author: {
|
|
2261
|
-
selectors: ['span.provider-name'
|
|
2265
|
+
selectors: ['span.provider-name' // enter author selectors
|
|
2266
|
+
]
|
|
2262
2267
|
},
|
|
2263
2268
|
content: {
|
|
2264
2269
|
selectors: [// enter content selectors
|
|
@@ -2291,10 +2296,12 @@ var BuzzfeedExtractor = {
|
|
|
2291
2296
|
domain: 'www.buzzfeed.com',
|
|
2292
2297
|
supportedDomains: ['www.buzzfeednews.com'],
|
|
2293
2298
|
title: {
|
|
2294
|
-
selectors: ['h1.embed-headline-title'
|
|
2299
|
+
selectors: ['h1.embed-headline-title' // enter title selectors
|
|
2300
|
+
]
|
|
2295
2301
|
},
|
|
2296
2302
|
author: {
|
|
2297
|
-
selectors: ['a[data-action="user/username"]', 'byline__author', ['meta[name="author"]', 'value']
|
|
2303
|
+
selectors: ['a[data-action="user/username"]', 'byline__author', ['meta[name="author"]', 'value'] // enter author selectors
|
|
2304
|
+
]
|
|
2298
2305
|
},
|
|
2299
2306
|
content: {
|
|
2300
2307
|
selectors: [['div[class^="featureimage_featureImageWrapper"]', '.js-subbuzz-wrapper'], ['.js-subbuzz-wrapper']],
|
|
@@ -2335,13 +2342,16 @@ var BuzzfeedExtractor = {
|
|
|
2335
2342
|
var WikiaExtractor = {
|
|
2336
2343
|
domain: 'fandom.wikia.com',
|
|
2337
2344
|
title: {
|
|
2338
|
-
selectors: ['h1.entry-title'
|
|
2345
|
+
selectors: ['h1.entry-title' // enter title selectors
|
|
2346
|
+
]
|
|
2339
2347
|
},
|
|
2340
2348
|
author: {
|
|
2341
|
-
selectors: ['.author vcard', '.fn'
|
|
2349
|
+
selectors: ['.author vcard', '.fn' // enter author selectors
|
|
2350
|
+
]
|
|
2342
2351
|
},
|
|
2343
2352
|
content: {
|
|
2344
|
-
selectors: ['.grid-content', '.entry-content'
|
|
2353
|
+
selectors: ['.grid-content', '.entry-content' // enter content selectors
|
|
2354
|
+
],
|
|
2345
2355
|
// Is there anything in the content you selected that needs transformed
|
|
2346
2356
|
// before it's consumable content? E.g., unusual lazy loaded images
|
|
2347
2357
|
transforms: [],
|
|
@@ -2368,10 +2378,12 @@ var WikiaExtractor = {
|
|
|
2368
2378
|
var LittleThingsExtractor = {
|
|
2369
2379
|
domain: 'www.littlethings.com',
|
|
2370
2380
|
title: {
|
|
2371
|
-
selectors: ['h1[class*="PostHeader"]', 'h1.post-title'
|
|
2381
|
+
selectors: ['h1[class*="PostHeader"]', 'h1.post-title' // enter title selectors
|
|
2382
|
+
]
|
|
2372
2383
|
},
|
|
2373
2384
|
author: {
|
|
2374
|
-
selectors: ['div[class^="PostHeader__ScAuthorNameSection"]', ['meta[name="author"]', 'value']
|
|
2385
|
+
selectors: ['div[class^="PostHeader__ScAuthorNameSection"]', ['meta[name="author"]', 'value'] // enter author selectors
|
|
2386
|
+
]
|
|
2375
2387
|
},
|
|
2376
2388
|
content: {
|
|
2377
2389
|
selectors: [// enter content selectors
|
|
@@ -2814,7 +2826,8 @@ var WwwThevergeComExtractor = {
|
|
|
2814
2826
|
// Is there anything that is in the result that shouldn't be?
|
|
2815
2827
|
// The clean selectors will remove anything that matches from
|
|
2816
2828
|
// the result
|
|
2817
|
-
clean: ['.aside', 'img.c-dynamic-image'
|
|
2829
|
+
clean: ['.aside', 'img.c-dynamic-image' // images come from noscript transform
|
|
2830
|
+
]
|
|
2818
2831
|
}
|
|
2819
2832
|
};
|
|
2820
2833
|
var WwwCnnComExtractor = {
|
|
@@ -3535,7 +3548,8 @@ var WwwThepoliticalinsiderComExtractor = {
|
|
|
3535
3548
|
]
|
|
3536
3549
|
},
|
|
3537
3550
|
lead_image_url: {
|
|
3538
|
-
selectors: [['meta[name="og:image"]', 'value']
|
|
3551
|
+
selectors: [['meta[name="og:image"]', 'value'] // enter selectors
|
|
3552
|
+
]
|
|
3539
3553
|
},
|
|
3540
3554
|
content: {
|
|
3541
3555
|
selectors: ['div#article-body'],
|
|
@@ -4866,7 +4880,8 @@ var WwwRedditComExtractor = {
|
|
|
4866
4880
|
content: {
|
|
4867
4881
|
selectors: [['div[data-test-id="post-content"] p'], // text post
|
|
4868
4882
|
['div[data-test-id="post-content"] a[target="_blank"]:not([data-click-id="timestamp"])', // external link
|
|
4869
|
-
'div[data-test-id="post-content"] div[data-click-id="media"]'
|
|
4883
|
+
'div[data-test-id="post-content"] div[data-click-id="media"]' // embedded media
|
|
4884
|
+
], // external link with media preview (YouTube, imgur album, etc...)
|
|
4870
4885
|
['div[data-test-id="post-content"] div[data-click-id="media"]'], // Embedded media (Reddit video)
|
|
4871
4886
|
['div[data-test-id="post-content"] a'], // external link
|
|
4872
4887
|
'div[data-test-id="post-content"]'],
|
|
@@ -5563,7 +5578,7 @@ var WiredJpExtractor = {
|
|
|
5563
5578
|
'img[data-original]': function imgDataOriginal($node) {
|
|
5564
5579
|
var dataOriginal = $node.attr('data-original');
|
|
5565
5580
|
var src = $node.attr('src');
|
|
5566
|
-
var url = URL$1.resolve(src, dataOriginal);
|
|
5581
|
+
var url = URL$1$1.resolve(src, dataOriginal);
|
|
5567
5582
|
$node.attr('src', url);
|
|
5568
5583
|
}
|
|
5569
5584
|
},
|
|
@@ -6168,6 +6183,52 @@ var WwwCbcCaExtractor = {
|
|
|
6168
6183
|
clean: []
|
|
6169
6184
|
}
|
|
6170
6185
|
};
|
|
6186
|
+
var WwwVersantsComExtractor = {
|
|
6187
|
+
domain: 'www.versants.com',
|
|
6188
|
+
title: {
|
|
6189
|
+
selectors: [['meta[name="og:title"]', 'value']]
|
|
6190
|
+
},
|
|
6191
|
+
author: {
|
|
6192
|
+
selectors: [['meta[name="author"]', 'value']]
|
|
6193
|
+
},
|
|
6194
|
+
date_published: {
|
|
6195
|
+
selectors: [['meta[name="article:published_time"]', 'value']]
|
|
6196
|
+
},
|
|
6197
|
+
lead_image_url: {
|
|
6198
|
+
selectors: [['meta[name="og:image"]', 'value']]
|
|
6199
|
+
},
|
|
6200
|
+
content: {
|
|
6201
|
+
selectors: ['.entry-content'],
|
|
6202
|
+
clean: ['.adv-link', '.versa-target']
|
|
6203
|
+
}
|
|
6204
|
+
};
|
|
6205
|
+
var Www1pezeshkComExtractor = {
|
|
6206
|
+
domain: 'www.1pezeshk.com',
|
|
6207
|
+
title: {
|
|
6208
|
+
selectors: [['meta[name="og:title"]', 'value'], 'h1.post-title']
|
|
6209
|
+
},
|
|
6210
|
+
author: {
|
|
6211
|
+
selectors: [['meta[name="author"]', 'value']]
|
|
6212
|
+
},
|
|
6213
|
+
date_published: {
|
|
6214
|
+
selectors: [['meta[name="article:published_time"]', 'value']]
|
|
6215
|
+
},
|
|
6216
|
+
lead_image_url: {
|
|
6217
|
+
selectors: [['.featured-area img', 'src']]
|
|
6218
|
+
},
|
|
6219
|
+
content: {
|
|
6220
|
+
selectors: ['article > .entry-content'],
|
|
6221
|
+
transforms: {
|
|
6222
|
+
img: function img($node) {
|
|
6223
|
+
$node.src = decodeURIComponent($node.src);
|
|
6224
|
+
}
|
|
6225
|
+
},
|
|
6226
|
+
// Is there anything that is in the result that shouldn't be?
|
|
6227
|
+
// The clean selectors will remove anything that matches from
|
|
6228
|
+
// the result
|
|
6229
|
+
clean: []
|
|
6230
|
+
}
|
|
6231
|
+
};
|
|
6171
6232
|
|
|
6172
6233
|
var CustomExtractors =
|
|
6173
6234
|
/*#__PURE__*/
|
|
@@ -6314,7 +6375,9 @@ _Object$freeze({
|
|
|
6314
6375
|
SpektrumExtractor: SpektrumExtractor,
|
|
6315
6376
|
PostlightComExtractor: PostlightComExtractor,
|
|
6316
6377
|
WwwInvestmentexecutiveComExtractor: WwwInvestmentexecutiveComExtractor,
|
|
6317
|
-
WwwCbcCaExtractor: WwwCbcCaExtractor
|
|
6378
|
+
WwwCbcCaExtractor: WwwCbcCaExtractor,
|
|
6379
|
+
WwwVersantsComExtractor: WwwVersantsComExtractor,
|
|
6380
|
+
Www1pezeshkComExtractor: Www1pezeshkComExtractor
|
|
6318
6381
|
});
|
|
6319
6382
|
|
|
6320
6383
|
var Extractors = _Object$keys(CustomExtractors).reduce(function (acc, key) {
|
|
@@ -6356,13 +6419,11 @@ function cleanAuthor(author) {
|
|
|
6356
6419
|
}
|
|
6357
6420
|
|
|
6358
6421
|
function clean$1(leadImageUrl) {
|
|
6359
|
-
|
|
6360
|
-
|
|
6361
|
-
|
|
6362
|
-
return
|
|
6422
|
+
try {
|
|
6423
|
+
return new URL(leadImageUrl.trim()).toString();
|
|
6424
|
+
} catch (_unused) {
|
|
6425
|
+
return null;
|
|
6363
6426
|
}
|
|
6364
|
-
|
|
6365
|
-
return null;
|
|
6366
6427
|
} // Return None if the dek wasn't good enough.
|
|
6367
6428
|
|
|
6368
6429
|
|
|
@@ -6549,7 +6610,7 @@ function cleanDomainFromTitle(splitTitle, url) {
|
|
|
6549
6610
|
//
|
|
6550
6611
|
// Strip out the big TLDs - it just makes the matching a bit more
|
|
6551
6612
|
// accurate. Not the end of the world if it doesn't strip right.
|
|
6552
|
-
var _URL$parse = URL$1.parse(url),
|
|
6613
|
+
var _URL$parse = URL$1$1.parse(url),
|
|
6553
6614
|
host = _URL$parse.host;
|
|
6554
6615
|
|
|
6555
6616
|
var nakedDomain = host.replace(DOMAIN_ENDINGS_RE, '');
|
|
@@ -7296,7 +7357,7 @@ function shouldScore(href, articleUrl, baseUrl, parsedUrl, linkText, previousUrl
|
|
|
7296
7357
|
|
|
7297
7358
|
var hostname = parsedUrl.hostname;
|
|
7298
7359
|
|
|
7299
|
-
var _URL$parse = URL$1.parse(href),
|
|
7360
|
+
var _URL$parse = URL$1$1.parse(href),
|
|
7300
7361
|
linkHost = _URL$parse.hostname; // Domain mismatch.
|
|
7301
7362
|
|
|
7302
7363
|
|
|
@@ -7378,7 +7439,7 @@ function scoreLinks(_ref) {
|
|
|
7378
7439
|
$ = _ref.$,
|
|
7379
7440
|
_ref$previousUrls = _ref.previousUrls,
|
|
7380
7441
|
previousUrls = _ref$previousUrls === void 0 ? [] : _ref$previousUrls;
|
|
7381
|
-
parsedUrl = parsedUrl || URL$1.parse(articleUrl);
|
|
7442
|
+
parsedUrl = parsedUrl || URL$1$1.parse(articleUrl);
|
|
7382
7443
|
var baseRegex = makeBaseRegex(baseUrl);
|
|
7383
7444
|
var isWp = isWordpress$1($); // Loop through all links, looking for hints that they may be next-page
|
|
7384
7445
|
// links. Things like having "page" in their textContent, className or
|
|
@@ -7440,7 +7501,7 @@ var GenericNextPageUrlExtractor = {
|
|
|
7440
7501
|
parsedUrl = _ref.parsedUrl,
|
|
7441
7502
|
_ref$previousUrls = _ref.previousUrls,
|
|
7442
7503
|
previousUrls = _ref$previousUrls === void 0 ? [] : _ref$previousUrls;
|
|
7443
|
-
parsedUrl = parsedUrl || URL$1.parse(url);
|
|
7504
|
+
parsedUrl = parsedUrl || URL$1$1.parse(url);
|
|
7444
7505
|
var articleUrl = removeAnchor$1(url);
|
|
7445
7506
|
var baseUrl = articleBaseUrl$1(url, parsedUrl);
|
|
7446
7507
|
var links = $('a[href]').toArray();
|
|
@@ -7475,7 +7536,7 @@ var GenericNextPageUrlExtractor = {
|
|
|
7475
7536
|
var CANONICAL_META_SELECTORS = ['og:url'];
|
|
7476
7537
|
|
|
7477
7538
|
function parseDomain(url) {
|
|
7478
|
-
var parsedUrl = URL$1.parse(url);
|
|
7539
|
+
var parsedUrl = URL$1$1.parse(url);
|
|
7479
7540
|
var hostname = parsedUrl.hostname;
|
|
7480
7541
|
return hostname;
|
|
7481
7542
|
}
|
|
@@ -7644,7 +7705,7 @@ function detectByHtml($) {
|
|
|
7644
7705
|
}
|
|
7645
7706
|
|
|
7646
7707
|
function getExtractor(url, parsedUrl, $) {
|
|
7647
|
-
parsedUrl = parsedUrl || URL$1.parse(url);
|
|
7708
|
+
parsedUrl = parsedUrl || URL$1$1.parse(url);
|
|
7648
7709
|
var _parsedUrl = parsedUrl,
|
|
7649
7710
|
hostname = _parsedUrl.hostname;
|
|
7650
7711
|
var baseDomain = hostname.split('.').slice(-2).join('.');
|
|
@@ -7868,6 +7929,12 @@ var RootExtractor = {
|
|
|
7868
7929
|
};
|
|
7869
7930
|
}
|
|
7870
7931
|
|
|
7932
|
+
var extendedResults = {};
|
|
7933
|
+
|
|
7934
|
+
if (extractor.extend) {
|
|
7935
|
+
extendedResults = selectExtendedTypes(extractor.extend, opts);
|
|
7936
|
+
}
|
|
7937
|
+
|
|
7871
7938
|
var title = extractResult(_objectSpread({}, opts, {
|
|
7872
7939
|
type: 'title'
|
|
7873
7940
|
}));
|
|
@@ -7916,12 +7983,6 @@ var RootExtractor = {
|
|
|
7916
7983
|
url = _ref3.url,
|
|
7917
7984
|
domain = _ref3.domain;
|
|
7918
7985
|
|
|
7919
|
-
var extendedResults = {};
|
|
7920
|
-
|
|
7921
|
-
if (extractor.extend) {
|
|
7922
|
-
extendedResults = selectExtendedTypes(extractor.extend, opts);
|
|
7923
|
-
}
|
|
7924
|
-
|
|
7925
7986
|
return _objectSpread({
|
|
7926
7987
|
title: title,
|
|
7927
7988
|
content: content,
|
|
@@ -8056,7 +8117,7 @@ var Parser = {
|
|
|
8056
8117
|
html = html || cheerio$1.html();
|
|
8057
8118
|
}
|
|
8058
8119
|
|
|
8059
|
-
parsedUrl = URL$1.parse(url);
|
|
8120
|
+
parsedUrl = URL$1$1.parse(url);
|
|
8060
8121
|
|
|
8061
8122
|
if (validateUrl(parsedUrl)) {
|
|
8062
8123
|
_context.next = 6;
|
|
@@ -8291,7 +8352,7 @@ var questions = [{
|
|
|
8291
8352
|
name: 'website',
|
|
8292
8353
|
message: "Paste a url to an article you'd like to create or extend a parser for:",
|
|
8293
8354
|
validate: function validate(value) {
|
|
8294
|
-
var _URL$parse = URL.parse(value),
|
|
8355
|
+
var _URL$parse = URL$1.parse(value),
|
|
8295
8356
|
hostname = _URL$parse.hostname;
|
|
8296
8357
|
|
|
8297
8358
|
if (hostname) return true;
|
|
@@ -8325,7 +8386,7 @@ function confirmCreateDir(dir, msg) {
|
|
|
8325
8386
|
}
|
|
8326
8387
|
|
|
8327
8388
|
function getDir(url) {
|
|
8328
|
-
var _URL$parse2 = URL.parse(url),
|
|
8389
|
+
var _URL$parse2 = URL$1.parse(url),
|
|
8329
8390
|
hostname = _URL$parse2.hostname;
|
|
8330
8391
|
|
|
8331
8392
|
return "./src/extractors/custom/".concat(hostname);
|
|
@@ -8334,7 +8395,7 @@ function getDir(url) {
|
|
|
8334
8395
|
function scaffoldCustomParser(url) {
|
|
8335
8396
|
var dir = getDir(url);
|
|
8336
8397
|
|
|
8337
|
-
var _URL$parse3 = URL.parse(url),
|
|
8398
|
+
var _URL$parse3 = URL$1.parse(url),
|
|
8338
8399
|
hostname = _URL$parse3.hostname;
|
|
8339
8400
|
|
|
8340
8401
|
var newParser = false;
|
|
@@ -8360,7 +8421,7 @@ if (urlArg) {
|
|
|
8360
8421
|
}
|
|
8361
8422
|
|
|
8362
8423
|
function generateScaffold(url, file, result) {
|
|
8363
|
-
var _URL$parse4 = URL.parse(url),
|
|
8424
|
+
var _URL$parse4 = URL$1.parse(url),
|
|
8364
8425
|
hostname = _URL$parse4.hostname;
|
|
8365
8426
|
|
|
8366
8427
|
var extractor = extractorTemplate(hostname, extractorName(hostname));
|
|
@@ -8375,7 +8436,7 @@ function savePage($, _ref, newParser) {
|
|
|
8375
8436
|
var _ref2 = _slicedToArray(_ref, 1),
|
|
8376
8437
|
url = _ref2[0];
|
|
8377
8438
|
|
|
8378
|
-
var _URL$parse5 = URL.parse(url),
|
|
8439
|
+
var _URL$parse5 = URL$1.parse(url),
|
|
8379
8440
|
hostname = _URL$parse5.hostname;
|
|
8380
8441
|
|
|
8381
8442
|
spinner.succeed();
|
|
@@ -8406,7 +8467,7 @@ function savePage($, _ref, newParser) {
|
|
|
8406
8467
|
}
|
|
8407
8468
|
|
|
8408
8469
|
function exportString(url) {
|
|
8409
|
-
var _URL$parse6 = URL.parse(url),
|
|
8470
|
+
var _URL$parse6 = URL$1.parse(url),
|
|
8410
8471
|
hostname = _URL$parse6.hostname;
|
|
8411
8472
|
|
|
8412
8473
|
return "export * from './".concat(hostname, "';");
|