hydra-crawler 2.8.3 → 3.0.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/apis/{autocomplete.api.d.ts → autocomplete.api.d.mts} +4 -4
- package/dist/apis/autocomplete.api.mjs +14 -0
- package/dist/apis/autocomplete.api.mjs.map +1 -0
- package/dist/apis/{bugs.api.d.ts → bugs.api.d.mts} +4 -4
- package/dist/apis/bugs.api.mjs +18 -0
- package/dist/apis/bugs.api.mjs.map +1 -0
- package/dist/apis/{crawl.api.d.ts → crawl.api.d.mts} +4 -4
- package/dist/apis/crawl.api.mjs +17 -0
- package/dist/apis/crawl.api.mjs.map +1 -0
- package/dist/apis/{domains.api.d.ts → domains.api.d.mts} +4 -4
- package/dist/apis/{domains.api.js → domains.api.mjs} +10 -18
- package/dist/apis/domains.api.mjs.map +1 -0
- package/dist/apis/{images.api.d.ts → images.api.d.mts} +4 -4
- package/dist/apis/images.api.mjs +19 -0
- package/dist/apis/images.api.mjs.map +1 -0
- package/dist/apis/{statistics.api.d.ts → statistics.api.d.mts} +4 -4
- package/dist/apis/statistics.api.mjs +33 -0
- package/dist/apis/statistics.api.mjs.map +1 -0
- package/dist/apis/{test.api.d.ts → test.api.d.mts} +3 -3
- package/dist/apis/test.api.mjs +10 -0
- package/dist/apis/test.api.mjs.map +1 -0
- package/dist/apis/{urls.api.d.ts → urls.api.d.mts} +4 -4
- package/dist/apis/urls.api.mjs +21 -0
- package/dist/apis/urls.api.mjs.map +1 -0
- package/dist/apps/{cleanup.app.d.ts → cleanup.app.d.mts} +5 -5
- package/dist/apps/cleanup.app.mjs +129 -0
- package/dist/apps/cleanup.app.mjs.map +1 -0
- package/dist/apps/{cross-populate-export.app.d.ts → cross-populate-export.app.d.mts} +3 -3
- package/dist/apps/cross-populate-export.app.mjs +61 -0
- package/dist/apps/cross-populate-export.app.mjs.map +1 -0
- package/dist/apps/{cross-populate-import.app.d.ts → cross-populate-import.app.d.mts} +3 -3
- package/dist/apps/cross-populate-import.app.mjs +61 -0
- package/dist/apps/cross-populate-import.app.mjs.map +1 -0
- package/dist/apps/{denylist.app.d.ts → denylist.app.d.mts} +5 -5
- package/dist/apps/denylist.app.mjs +122 -0
- package/dist/apps/denylist.app.mjs.map +1 -0
- package/dist/apps/{expire.app.d.ts → expire.app.d.mts} +8 -7
- package/dist/apps/expire.app.mjs +51 -0
- package/dist/apps/expire.app.mjs.map +1 -0
- package/dist/apps/{export-domain-urls.d.ts → export-domain-urls.d.mts} +3 -3
- package/dist/apps/export-domain-urls.mjs +85 -0
- package/dist/apps/export-domain-urls.mjs.map +1 -0
- package/dist/apps/{extract-text.app.d.ts → extract-text.app.d.mts} +2 -2
- package/dist/apps/extract-text.app.mjs +43 -0
- package/dist/apps/extract-text.app.mjs.map +1 -0
- package/dist/apps/{hydra.app.d.ts → hydra.app.d.mts} +10 -10
- package/dist/apps/hydra.app.mjs +222 -0
- package/dist/apps/hydra.app.mjs.map +1 -0
- package/dist/apps/{import.app.d.ts → import.app.d.mts} +3 -3
- package/dist/apps/import.app.mjs +48 -0
- package/dist/apps/import.app.mjs.map +1 -0
- package/dist/apps/{internal-hydra-common.app.d.ts → internal-hydra-common.app.d.mts} +6 -6
- package/dist/apps/{internal-hydra-common.app.js → internal-hydra-common.app.mjs} +1 -1
- package/dist/apps/internal-hydra-common.app.mjs.map +1 -0
- package/dist/apps/{move-to-archive.app.d.ts → move-to-archive.app.d.mts} +2 -2
- package/dist/apps/move-to-archive.app.mjs +31 -0
- package/dist/apps/move-to-archive.app.mjs.map +1 -0
- package/dist/apps/{prune-archive.app.d.ts → prune-archive.app.d.mts} +2 -2
- package/dist/apps/prune-archive.app.mjs +40 -0
- package/dist/apps/prune-archive.app.mjs.map +1 -0
- package/dist/apps/{query.app.d.ts → query.app.d.mts} +6 -6
- package/dist/apps/query.app.mjs +69 -0
- package/dist/apps/query.app.mjs.map +1 -0
- package/dist/apps/{reattempt.app.d.ts → reattempt.app.d.mts} +6 -6
- package/dist/apps/reattempt.app.mjs +74 -0
- package/dist/apps/reattempt.app.mjs.map +1 -0
- package/dist/apps/{requeue-domain.app.d.ts → requeue-domain.app.d.mts} +3 -3
- package/dist/apps/requeue-domain.app.mjs +52 -0
- package/dist/apps/requeue-domain.app.mjs.map +1 -0
- package/dist/apps/{seed.app.d.ts → seed.app.d.mts} +5 -5
- package/dist/apps/seed.app.mjs +59 -0
- package/dist/apps/seed.app.mjs.map +1 -0
- package/dist/apps/{startup.app.d.ts → startup.app.d.mts} +3 -3
- package/dist/apps/startup.app.mjs +55 -0
- package/dist/apps/startup.app.mjs.map +1 -0
- package/dist/apps/{unarchive-urls.app.d.ts → unarchive-urls.app.d.mts} +5 -5
- package/dist/apps/unarchive-urls.app.mjs +71 -0
- package/dist/apps/unarchive-urls.app.mjs.map +1 -0
- package/dist/classes/{cleaner.d.ts → cleaner.d.mts} +2 -2
- package/dist/classes/cleaner.mjs +257 -0
- package/dist/classes/cleaner.mjs.map +1 -0
- package/dist/classes/{crawler.d.ts → crawler.d.mts} +10 -12
- package/dist/classes/crawler.mjs +418 -0
- package/dist/classes/crawler.mjs.map +1 -0
- package/dist/classes/{dns.js → dns.mjs} +4 -4
- package/dist/classes/dns.mjs.map +1 -0
- package/dist/classes/{expirer.d.ts → expirer.d.mts} +2 -2
- package/dist/classes/expirer.mjs +117 -0
- package/dist/classes/expirer.mjs.map +1 -0
- package/dist/classes/{expiry.d.ts → expiry.d.mts} +1 -1
- package/dist/classes/{expiry.js → expiry.mjs} +7 -9
- package/dist/classes/expiry.mjs.map +1 -0
- package/dist/classes/{lists.d.ts → lists.d.mts} +2 -2
- package/dist/classes/{lists.js → lists.mjs} +4 -4
- package/dist/classes/lists.mjs.map +1 -0
- package/dist/classes/{robot.d.ts → robot.d.mts} +3 -3
- package/dist/classes/robot.mjs +74 -0
- package/dist/classes/robot.mjs.map +1 -0
- package/dist/classes/{tracker.d.ts → tracker.d.mts} +3 -3
- package/dist/classes/tracker.mjs +101 -0
- package/dist/classes/tracker.mjs.map +1 -0
- package/dist/{cli.js → cli.mjs} +46 -58
- package/dist/cli.mjs.map +1 -0
- package/dist/enums/{eavailable-strategy.js → eavailable-strategy.mjs} +1 -1
- package/dist/enums/eavailable-strategy.mjs.map +1 -0
- package/dist/enums/{elist.js → elist.mjs} +1 -1
- package/dist/enums/elist.mjs.map +1 -0
- package/dist/enums/{eserver.js → eserver.mjs} +1 -1
- package/dist/enums/eserver.mjs.map +1 -0
- package/dist/enums/{ex-powered-by.js → ex-powered-by.mjs} +1 -1
- package/dist/enums/ex-powered-by.mjs.map +1 -0
- package/dist/helpers/{matcher.d.ts → matcher.d.mts} +1 -1
- package/dist/helpers/{matcher.js → matcher.mjs} +1 -1
- package/dist/helpers/matcher.mjs.map +1 -0
- package/dist/helpers/{random.d.ts → random.d.mts} +1 -1
- package/dist/helpers/{random.js → random.mjs} +1 -1
- package/dist/helpers/random.mjs.map +1 -0
- package/dist/helpers/{utf-decoder.d.ts → utf-decoder.d.mts} +0 -1
- package/dist/helpers/{utf-decoder.js → utf-decoder.mjs} +3 -3
- package/dist/helpers/utf-decoder.mjs.map +1 -0
- package/dist/interfaces/{iexpiry.d.ts → iexpiry.d.mts} +1 -1
- package/dist/interfaces/{iexpiry.js → iexpiry.mjs} +3 -3
- package/dist/interfaces/iexpiry.mjs.map +1 -0
- package/dist/interfaces/{imatch.js → imatch.mjs} +2 -2
- package/dist/interfaces/imatch.mjs.map +1 -0
- package/dist/interfaces/{iparser-config.js → iparser-config.mjs} +2 -2
- package/dist/interfaces/iparser-config.mjs.map +1 -0
- package/dist/interfaces/{iparser.d.ts → iparser.d.mts} +1 -1
- package/dist/interfaces/iparser.mjs +2 -0
- package/dist/interfaces/iparser.mjs.map +1 -0
- package/dist/interfaces/{irequest-outcome.d.ts → irequest-outcome.d.mts} +0 -2
- package/dist/interfaces/irequest-outcome.mjs +2 -0
- package/dist/interfaces/irequest-outcome.mjs.map +1 -0
- package/dist/interfaces/iserver.mjs +2 -0
- package/dist/interfaces/iserver.mjs.map +1 -0
- package/dist/parsers/accessibility-metrics.parser.d.mts +11 -0
- package/dist/parsers/accessibility-metrics.parser.mjs +30 -0
- package/dist/parsers/accessibility-metrics.parser.mjs.map +1 -0
- package/dist/parsers/asp-error.parser.d.mts +12 -0
- package/dist/parsers/asp-error.parser.mjs +38 -0
- package/dist/parsers/asp-error.parser.mjs.map +1 -0
- package/dist/parsers/{bad-words.parser.d.ts → bad-words.parser.d.mts} +6 -6
- package/dist/parsers/bad-words.parser.mjs +17 -0
- package/dist/parsers/bad-words.parser.mjs.map +1 -0
- package/dist/parsers/complex-english.parser.d.mts +15 -0
- package/dist/parsers/complex-english.parser.mjs +52 -0
- package/dist/parsers/complex-english.parser.mjs.map +1 -0
- package/dist/parsers/data.parser.d.mts +13 -0
- package/dist/parsers/{data.parser.js → data.parser.mjs} +8 -7
- package/dist/parsers/data.parser.mjs.map +1 -0
- package/dist/parsers/{dictionary.parser.d.ts → dictionary.parser.d.mts} +6 -6
- package/dist/parsers/dictionary.parser.mjs +63 -0
- package/dist/parsers/dictionary.parser.mjs.map +1 -0
- package/dist/parsers/html.parser.d.mts +13 -0
- package/dist/parsers/{html.parser.js → html.parser.mjs} +4 -3
- package/dist/parsers/html.parser.mjs.map +1 -0
- package/dist/parsers/hyperlinks.parser.d.mts +20 -0
- package/dist/parsers/hyperlinks.parser.mjs +104 -0
- package/dist/parsers/hyperlinks.parser.mjs.map +1 -0
- package/dist/parsers/image-tags.parser.d.mts +19 -0
- package/dist/parsers/image-tags.parser.mjs +42 -0
- package/dist/parsers/image-tags.parser.mjs.map +1 -0
- package/dist/parsers/{interest.parser.d.ts → interest.parser.d.mts} +7 -7
- package/dist/parsers/interest.parser.mjs +60 -0
- package/dist/parsers/interest.parser.mjs.map +1 -0
- package/dist/parsers/jpeg.parser.d.mts +11 -0
- package/dist/parsers/jpeg.parser.mjs +29 -0
- package/dist/parsers/jpeg.parser.mjs.map +1 -0
- package/dist/parsers/{llama-guard.parser.d.ts → llama-guard.parser.d.mts} +7 -7
- package/dist/parsers/llama-guard.parser.mjs +56 -0
- package/dist/parsers/llama-guard.parser.mjs.map +1 -0
- package/dist/parsers/{offence.parser.d.ts → offence.parser.d.mts} +7 -7
- package/dist/parsers/offence.parser.mjs +60 -0
- package/dist/parsers/offence.parser.mjs.map +1 -0
- package/dist/parsers/{ollama.parser.d.ts → ollama.parser.d.mts} +6 -6
- package/dist/parsers/ollama.parser.mjs +43 -0
- package/dist/parsers/ollama.parser.mjs.map +1 -0
- package/dist/parsers/{paragraphs.parser.d.ts → paragraphs.parser.d.mts} +5 -5
- package/dist/parsers/paragraphs.parser.mjs +38 -0
- package/dist/parsers/paragraphs.parser.mjs.map +1 -0
- package/dist/parsers/{parser.d.ts → parser.d.mts} +6 -6
- package/dist/parsers/parser.mjs +45 -0
- package/dist/parsers/parser.mjs.map +1 -0
- package/dist/parsers/php-error.parser.d.mts +12 -0
- package/dist/parsers/php-error.parser.mjs +42 -0
- package/dist/parsers/php-error.parser.mjs.map +1 -0
- package/dist/parsers/{phrase.parser.d.ts → phrase.parser.d.mts} +3 -3
- package/dist/parsers/phrase.parser.mjs +15 -0
- package/dist/parsers/phrase.parser.mjs.map +1 -0
- package/dist/parsers/{regex.parser.d.ts → regex.parser.d.mts} +3 -3
- package/dist/parsers/regex.parser.mjs +29 -0
- package/dist/parsers/regex.parser.mjs.map +1 -0
- package/dist/parsers/server.parser.d.mts +11 -0
- package/dist/parsers/server.parser.mjs +57 -0
- package/dist/parsers/server.parser.mjs.map +1 -0
- package/dist/parsers/{spelling.parser.d.ts → spelling.parser.d.mts} +6 -6
- package/dist/parsers/spelling.parser.mjs +17 -0
- package/dist/parsers/spelling.parser.mjs.map +1 -0
- package/dist/parsers/string.parser.d.mts +8 -0
- package/dist/parsers/{string.parser.js → string.parser.mjs} +5 -4
- package/dist/parsers/string.parser.mjs.map +1 -0
- package/dist/parsers/{text.parser.d.ts → text.parser.d.mts} +3 -3
- package/dist/parsers/text.parser.mjs +30 -0
- package/dist/parsers/text.parser.mjs.map +1 -0
- package/dist/parsers/{words.parser.d.ts → words.parser.d.mts} +3 -3
- package/dist/parsers/words.parser.mjs +29 -0
- package/dist/parsers/words.parser.mjs.map +1 -0
- package/dist/queries/complex-english.query.d.mts +2 -0
- package/dist/queries/{complex-english.query.js → complex-english.query.mjs} +18 -27
- package/dist/queries/complex-english.query.mjs.map +1 -0
- package/dist/queries/flash-content.query.d.mts +2 -0
- package/dist/queries/flash-content.query.mjs +80 -0
- package/dist/queries/flash-content.query.mjs.map +1 -0
- package/dist/queries/linking-to-domains.query.d.mts +2 -0
- package/dist/queries/linking-to-domains.query.mjs +128 -0
- package/dist/queries/linking-to-domains.query.mjs.map +1 -0
- package/dist/queries/llamaguard-unsafe-content.query.d.mts +2 -0
- package/dist/queries/llamaguard-unsafe-content.query.mjs +90 -0
- package/dist/queries/llamaguard-unsafe-content.query.mjs.map +1 -0
- package/dist/queries/readability-score.query.d.mts +2 -0
- package/dist/queries/{readability-score.query.js → readability-score.query.mjs} +11 -20
- package/dist/queries/readability-score.query.mjs.map +1 -0
- package/dist/servers/{crawl.server.d.ts → crawl.server.d.mts} +10 -10
- package/dist/servers/crawl.server.mjs +192 -0
- package/dist/servers/crawl.server.mjs.map +1 -0
- package/dist/servers/{express.server.d.ts → express.server.d.mts} +2 -3
- package/dist/servers/express.server.mjs +13 -0
- package/dist/servers/express.server.mjs.map +1 -0
- package/dist/servers/{maintenance.server.d.ts → maintenance.server.d.mts} +5 -5
- package/dist/servers/maintenance.server.mjs +97 -0
- package/dist/servers/maintenance.server.mjs.map +1 -0
- package/dist/servers/{rest.server.d.ts → rest.server.d.mts} +4 -4
- package/dist/servers/rest.server.mjs +62 -0
- package/dist/servers/rest.server.mjs.map +1 -0
- package/dist/servers/{socket-io.server.d.ts → socket-io.server.d.mts} +4 -4
- package/dist/servers/socket-io.server.mjs +22 -0
- package/dist/servers/socket-io.server.mjs.map +1 -0
- package/dist/services/{database.service.d.ts → database.service.d.mts} +12 -12
- package/dist/services/database.service.mjs +645 -0
- package/dist/services/database.service.mjs.map +1 -0
- package/dist/services/{ollama-rest.service.d.ts → ollama-rest.service.d.mts} +2 -2
- package/dist/services/ollama-rest.service.mjs +27 -0
- package/dist/services/ollama-rest.service.mjs.map +1 -0
- package/dist/services/{rig-llama-guard.service.d.ts → rig-llama-guard.service.d.mts} +2 -2
- package/dist/services/{rig-llama-guard.service.js → rig-llama-guard.service.mjs} +33 -43
- package/dist/services/rig-llama-guard.service.mjs.map +1 -0
- package/dist/services/{rig-queue-length.service.d.ts → rig-queue-length.service.d.mts} +1 -1
- package/dist/services/rig-queue-length.service.mjs +12 -0
- package/dist/services/rig-queue-length.service.mjs.map +1 -0
- package/dist/services/{rig-subjectivity-scale.service.d.ts → rig-subjectivity-scale.service.d.mts} +2 -2
- package/dist/services/rig-subjectivity-scale.service.mjs +82 -0
- package/dist/services/rig-subjectivity-scale.service.mjs.map +1 -0
- package/dist/services/{rig-ticket-rest.service.d.ts → rig-ticket-rest.service.d.mts} +3 -3
- package/dist/services/rig-ticket-rest.service.mjs +15 -0
- package/dist/services/rig-ticket-rest.service.mjs.map +1 -0
- package/dist/services/{rig-ticketed-promise.service.d.ts → rig-ticketed-promise.service.d.mts} +4 -6
- package/dist/services/{rig-ticketed-promise.service.js → rig-ticketed-promise.service.mjs} +7 -6
- package/dist/services/rig-ticketed-promise.service.mjs.map +1 -0
- package/dist/types/{tcrawl-config.js → tcrawl-config.mjs} +2 -2
- package/dist/types/tcrawl-config.mjs.map +1 -0
- package/dist/types/{thydra-config.js → thydra-config.mjs} +2 -2
- package/dist/types/thydra-config.mjs.map +1 -0
- package/dist/types/tparser-ctor.d.mts +7 -0
- package/dist/types/tparser-ctor.mjs +2 -0
- package/dist/types/tparser-ctor.mjs.map +1 -0
- package/dist/types/tquery.d.mts +7 -0
- package/dist/types/tquery.mjs +2 -0
- package/dist/types/tquery.mjs.map +1 -0
- package/dist/types/tqueue-length.mjs +2 -0
- package/dist/types/tqueue-length.mjs.map +1 -0
- package/dist/types/{trobots-config.js → trobots-config.mjs} +2 -2
- package/dist/types/trobots-config.mjs.map +1 -0
- package/package.json +37 -43
- package/dist/apis/autocomplete.api.js +0 -22
- package/dist/apis/autocomplete.api.js.map +0 -1
- package/dist/apis/bugs.api.js +0 -26
- package/dist/apis/bugs.api.js.map +0 -1
- package/dist/apis/crawl.api.js +0 -25
- package/dist/apis/crawl.api.js.map +0 -1
- package/dist/apis/domains.api.js.map +0 -1
- package/dist/apis/images.api.js +0 -27
- package/dist/apis/images.api.js.map +0 -1
- package/dist/apis/statistics.api.js +0 -41
- package/dist/apis/statistics.api.js.map +0 -1
- package/dist/apis/test.api.js +0 -19
- package/dist/apis/test.api.js.map +0 -1
- package/dist/apis/urls.api.js +0 -29
- package/dist/apis/urls.api.js.map +0 -1
- package/dist/apps/cleanup.app.js +0 -141
- package/dist/apps/cleanup.app.js.map +0 -1
- package/dist/apps/cross-populate-export.app.js +0 -75
- package/dist/apps/cross-populate-export.app.js.map +0 -1
- package/dist/apps/cross-populate-import.app.js +0 -100
- package/dist/apps/cross-populate-import.app.js.map +0 -1
- package/dist/apps/denylist.app.js +0 -132
- package/dist/apps/denylist.app.js.map +0 -1
- package/dist/apps/expire.app.js +0 -63
- package/dist/apps/expire.app.js.map +0 -1
- package/dist/apps/export-domain-urls.js +0 -99
- package/dist/apps/export-domain-urls.js.map +0 -1
- package/dist/apps/extract-text.app.js +0 -55
- package/dist/apps/extract-text.app.js.map +0 -1
- package/dist/apps/hydra.app.js +0 -218
- package/dist/apps/hydra.app.js.map +0 -1
- package/dist/apps/import.app.js +0 -57
- package/dist/apps/import.app.js.map +0 -1
- package/dist/apps/internal-hydra-common.app.js.map +0 -1
- package/dist/apps/move-to-archive.app.js +0 -46
- package/dist/apps/move-to-archive.app.js.map +0 -1
- package/dist/apps/prune-archive.app.js +0 -55
- package/dist/apps/prune-archive.app.js.map +0 -1
- package/dist/apps/query.app.js +0 -80
- package/dist/apps/query.app.js.map +0 -1
- package/dist/apps/reattempt.app.js +0 -83
- package/dist/apps/reattempt.app.js.map +0 -1
- package/dist/apps/requeue-domain.app.js +0 -64
- package/dist/apps/requeue-domain.app.js.map +0 -1
- package/dist/apps/seed.app.js +0 -69
- package/dist/apps/seed.app.js.map +0 -1
- package/dist/apps/startup.app.js +0 -64
- package/dist/apps/startup.app.js.map +0 -1
- package/dist/apps/unarchive-urls.app.js +0 -83
- package/dist/apps/unarchive-urls.app.js.map +0 -1
- package/dist/classes/cleaner.js +0 -266
- package/dist/classes/cleaner.js.map +0 -1
- package/dist/classes/crawler.js +0 -422
- package/dist/classes/crawler.js.map +0 -1
- package/dist/classes/dns.js.map +0 -1
- package/dist/classes/expirer.js +0 -121
- package/dist/classes/expirer.js.map +0 -1
- package/dist/classes/expiry.js.map +0 -1
- package/dist/classes/lists.js.map +0 -1
- package/dist/classes/robot.js +0 -82
- package/dist/classes/robot.js.map +0 -1
- package/dist/classes/tracker.js +0 -120
- package/dist/classes/tracker.js.map +0 -1
- package/dist/cli.js.map +0 -1
- package/dist/enums/eavailable-strategy.js.map +0 -1
- package/dist/enums/elist.js.map +0 -1
- package/dist/enums/eserver.js.map +0 -1
- package/dist/enums/ex-powered-by.js.map +0 -1
- package/dist/helpers/matcher.js.map +0 -1
- package/dist/helpers/random.js.map +0 -1
- package/dist/helpers/utf-decoder.js.map +0 -1
- package/dist/interfaces/iexpiry.js.map +0 -1
- package/dist/interfaces/imatch.js.map +0 -1
- package/dist/interfaces/iparser-config.js.map +0 -1
- package/dist/interfaces/iparser.js +0 -2
- package/dist/interfaces/iparser.js.map +0 -1
- package/dist/interfaces/irequest-outcome.js +0 -2
- package/dist/interfaces/irequest-outcome.js.map +0 -1
- package/dist/interfaces/iserver.js +0 -2
- package/dist/interfaces/iserver.js.map +0 -1
- package/dist/parsers/accessibility-metrics.parser.d.ts +0 -11
- package/dist/parsers/accessibility-metrics.parser.js +0 -40
- package/dist/parsers/accessibility-metrics.parser.js.map +0 -1
- package/dist/parsers/asp-error.parser.d.ts +0 -12
- package/dist/parsers/asp-error.parser.js +0 -48
- package/dist/parsers/asp-error.parser.js.map +0 -1
- package/dist/parsers/bad-words.parser.js +0 -27
- package/dist/parsers/bad-words.parser.js.map +0 -1
- package/dist/parsers/complex-english.parser.d.ts +0 -15
- package/dist/parsers/complex-english.parser.js +0 -61
- package/dist/parsers/complex-english.parser.js.map +0 -1
- package/dist/parsers/data.parser.d.ts +0 -14
- package/dist/parsers/data.parser.js.map +0 -1
- package/dist/parsers/dictionary.parser.js +0 -73
- package/dist/parsers/dictionary.parser.js.map +0 -1
- package/dist/parsers/html.parser.d.ts +0 -13
- package/dist/parsers/html.parser.js.map +0 -1
- package/dist/parsers/hyperlinks.parser.d.ts +0 -20
- package/dist/parsers/hyperlinks.parser.js +0 -115
- package/dist/parsers/hyperlinks.parser.js.map +0 -1
- package/dist/parsers/image-tags.parser.d.ts +0 -19
- package/dist/parsers/image-tags.parser.js +0 -52
- package/dist/parsers/image-tags.parser.js.map +0 -1
- package/dist/parsers/interest.parser.js +0 -69
- package/dist/parsers/interest.parser.js.map +0 -1
- package/dist/parsers/jpeg.parser.d.ts +0 -11
- package/dist/parsers/jpeg.parser.js +0 -39
- package/dist/parsers/jpeg.parser.js.map +0 -1
- package/dist/parsers/llama-guard.parser.js +0 -65
- package/dist/parsers/llama-guard.parser.js.map +0 -1
- package/dist/parsers/offence.parser.js +0 -69
- package/dist/parsers/offence.parser.js.map +0 -1
- package/dist/parsers/ollama.parser.js +0 -51
- package/dist/parsers/ollama.parser.js.map +0 -1
- package/dist/parsers/paragraphs.parser.js +0 -49
- package/dist/parsers/paragraphs.parser.js.map +0 -1
- package/dist/parsers/parser.js +0 -57
- package/dist/parsers/parser.js.map +0 -1
- package/dist/parsers/php-error.parser.d.ts +0 -12
- package/dist/parsers/php-error.parser.js +0 -52
- package/dist/parsers/php-error.parser.js.map +0 -1
- package/dist/parsers/phrase.parser.js +0 -26
- package/dist/parsers/phrase.parser.js.map +0 -1
- package/dist/parsers/regex.parser.js +0 -43
- package/dist/parsers/regex.parser.js.map +0 -1
- package/dist/parsers/server.parser.d.ts +0 -11
- package/dist/parsers/server.parser.js +0 -67
- package/dist/parsers/server.parser.js.map +0 -1
- package/dist/parsers/spelling.parser.js +0 -27
- package/dist/parsers/spelling.parser.js.map +0 -1
- package/dist/parsers/string.parser.d.ts +0 -8
- package/dist/parsers/string.parser.js.map +0 -1
- package/dist/parsers/text.parser.js +0 -41
- package/dist/parsers/text.parser.js.map +0 -1
- package/dist/parsers/words.parser.js +0 -40
- package/dist/parsers/words.parser.js.map +0 -1
- package/dist/queries/complex-english.query.d.ts +0 -2
- package/dist/queries/complex-english.query.js.map +0 -1
- package/dist/queries/flash-content.query.d.ts +0 -2
- package/dist/queries/flash-content.query.js +0 -82
- package/dist/queries/flash-content.query.js.map +0 -1
- package/dist/queries/linking-to-domains.query.d.ts +0 -2
- package/dist/queries/linking-to-domains.query.js +0 -130
- package/dist/queries/linking-to-domains.query.js.map +0 -1
- package/dist/queries/llamaguard-unsafe-content.query.d.ts +0 -2
- package/dist/queries/llamaguard-unsafe-content.query.js +0 -92
- package/dist/queries/llamaguard-unsafe-content.query.js.map +0 -1
- package/dist/queries/readability-score.query.d.ts +0 -2
- package/dist/queries/readability-score.query.js.map +0 -1
- package/dist/servers/crawl.server.js +0 -198
- package/dist/servers/crawl.server.js.map +0 -1
- package/dist/servers/express.server.js +0 -13
- package/dist/servers/express.server.js.map +0 -1
- package/dist/servers/maintenance.server.js +0 -103
- package/dist/servers/maintenance.server.js.map +0 -1
- package/dist/servers/rest.server.js +0 -46
- package/dist/servers/rest.server.js.map +0 -1
- package/dist/servers/socket-io.server.js +0 -61
- package/dist/servers/socket-io.server.js.map +0 -1
- package/dist/services/database.service.js +0 -795
- package/dist/services/database.service.js.map +0 -1
- package/dist/services/ollama-rest.service.js +0 -46
- package/dist/services/ollama-rest.service.js.map +0 -1
- package/dist/services/rig-llama-guard.service.js.map +0 -1
- package/dist/services/rig-queue-length.service.js +0 -22
- package/dist/services/rig-queue-length.service.js.map +0 -1
- package/dist/services/rig-subjectivity-scale.service.js +0 -96
- package/dist/services/rig-subjectivity-scale.service.js.map +0 -1
- package/dist/services/rig-ticket-rest.service.js +0 -29
- package/dist/services/rig-ticket-rest.service.js.map +0 -1
- package/dist/services/rig-ticketed-promise.service.js.map +0 -1
- package/dist/types/tcrawl-config.js.map +0 -1
- package/dist/types/thydra-config.js.map +0 -1
- package/dist/types/tparser-ctor.d.ts +0 -7
- package/dist/types/tparser-ctor.js +0 -2
- package/dist/types/tparser-ctor.js.map +0 -1
- package/dist/types/tquery.d.ts +0 -7
- package/dist/types/tquery.js +0 -2
- package/dist/types/tquery.js.map +0 -1
- package/dist/types/tqueue-length.js +0 -2
- package/dist/types/tqueue-length.js.map +0 -1
- package/dist/types/trobots-config.js.map +0 -1
- /package/dist/classes/{dns.d.ts → dns.d.mts} +0 -0
- /package/dist/{cli.d.ts → cli.d.mts} +0 -0
- /package/dist/enums/{eavailable-strategy.d.ts → eavailable-strategy.d.mts} +0 -0
- /package/dist/enums/{elist.d.ts → elist.d.mts} +0 -0
- /package/dist/enums/{eserver.d.ts → eserver.d.mts} +0 -0
- /package/dist/enums/{ex-powered-by.d.ts → ex-powered-by.d.mts} +0 -0
- /package/dist/interfaces/{imatch.d.ts → imatch.d.mts} +0 -0
- /package/dist/interfaces/{iparser-config.d.ts → iparser-config.d.mts} +0 -0
- /package/dist/interfaces/{iserver.d.ts → iserver.d.mts} +0 -0
- /package/dist/types/{tcrawl-config.d.ts → tcrawl-config.d.mts} +0 -0
- /package/dist/types/{thydra-config.d.ts → thydra-config.d.mts} +0 -0
- /package/dist/types/{tqueue-length.d.ts → tqueue-length.d.mts} +0 -0
- /package/dist/types/{trobots-config.d.ts → trobots-config.d.mts} +0 -0
|
@@ -1,82 +0,0 @@
|
|
|
1
|
-
var __awaiter = (this && this.__awaiter) || function (thisArg, _arguments, P, generator) {
|
|
2
|
-
function adopt(value) { return value instanceof P ? value : new P(function (resolve) { resolve(value); }); }
|
|
3
|
-
return new (P || (P = Promise))(function (resolve, reject) {
|
|
4
|
-
function fulfilled(value) { try { step(generator.next(value)); } catch (e) { reject(e); } }
|
|
5
|
-
function rejected(value) { try { step(generator["throw"](value)); } catch (e) { reject(e); } }
|
|
6
|
-
function step(result) { result.done ? resolve(result.value) : adopt(result.value).then(fulfilled, rejected); }
|
|
7
|
-
step((generator = generator.apply(thisArg, _arguments || [])).next());
|
|
8
|
-
});
|
|
9
|
-
};
|
|
10
|
-
import { ECommonsCsvColumnType } from 'tscommons-es-format';
|
|
11
|
-
import { isIUrl } from 'hydra-crawler-ts-assets';
|
|
12
|
-
import { isTLink } from 'hydra-crawler-ts-assets';
|
|
13
|
-
import { EStatus } from 'hydra-crawler-ts-assets';
|
|
14
|
-
import { commonsOutputDoing, commonsOutputProgress, commonsOutputResult, commonsOutputSuccess } from 'nodecommons-es-cli';
|
|
15
|
-
import { CommonsCsv } from 'nodecommons-es-file';
|
|
16
|
-
export const QUERY = (args, databaseService, _lists, _expiry, _parsersConfig) => __awaiter(void 0, void 0, void 0, function* () {
|
|
17
|
-
const filename = args.getString('filename');
|
|
18
|
-
commonsOutputDoing('Searching for FLV and SWF URLs');
|
|
19
|
-
const results = databaseService.getUrls().find({
|
|
20
|
-
url: /\.(flv|swf)$/i,
|
|
21
|
-
status: { $in: [
|
|
22
|
-
EStatus.ACTIVE,
|
|
23
|
-
EStatus.DENY,
|
|
24
|
-
EStatus.DISALLOWED,
|
|
25
|
-
EStatus.DONE,
|
|
26
|
-
EStatus.FAILED,
|
|
27
|
-
EStatus.QUEUED
|
|
28
|
-
] }
|
|
29
|
-
}, {});
|
|
30
|
-
const urls = yield databaseService.listQueryResults(results, isIUrl);
|
|
31
|
-
commonsOutputResult(urls.length);
|
|
32
|
-
commonsOutputDoing('Searching for outgoing links to URLs');
|
|
33
|
-
let tally = 0;
|
|
34
|
-
const urlLinks = new Map();
|
|
35
|
-
for (const url of urls) {
|
|
36
|
-
const results3 = databaseService.getLinks().find({
|
|
37
|
-
outgoing: url.url
|
|
38
|
-
}, {});
|
|
39
|
-
const links = yield databaseService.listQueryResults(results3, isTLink);
|
|
40
|
-
if (links.length === 0)
|
|
41
|
-
continue;
|
|
42
|
-
tally += links.length;
|
|
43
|
-
commonsOutputProgress(tally);
|
|
44
|
-
urlLinks.set(url, links);
|
|
45
|
-
}
|
|
46
|
-
commonsOutputResult(tally);
|
|
47
|
-
commonsOutputDoing('Building CSV array');
|
|
48
|
-
const rows = [];
|
|
49
|
-
for (const url of urls) {
|
|
50
|
-
for (const link of (urlLinks.get(url) || [])) {
|
|
51
|
-
rows.push({
|
|
52
|
-
src: link.url,
|
|
53
|
-
dest: url.url
|
|
54
|
-
});
|
|
55
|
-
}
|
|
56
|
-
}
|
|
57
|
-
rows
|
|
58
|
-
.sort((a, b) => {
|
|
59
|
-
if (a.src < b.src)
|
|
60
|
-
return -1;
|
|
61
|
-
if (a.src > b.src)
|
|
62
|
-
return 1;
|
|
63
|
-
if (a.dest < b.dest)
|
|
64
|
-
return -1;
|
|
65
|
-
if (a.dest > b.dest)
|
|
66
|
-
return 1;
|
|
67
|
-
return 0;
|
|
68
|
-
});
|
|
69
|
-
commonsOutputSuccess();
|
|
70
|
-
const csv = new CommonsCsv([
|
|
71
|
-
{
|
|
72
|
-
name: 'src',
|
|
73
|
-
type: ECommonsCsvColumnType.STRING
|
|
74
|
-
},
|
|
75
|
-
{
|
|
76
|
-
name: 'dest',
|
|
77
|
-
type: ECommonsCsvColumnType.STRING
|
|
78
|
-
}
|
|
79
|
-
]);
|
|
80
|
-
csv.save(rows, filename, true);
|
|
81
|
-
});
|
|
82
|
-
//# sourceMappingURL=flash-content.query.js.map
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"flash-content.query.js","sourceRoot":"","sources":["../../src/queries/flash-content.query.ts"],"names":[],"mappings":";;;;;;;;;AAGA,OAAO,EAAE,qBAAqB,EAAE,MAAM,qBAAqB,CAAC;AAE5D,OAAO,EAAQ,MAAM,EAAE,MAAM,yBAAyB,CAAC;AACvD,OAAO,EAAS,OAAO,EAAE,MAAM,yBAAyB,CAAC;AACzD,OAAO,EAAE,OAAO,EAAE,MAAM,yBAAyB,CAAC;AAElD,OAAO,EAAe,kBAAkB,EAAE,qBAAqB,EAAE,mBAAmB,EAAE,oBAAoB,EAAE,MAAM,oBAAoB,CAAC;AACvI,OAAO,EAAE,UAAU,EAAE,MAAM,qBAAqB,CAAC;AAgBjD,MAAM,CAAC,MAAM,KAAK,GAAW,CAC3B,IAAiB,EACjB,eAAgC,EAChC,MAAa,EACb,OAAe,EACf,cAAyC,EAC1B,EAAE;IAClB,MAAM,QAAQ,GAAW,IAAI,CAAC,SAAS,CAAC,UAAU,CAAC,CAAC;IAEpD,kBAAkB,CAAC,gCAAgC,CAAC,CAAC;IACrD,MAAM,OAAO,GAA6B,eAAe,CAAC,OAAO,EAAE,CAAC,IAAI,CACtE;QACE,GAAG,EAAE,eAAe;QACpB,MAAM,EAAE,EAAE,GAAG,EAAE;gBACb,OAAO,CAAC,MAAM;gBACd,OAAO,CAAC,IAAI;gBACZ,OAAO,CAAC,UAAU;gBAClB,OAAO,CAAC,IAAI;gBACZ,OAAO,CAAC,MAAM;gBACd,OAAO,CAAC,MAAM;aACf,EAAE;KACJ,EACD,EAAE,CACH,CAAC;IACF,MAAM,IAAI,GAAW,MAAM,eAAe,CAAC,gBAAgB,CACzD,OAAO,EACP,MAAM,CACP,CAAC;IACF,mBAAmB,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;IAEjC,kBAAkB,CAAC,sCAAsC,CAAC,CAAC;IAC3D,IAAI,KAAK,GAAW,CAAC,CAAC;IACtB,MAAM,QAAQ,GAAuB,IAAI,GAAG,EAAiB,CAAC;IAC9D,KAAK,MAAM,GAAG,IAAI,IAAI,EAAE;QACvB,MAAM,QAAQ,GAA8B,eAAe,CAAC,QAAQ,EAAE,CAAC,IAAI,CACzE;YACE,QAAQ,EAAE,GAAG,CAAC,GAAG;SAClB,EACD,EAAE,CACH,CAAC;QACF,MAAM,KAAK,GAAY,MAAM,eAAe,CAAC,gBAAgB,CAC3D,QAAQ,EACR,OAAO,CACR,CAAC;QAEF,IAAI,KAAK,CAAC,MAAM,KAAK,CAAC;YAAE,SAAS;QAEjC,KAAK,IAAI,KAAK,CAAC,MAAM,CAAC;QACtB,qBAAqB,CAAC,KAAK,CAAC,CAAC;QAE7B,QAAQ,CAAC,GAAG,CAAC,GAAG,EAAE,KAAK,CAAC,CAAC;KACzB;IACD,mBAAmB,CAAC,KAAK,CAAC,CAAC;IAE3B,kBAAkB,CAAC,oBAAoB,CAAC,CAAC;IAEzC,MAAM,IAAI,GAAW,EAAE,CAAC;IACxB,KAAK,MAAM,GAAG,IAAI,IAAI,EAAE;QACvB,KAAK,MAAM,IAAI,IAAI,CAAC,QAAQ,CAAC,GAAG,CAAC,GAAG,CAAC,IAAI,EAAE,CAAC,EAAE;YAC7C,IAAI,CAAC,IAAI,CAAC;gBACR,GAAG,EAAE,IAAI,CAAC,GAAG;gBACb,IAAI,EAAE,GAAG,CAAC,GAAG;aACd,CAAC,CAAC;SACH;KACD;IACD,IAAI;SACD,IAAI,CAAC,CAAC,CAAO,EAAE,CAAO,EAAU,EAAE;QAClC,IAAI,CAAC,CAAC,GAAG,GAAG,CAAC,CAAC,GAAG;YAAE,OAAO,CAAC,CAAC,CAAC;QAC7B,IAAI,CAAC,CAAC,GAAG,GAAG,CAAC,CAAC,GAAG;YAAE,OAAO,CAAC,CAAC;QAC5B,IAAI,CAAC,CAAC,IAAI,GAAG,CAAC,CAAC,IAAI;YAAE,OAAO,CAAC,CAAC,CAAC;QAC/B,IAAI,CAAC,CAAC,IAAI,GAAG,CAAC,CAAC,IAAI;YAAE,OAAO,CAAC,CAAC;QAC9B,OAAO,CAAC,CAAC;IACV,CAAC,CAAC,CAAC;IAEL,oBAAoB,EAAE,CAAC;IAEvB,MAAM,GAAG,GAAe,IAAI,UAAU,CAAC;QACrC;YACE,IAAI,EAAE,KAAK;YACX,IAAI,EAAE,qBAAqB,CAAC,MAAM;SACnC;QACD;YACE,IAAI,EAAE,MAAM;YACZ,IAAI,EAAE,qBAAqB,CAAC,MAAM;SACnC;KACF,CAAC,CAAC;IACH,GAAG,CAAC,IAAI,CACN,IAAI,EACJ,QAAQ,EACR,IAAI,CACL,CAAC;AACH,CAAC,CAAA,CAAC"}
|
|
@@ -1,130 +0,0 @@
|
|
|
1
|
-
var __awaiter = (this && this.__awaiter) || function (thisArg, _arguments, P, generator) {
|
|
2
|
-
function adopt(value) { return value instanceof P ? value : new P(function (resolve) { resolve(value); }); }
|
|
3
|
-
return new (P || (P = Promise))(function (resolve, reject) {
|
|
4
|
-
function fulfilled(value) { try { step(generator.next(value)); } catch (e) { reject(e); } }
|
|
5
|
-
function rejected(value) { try { step(generator["throw"](value)); } catch (e) { reject(e); } }
|
|
6
|
-
function step(result) { result.done ? resolve(result.value) : adopt(result.value).then(fulfilled, rejected); }
|
|
7
|
-
step((generator = generator.apply(thisArg, _arguments || [])).next());
|
|
8
|
-
});
|
|
9
|
-
};
|
|
10
|
-
import { isIUrl } from 'hydra-crawler-ts-assets';
|
|
11
|
-
import { isTLink } from 'hydra-crawler-ts-assets';
|
|
12
|
-
import { isTDomain } from 'hydra-crawler-ts-assets';
|
|
13
|
-
import { EStatus } from 'hydra-crawler-ts-assets';
|
|
14
|
-
import { commonsOutputDoing, commonsOutputError, commonsOutputProgress, commonsOutputResult, commonsOutputSuccess } from 'nodecommons-es-cli';
|
|
15
|
-
const domainSort = (a, b) => {
|
|
16
|
-
if (a.startsWith('http://'))
|
|
17
|
-
a = a.substr(7);
|
|
18
|
-
if (a.startsWith('https://'))
|
|
19
|
-
a = a.substr(8);
|
|
20
|
-
if (a.startsWith('www.'))
|
|
21
|
-
a = a.substr(4);
|
|
22
|
-
if (b.startsWith('http://'))
|
|
23
|
-
b = b.substr(7);
|
|
24
|
-
if (b.startsWith('https://'))
|
|
25
|
-
b = b.substr(8);
|
|
26
|
-
if (b.startsWith('www.'))
|
|
27
|
-
b = b.substr(4);
|
|
28
|
-
if (a < b)
|
|
29
|
-
return -1;
|
|
30
|
-
if (a > b)
|
|
31
|
-
return 1;
|
|
32
|
-
return 0;
|
|
33
|
-
};
|
|
34
|
-
export const QUERY = (args, databaseService, _lists, _expiry, _parsersConfig) => __awaiter(void 0, void 0, void 0, function* () {
|
|
35
|
-
const regexStr = args.getString('regex');
|
|
36
|
-
if (!regexStr) {
|
|
37
|
-
commonsOutputError('No domain regex specified');
|
|
38
|
-
return;
|
|
39
|
-
}
|
|
40
|
-
const regex = new RegExp(regexStr);
|
|
41
|
-
commonsOutputDoing('Searching for matching domains');
|
|
42
|
-
const results = databaseService.getDomains().find({
|
|
43
|
-
domain: regex
|
|
44
|
-
}, {});
|
|
45
|
-
const domains = yield databaseService.listQueryResults(results, isTDomain);
|
|
46
|
-
commonsOutputResult(domains.length);
|
|
47
|
-
const domainUrls = new Map();
|
|
48
|
-
for (const domain of domains) {
|
|
49
|
-
commonsOutputDoing(`Searching for URLs for ${domain.domain}`);
|
|
50
|
-
const results2 = databaseService.getUrls().find({
|
|
51
|
-
domain: domain.domain,
|
|
52
|
-
status: { $ne: EStatus.ARCHIVED }
|
|
53
|
-
}, {});
|
|
54
|
-
const urls = yield databaseService.listQueryResults(results2, isIUrl);
|
|
55
|
-
commonsOutputResult(urls.length);
|
|
56
|
-
domainUrls.set(domain, urls);
|
|
57
|
-
}
|
|
58
|
-
commonsOutputDoing('Searching for outgoing links to URLs');
|
|
59
|
-
let tally = 0;
|
|
60
|
-
const domainUrlLinks = new Map();
|
|
61
|
-
for (const domain of domains) {
|
|
62
|
-
const urls = domainUrls.get(domain);
|
|
63
|
-
if (!urls || !urls.length)
|
|
64
|
-
continue;
|
|
65
|
-
const map = new Map();
|
|
66
|
-
for (const url of urls) {
|
|
67
|
-
const results3 = databaseService.getLinks().find({
|
|
68
|
-
outgoing: url.url
|
|
69
|
-
}, {});
|
|
70
|
-
const links = yield databaseService.listQueryResults(results3, isTLink);
|
|
71
|
-
if (links.length === 0)
|
|
72
|
-
continue;
|
|
73
|
-
tally += links.length;
|
|
74
|
-
commonsOutputProgress(tally);
|
|
75
|
-
map.set(url, links);
|
|
76
|
-
}
|
|
77
|
-
if (map.size === 0)
|
|
78
|
-
continue;
|
|
79
|
-
domainUrlLinks.set(domain, map);
|
|
80
|
-
}
|
|
81
|
-
commonsOutputResult(tally);
|
|
82
|
-
commonsOutputDoing('Constructing JSON object');
|
|
83
|
-
const outcome = {};
|
|
84
|
-
for (const domain of domainUrlLinks.keys()) {
|
|
85
|
-
outcome[domain.domain] = {};
|
|
86
|
-
for (const url of domainUrlLinks.get(domain).keys()) {
|
|
87
|
-
outcome[domain.domain][url.url] = domainUrlLinks.get(domain).get(url)
|
|
88
|
-
.map((link) => link.url);
|
|
89
|
-
}
|
|
90
|
-
}
|
|
91
|
-
commonsOutputSuccess();
|
|
92
|
-
if (args.hasAttribute('domains-only')) {
|
|
93
|
-
Object.keys(outcome)
|
|
94
|
-
.sort(domainSort)
|
|
95
|
-
.forEach((domain) => {
|
|
96
|
-
console.log(domain);
|
|
97
|
-
});
|
|
98
|
-
}
|
|
99
|
-
else if (args.hasAttribute('url-list')) {
|
|
100
|
-
const reverseMap = new Map();
|
|
101
|
-
for (const domain of Object.keys(outcome)) {
|
|
102
|
-
for (const out of Object.keys(outcome[domain])) {
|
|
103
|
-
for (const url of outcome[domain][out]) {
|
|
104
|
-
if (!reverseMap.has(url))
|
|
105
|
-
reverseMap.set(url, []);
|
|
106
|
-
if (!reverseMap.get(url).includes(out))
|
|
107
|
-
reverseMap.get(url).push(out);
|
|
108
|
-
}
|
|
109
|
-
}
|
|
110
|
-
}
|
|
111
|
-
const urls = Array.from(reverseMap.keys())
|
|
112
|
-
.sort(domainSort);
|
|
113
|
-
for (const url of urls) {
|
|
114
|
-
reverseMap.get(url).sort(domainSort);
|
|
115
|
-
let first = true;
|
|
116
|
-
for (const out of reverseMap.get(url)) {
|
|
117
|
-
const tsv = [
|
|
118
|
-
first ? url : '',
|
|
119
|
-
out
|
|
120
|
-
];
|
|
121
|
-
console.log(tsv.join('\t'));
|
|
122
|
-
first = false;
|
|
123
|
-
}
|
|
124
|
-
}
|
|
125
|
-
}
|
|
126
|
-
else if (args.hasAttribute('json-dump')) {
|
|
127
|
-
console.log(JSON.stringify(outcome));
|
|
128
|
-
}
|
|
129
|
-
});
|
|
130
|
-
//# sourceMappingURL=linking-to-domains.query.js.map
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"linking-to-domains.query.js","sourceRoot":"","sources":["../../src/queries/linking-to-domains.query.ts"],"names":[],"mappings":";;;;;;;;;AAIA,OAAO,EAAQ,MAAM,EAAE,MAAM,yBAAyB,CAAC;AACvD,OAAO,EAAS,OAAO,EAAE,MAAM,yBAAyB,CAAC;AACzD,OAAO,EAAW,SAAS,EAAE,MAAM,yBAAyB,CAAC;AAC7D,OAAO,EAAE,OAAO,EAAE,MAAM,yBAAyB,CAAC;AAElD,OAAO,EAAe,kBAAkB,EAAE,kBAAkB,EAAE,qBAAqB,EAAE,mBAAmB,EAAE,oBAAoB,EAAE,MAAM,oBAAoB,CAAC;AAiB3J,MAAM,UAAU,GAAqC,CAAC,CAAS,EAAE,CAAS,EAAU,EAAE;IACrF,IAAI,CAAC,CAAC,UAAU,CAAC,SAAS,CAAC;QAAE,CAAC,GAAG,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC;IAC7C,IAAI,CAAC,CAAC,UAAU,CAAC,UAAU,CAAC;QAAE,CAAC,GAAG,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC;IAC9C,IAAI,CAAC,CAAC,UAAU,CAAC,MAAM,CAAC;QAAE,CAAC,GAAG,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC;IAC1C,IAAI,CAAC,CAAC,UAAU,CAAC,SAAS,CAAC;QAAE,CAAC,GAAG,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC;IAC7C,IAAI,CAAC,CAAC,UAAU,CAAC,UAAU,CAAC;QAAE,CAAC,GAAG,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC;IAC9C,IAAI,CAAC,CAAC,UAAU,CAAC,MAAM,CAAC;QAAE,CAAC,GAAG,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC;IAE1C,IAAI,CAAC,GAAG,CAAC;QAAE,OAAO,CAAC,CAAC,CAAC;IACrB,IAAI,CAAC,GAAG,CAAC;QAAE,OAAO,CAAC,CAAC;IACpB,OAAO,CAAC,CAAC;AACV,CAAC,CAAC;AAEF,MAAM,CAAC,MAAM,KAAK,GAAW,CAC3B,IAAiB,EACjB,eAAgC,EAChC,MAAa,EACb,OAAe,EACf,cAAyC,EAC1B,EAAE;IAClB,MAAM,QAAQ,GAAqB,IAAI,CAAC,SAAS,CAAC,OAAO,CAAC,CAAC;IAC3D,IAAI,CAAC,QAAQ,EAAE;QACd,kBAAkB,CAAC,2BAA2B,CAAC,CAAC;QAChD,OAAO;KACP;IACD,MAAM,KAAK,GAAW,IAAI,MAAM,CAAC,QAAQ,CAAC,CAAC;IAE3C,kBAAkB,CAAC,gCAAgC,CAAC,CAAC;IACrD,MAAM,OAAO,GAAgC,eAAe,CAAC,UAAU,EAAE,CAAC,IAAI,CAC5E;QACE,MAAM,EAAE,KAAK;KACd,EACD,EAAE,CACH,CAAC;IACF,MAAM,OAAO,GAAc,MAAM,eAAe,CAAC,gBAAgB,CAC/D,OAAO,EACP,SAAS,CACV,CAAC;IACF,mBAAmB,CAAC,OAAO,CAAC,MAAM,CAAC,CAAC;IAEpC,MAAM,UAAU,GAAyB,IAAI,GAAG,EAAmB,CAAC;IACpE,KAAK,MAAM,MAAM,IAAI,OAAO,EAAE;QAC7B,kBAAkB,CAAC,0BAA0B,MAAM,CAAC,MAAM,EAAE,CAAC,CAAC;QAC9D,MAAM,QAAQ,GAA6B,eAAe,CAAC,OAAO,EAAE,CAAC,IAAI,CACvE;YACE,MAAM,EAAE,MAAM,CAAC,MAAM;YACrB,MAAM,EAAE,EAAE,GAAG,EAAE,OAAO,CAAC,QAAQ,EAAE;SAClC,EACD,EAAE,CACH,CAAC;QACF,MAAM,IAAI,GAAW,MAAM,eAAe,CAAC,gBAAgB,CACzD,QAAQ,EACR,MAAM,CACP,CAAC;QACF,mBAAmB,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;QAEjC,UAAU,CAAC,GAAG,CAAC,MAAM,EAAE,IAAI,CAAC,CAAC;KAC7B;IAED,kBAAkB,CAAC,sCAAsC,CAAC,CAAC;IAC3D,IAAI,KAAK,GAAW,CAAC,CAAC;IACtB,MAAM,cAAc,GAAqC,IAAI,GAAG,EAA+B,CAAC;IAChG,KAAK,MAAM,MAAM,IAAI,OAAO,EAAE;QAC7B,MAAM,IAAI,GAAqB,UAAU,CAAC,GAAG,CAAC,MAAM,CAAC,CAAC;QACtD,IAAI,CAAC,IAAI,IAAI,CAAC,IAAI,CAAC,MAAM;YAAE,SAAS;QAEpC,MAAM,GAAG,GAAuB,IAAI,GAAG,EAAiB,CAAC;QAEzD,KAAK,MAAM,GAAG,IAAI,IAAI,EAAE;YACvB,MAAM,QAAQ,GAA8B,eAAe,CAAC,QAAQ,EAAE,CAAC,IAAI,CACzE;gBACE,QAAQ,EAAE,GAAG,CAAC,GAAG;aAClB,EACD,EAAE,CACH,CAAC;YACF,MAAM,KAAK,GAAY,MAAM,eAAe,CAAC,gBAAgB,CAC3D,QAAQ,EACR,OAAO,CACR,CAAC;YAEF,IAAI,KAAK,CAAC,MAAM,KAAK,CAAC;gBAAE,SAAS;YAEjC,KAAK,IAAI,KAAK,CAAC,MAAM,CAAC;YACtB,qBAAqB,CAAC,KAAK,CAAC,CAAC;YAE7B,GAAG,CAAC,GAAG,CAAC,GAAG,EAAE,KAAK,CAAC,CAAC;SACpB;QAED,IAAI,GAAG,CAAC,IAAI,KAAK,CAAC;YAAE,SAAS;QAE7B,cAAc,CAAC,GAAG,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;KAChC;IACD,mBAAmB,CAAC,KAAK,CAAC,CAAC;IAE3B,kBAAkB,CAAC,0BAA0B,CAAC,CAAC;IAC/C,MAAM,OAAO,GAAa,EAAE,CAAC;IAC7B,KAAK,MAAM,MAAM,IAAI,cAAc,CAAC,IAAI,EAAE,EAAE;QAC3C,OAAO,CAAC,MAAM,CAAC,MAAM,CAAC,GAAG,EAAE,CAAC;QAE5B,KAAK,MAAM,GAAG,IAAI,cAAc,CAAC,GAAG,CAAC,MAAM,CAAE,CAAC,IAAI,EAAE,EAAE;YACrD,OAAO,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC,GAAG,CAAC,GAAG,CAAC,GAAG,cAAc,CAAC,GAAG,CAAC,MAAM,CAAE,CAAC,GAAG,CAAC,GAAG,CAAE;iBACpE,GAAG,CAAC,CAAC,IAAW,EAAU,EAAE,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;SAC1C;KACD;IACD,oBAAoB,EAAE,CAAC;IAEvB,IAAI,IAAI,CAAC,YAAY,CAAC,cAAc,CAAC,EAAE;QACtC,MAAM,CAAC,IAAI,CAAC,OAAO,CAAC;aACjB,IAAI,CAAC,UAAU,CAAC;aAChB,OAAO,CAAC,CAAC,MAAc,EAAQ,EAAE;YACjC,OAAO,CAAC,GAAG,CAAC,MAAM,CAAC,CAAC;QACrB,CAAC,CAAC,CAAC;KACL;SAAM,IAAI,IAAI,CAAC,YAAY,CAAC,UAAU,CAAC,EAAE;QACzC,MAAM,UAAU,GAA0B,IAAI,GAAG,EAAoB,CAAC;QAEtE,KAAK,MAAM,MAAM,IAAI,MAAM,CAAC,IAAI,CAAC,OAAO,CAAC,EAAE;YAC1C,KAAK,MAAM,GAAG,IAAI,MAAM,CAAC,IAAI,CAAC,OAAO,CAAC,MAAM,CAAC,CAAC,EAAE;gBAC/C,KAAK,MAAM,GAAG,IAAI,OAAO,CAAC,MAAM,CAAC,CAAC,GAAG,CAAC,EAAE;oBACvC,IAAI,CAAC,UAAU,CAAC,GAAG,CAAC,GAAG,CAAC;wBAAE,UAAU,CAAC,GAAG,CAAC,GAAG,EAAE,EAAE,CAAC,CAAC;oBAClD,IAAI,CAAC,UAAU,CAAC,GAAG,CAAC,GAAG,CAAE,CAAC,QAAQ,CAAC,GAAG,CAAC;wBAAE,UAAU,CAAC,GAAG,CAAC,GAAG,CAAE,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;iBACxE;aACD;SACD;QAED,MAAM,IAAI,GAAa,KAAK,CAAC,IAAI,CAAC,UAAU,CAAC,IAAI,EAAE,CAAC;aACjD,IAAI,CAAC,UAAU,CAAC,CAAC;QACpB,KAAK,MAAM,GAAG,IAAI,IAAI,EAAE;YACvB,UAAU,CAAC,GAAG,CAAC,GAAG,CAAE,CAAC,IAAI,CAAC,UAAU,CAAC,CAAC;YAEtC,IAAI,KAAK,GAAY,IAAI,CAAC;YAC1B,KAAK,MAAM,GAAG,IAAI,UAAU,CAAC,GAAG,CAAC,GAAG,CAAE,EAAE;gBACvC,MAAM,GAAG,GAAa;oBACpB,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE;oBAChB,GAAG;iBACJ,CAAC;gBACF,OAAO,CAAC,GAAG,CAAC,GAAG,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC,CAAC;gBAE5B,KAAK,GAAG,KAAK,CAAC;aACd;SACD;KACD;SAAM,IAAI,IAAI,CAAC,YAAY,CAAC,WAAW,CAAC,EAAE;QAC1C,OAAO,CAAC,GAAG,CAAC,IAAI,CAAC,SAAS,CAAC,OAAO,CAAC,CAAC,CAAC;KACrC;AACF,CAAC,CAAA,CAAC"}
|
|
@@ -1,92 +0,0 @@
|
|
|
1
|
-
var __awaiter = (this && this.__awaiter) || function (thisArg, _arguments, P, generator) {
|
|
2
|
-
function adopt(value) { return value instanceof P ? value : new P(function (resolve) { resolve(value); }); }
|
|
3
|
-
return new (P || (P = Promise))(function (resolve, reject) {
|
|
4
|
-
function fulfilled(value) { try { step(generator.next(value)); } catch (e) { reject(e); } }
|
|
5
|
-
function rejected(value) { try { step(generator["throw"](value)); } catch (e) { reject(e); } }
|
|
6
|
-
function step(result) { result.done ? resolve(result.value) : adopt(result.value).then(fulfilled, rejected); }
|
|
7
|
-
step((generator = generator.apply(thisArg, _arguments || [])).next());
|
|
8
|
-
});
|
|
9
|
-
};
|
|
10
|
-
import { ECommonsCsvColumnType } from 'tscommons-es-format';
|
|
11
|
-
import { EStatus } from 'hydra-crawler-ts-assets';
|
|
12
|
-
import { commonsOutputDoing, commonsOutputResult, commonsOutputSuccess } from 'nodecommons-es-cli';
|
|
13
|
-
import { CommonsCsv } from 'nodecommons-es-file';
|
|
14
|
-
import { ELLAMA_GUARD_CATEGORYS, prettyLlamaGuardCategory } from '../services/rig-llama-guard.service';
|
|
15
|
-
export const QUERY = (args, databaseService, _lists, _expiry, _parsersConfig) => __awaiter(void 0, void 0, void 0, function* () {
|
|
16
|
-
const filename = args.getString('filename');
|
|
17
|
-
commonsOutputDoing('Searching for URLs marked unsafe');
|
|
18
|
-
const results = databaseService.getUrls().find({
|
|
19
|
-
'llamaguard.classification': 'unsafe',
|
|
20
|
-
status: { $in: [
|
|
21
|
-
EStatus.ACTIVE,
|
|
22
|
-
EStatus.DENY,
|
|
23
|
-
EStatus.DISALLOWED,
|
|
24
|
-
EStatus.DONE,
|
|
25
|
-
EStatus.FAILED,
|
|
26
|
-
EStatus.QUEUED
|
|
27
|
-
] }
|
|
28
|
-
}, {});
|
|
29
|
-
const urls = yield databaseService.listQueryResults(results, (_t) => true);
|
|
30
|
-
commonsOutputResult(urls.length);
|
|
31
|
-
commonsOutputDoing('Inverting categorisation');
|
|
32
|
-
const map = new Map();
|
|
33
|
-
for (const category of ELLAMA_GUARD_CATEGORYS)
|
|
34
|
-
map.set(category, []);
|
|
35
|
-
for (const url of urls) {
|
|
36
|
-
if (url.llamaguard.classification === 'safe')
|
|
37
|
-
continue;
|
|
38
|
-
for (const category of url.llamaguard.categories)
|
|
39
|
-
map.get(category).push(url);
|
|
40
|
-
}
|
|
41
|
-
commonsOutputSuccess();
|
|
42
|
-
commonsOutputDoing('Building CSV array');
|
|
43
|
-
const rows = [];
|
|
44
|
-
for (const category of ELLAMA_GUARD_CATEGORYS) {
|
|
45
|
-
const meaning = prettyLlamaGuardCategory(category);
|
|
46
|
-
for (const url of map.get(category)) {
|
|
47
|
-
rows.push({
|
|
48
|
-
category: category,
|
|
49
|
-
meaning: meaning,
|
|
50
|
-
domain: url.domain,
|
|
51
|
-
url: url.url
|
|
52
|
-
});
|
|
53
|
-
}
|
|
54
|
-
}
|
|
55
|
-
rows
|
|
56
|
-
.sort((a, b) => {
|
|
57
|
-
if (a.category < b.category)
|
|
58
|
-
return -1;
|
|
59
|
-
if (a.category > b.category)
|
|
60
|
-
return 1;
|
|
61
|
-
if (a.domain < b.domain)
|
|
62
|
-
return -1;
|
|
63
|
-
if (a.domain > b.domain)
|
|
64
|
-
return 1;
|
|
65
|
-
if (a.url < b.url)
|
|
66
|
-
return -1;
|
|
67
|
-
if (a.url > b.url)
|
|
68
|
-
return 1;
|
|
69
|
-
return 0;
|
|
70
|
-
});
|
|
71
|
-
commonsOutputSuccess();
|
|
72
|
-
const csv = new CommonsCsv([
|
|
73
|
-
{
|
|
74
|
-
name: 'category',
|
|
75
|
-
type: ECommonsCsvColumnType.STRING
|
|
76
|
-
},
|
|
77
|
-
{
|
|
78
|
-
name: 'meaning',
|
|
79
|
-
type: ECommonsCsvColumnType.STRING
|
|
80
|
-
},
|
|
81
|
-
{
|
|
82
|
-
name: 'domain',
|
|
83
|
-
type: ECommonsCsvColumnType.STRING
|
|
84
|
-
},
|
|
85
|
-
{
|
|
86
|
-
name: 'url',
|
|
87
|
-
type: ECommonsCsvColumnType.STRING
|
|
88
|
-
}
|
|
89
|
-
]);
|
|
90
|
-
csv.save(rows, filename, true);
|
|
91
|
-
});
|
|
92
|
-
//# sourceMappingURL=llamaguard-unsafe-content.query.js.map
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"llamaguard-unsafe-content.query.js","sourceRoot":"","sources":["../../src/queries/llamaguard-unsafe-content.query.ts"],"names":[],"mappings":";;;;;;;;;AAGA,OAAO,EAAE,qBAAqB,EAAE,MAAM,qBAAqB,CAAC;AAG5D,OAAO,EAAE,OAAO,EAAE,MAAM,yBAAyB,CAAC;AAElD,OAAO,EAAe,kBAAkB,EAAE,mBAAmB,EAAE,oBAAoB,EAAE,MAAM,oBAAoB,CAAC;AAChH,OAAO,EAAE,UAAU,EAAE,MAAM,qBAAqB,CAAC;AAMjD,OAAO,EAAE,sBAAsB,EAAuB,wBAAwB,EAAqB,MAAM,qCAAqC,CAAC;AAe/I,MAAM,CAAC,MAAM,KAAK,GAAW,CAC3B,IAAiB,EACjB,eAAgC,EAChC,MAAa,EACb,OAAe,EACf,cAAyC,EAC1B,EAAE;IAClB,MAAM,QAAQ,GAAW,IAAI,CAAC,SAAS,CAAC,UAAU,CAAC,CAAC;IAEpD,kBAAkB,CAAC,kCAAkC,CAAC,CAAC;IACvD,MAAM,OAAO,GAA2C,eAAe,CAAC,OAAO,EAAE,CAAC,IAAI,CACpF;QACE,2BAA2B,EAAE,QAAQ;QACrC,MAAM,EAAE,EAAE,GAAG,EAAE;gBACb,OAAO,CAAC,MAAM;gBACd,OAAO,CAAC,IAAI;gBACZ,OAAO,CAAC,UAAU;gBAClB,OAAO,CAAC,IAAI;gBACZ,OAAO,CAAC,MAAM;gBACd,OAAO,CAAC,MAAM;aACf,EAAE;KACJ,EACD,EAAE,CACH,CAAC;IACF,MAAM,IAAI,GAAyB,MAAM,eAAe,CAAC,gBAAgB,CACvE,OAAO,EACP,CAAC,EAAW,EAA4B,EAAE,CAAC,IAAI,CAChD,CAAC;IACF,mBAAmB,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;IAEjC,kBAAkB,CAAC,0BAA0B,CAAC,CAAC;IAC/C,MAAM,GAAG,GAAqC,IAAI,GAAG,EAA+B,CAAC;IACrF,KAAK,MAAM,QAAQ,IAAI,sBAAsB;QAAE,GAAG,CAAC,GAAG,CAAC,QAAQ,EAAE,EAAE,CAAC,CAAC;IAErE,KAAK,MAAM,GAAG,IAAI,IAAI,EAAE;QACvB,IAAI,GAAG,CAAC,UAAU,CAAC,cAAc,KAAK,MAAM;YAAE,SAAS;QAEvD,KAAK,MAAM,QAAQ,IAAI,GAAG,CAAC,UAAU,CAAC,UAAU;YAAE,GAAG,CAAC,GAAG,CAAC,QAAQ,CAAE,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;KAC/E;IACD,oBAAoB,EAAE,CAAC;IAEvB,kBAAkB,CAAC,oBAAoB,CAAC,CAAC;IAEzC,MAAM,IAAI,GAAW,EAAE,CAAC;IACxB,KAAK,MAAM,QAAQ,IAAI,sBAAsB,EAAE;QAC9C,MAAM,OAAO,GAAW,wBAAwB,CAAC,QAAQ,CAAC,CAAC;QAE3D,KAAK,MAAM,GAAG,IAAI,GAAG,CAAC,GAAG,CAAC,QAAQ,CAAE,EAAE;YACrC,IAAI,CAAC,IAAI,CAAC;gBACR,QAAQ,EAAE,QAAQ;gBAClB,OAAO,EAAE,OAAO;gBAChB,MAAM,EAAE,GAAG,CAAC,MAAM;gBAClB,GAAG,EAAE,GAAG,CAAC,GAAG;aACb,CAAC,CAAC;SACH;KACD;IAED,IAAI;SACD,IAAI,CAAC,CAAC,CAAO,EAAE,CAAO,EAAU,EAAE;QAClC,IAAI,CAAC,CAAC,QAAQ,GAAG,CAAC,CAAC,QAAQ;YAAE,OAAO,CAAC,CAAC,CAAC;QACvC,IAAI,CAAC,CAAC,QAAQ,GAAG,CAAC,CAAC,QAAQ;YAAE,OAAO,CAAC,CAAC;QAEtC,IAAI,CAAC,CAAC,MAAM,GAAG,CAAC,CAAC,MAAM;YAAE,OAAO,CAAC,CAAC,CAAC;QACnC,IAAI,CAAC,CAAC,MAAM,GAAG,CAAC,CAAC,MAAM;YAAE,OAAO,CAAC,CAAC;QAElC,IAAI,CAAC,CAAC,GAAG,GAAG,CAAC,CAAC,GAAG;YAAE,OAAO,CAAC,CAAC,CAAC;QAC7B,IAAI,CAAC,CAAC,GAAG,GAAG,CAAC,CAAC,GAAG;YAAE,OAAO,CAAC,CAAC;QAE5B,OAAO,CAAC,CAAC;IACV,CAAC,CAAC,CAAC;IAEL,oBAAoB,EAAE,CAAC;IAEvB,MAAM,GAAG,GAAe,IAAI,UAAU,CAAC;QACrC;YACE,IAAI,EAAE,UAAU;YAChB,IAAI,EAAE,qBAAqB,CAAC,MAAM;SACnC;QACD;YACE,IAAI,EAAE,SAAS;YACf,IAAI,EAAE,qBAAqB,CAAC,MAAM;SACnC;QACD;YACE,IAAI,EAAE,QAAQ;YACd,IAAI,EAAE,qBAAqB,CAAC,MAAM;SACnC;QACD;YACE,IAAI,EAAE,KAAK;YACX,IAAI,EAAE,qBAAqB,CAAC,MAAM;SACnC;KACF,CAAC,CAAC;IACH,GAAG,CAAC,IAAI,CACN,IAAI,EACJ,QAAQ,EACR,IAAI,CACL,CAAC;AACH,CAAC,CAAA,CAAC"}
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"readability-score.query.js","sourceRoot":"","sources":["../../src/queries/readability-score.query.ts"],"names":[],"mappings":";;;;;;;;;AAIA,OAAO,EAAE,OAAO,EAAE,MAAM,yBAAyB,CAAC;AAElD,OAAO,EAAe,kBAAkB,EAAE,kBAAkB,EAAE,qBAAqB,EAAE,mBAAmB,EAAE,MAAM,oBAAoB,CAAC;AAuBrI,MAAM,CAAC,MAAM,KAAK,GAAW,CAC3B,IAAiB,EACjB,eAAgC,EAChC,MAAa,EACb,OAAe,EACf,cAAyC,EAC1B,EAAE;IAClB,MAAM,MAAM,GAAqB,IAAI,CAAC,SAAS,CAAC,QAAQ,CAAC,CAAC;IAC1D,IAAI,CAAC,MAAM,EAAE;QACZ,kBAAkB,CAAC,qBAAqB,CAAC,CAAC;QAC1C,OAAO;KACP;IAED,kBAAkB,CAAC,4DAA4D,MAAM,EAAE,CAAC,CAAC;IAEzF,MAAM,OAAO,GAA+B,eAAe,CAAC,OAAO,EAAE,CAAC,SAAS,CAAU;QACvF,EAAE,MAAM,EAAE;gBACR,MAAM,EAAE,EAAE,GAAG,EAAE,OAAO,CAAC,QAAQ,EAAE;gBACjC,MAAM,EAAE,MAAM;gBACd,sBAAsB,EAAE,WAAW;aACpC,EAAE;QACH,EAAE,MAAM,EAAE;gBACR,2BAA2B,EAAE,EAAE,OAAO,EAAE,CAAC,EAAE;gBAC3C,0BAA0B,EAAE,EAAE,OAAO,EAAE,CAAC,EAAE;aAC3C,EAAE;QACH,EAAE,QAAQ,EAAE;gBACV,GAAG,EAAE,IAAI;gBACT,KAAK,EAAE;oBACL,UAAU,EAAE,kCAAkC;oBAC9C,SAAS,EAAE,iCAAiC;oBAC5C,KAAK,EAAE,6BAA6B;oBACpC,IAAI,EAAE,4BAA4B;oBAClC,GAAG,EAAE,2BAA2B;iBACjC;aACF,EAAE;QACH,EAAE,QAAQ,EAAE;gBACV,GAAG,EAAE,IAAI;gBACT,KAAK,EAAE,IAAI;gBACX,KAAK,EAAE;oBACL,IAAI,EAAE,EAAE,IAAI,EAAE,CAAC,CAAC,EAAE,EAAE,IAAI,EAAE,CAAE,GAAG,EAAE,aAAa,CAAE,EAAE,CAAE,EAAE;oBACtD,GAAG,EAAE,EAAE,IAAI,EAAE,CAAC,CAAC,EAAE,EAAE,IAAI,EAAE,CAAE,EAAE,EAAE,YAAY,CAAE,EAAE,CAAE,EAAE;iBACpD;aACF,EAAE;QACH,EAAE,QAAQ,EAAE;gBACV,GAAG,EAAE,IAAI;gBACT,KAAK,EAAE,IAAI;gBACX,QAAQ,EAAE;oBACR,IAAI,EAAE,EAAE,OAAO,EAAE,CAAE,EAAE,SAAS,EAAE,CAAE,GAAG,EAAE,aAAa,CAAE,EAAE,EAAE,GAAG,CAAE,EAAE;oBACjE,GAAG,EAAE,EAAE,OAAO,EAAE,CAAE,EAAE,SAAS,EAAE,CAAE,YAAY,EAAE,CAAC,CAAE,EAAE,EAAE,EAAE,CAAE,EAAE;iBAC7D;aACF,EAAE;QACH,EAAE,QAAQ,EAAE;gBACV,GAAG,EAAE,IAAI;gBACT,KAAK,EAAE,IAAI;gBACX,KAAK,EAAE,EAAE,OAAO,EAAE,CAAE,EAAE,IAAI,EAAE,CAAE,gBAAgB,EAAE,eAAe,CAAE,EAAE,EAAE,CAAC,CAAE,EAAE;aAC3E,EAAE;QACH,EAAE,KAAK,EAAE,EAAE,KAAK,EAAE,CAAC,CAAC,EAAE,EAAE;KACzB,CAAC,CAAC;IAEH,MAAM,OAAO,GAAc,EAAE,CAAC;IAC9B,IAAI,KAAK,GAAW,CAAC,CAAC;IACtB,OAAO,IAAI,EAAE;QACZ,KAAK,EAAE,CAAC;QACR,IAAI,CAAC,KAAK,GAAG,GAAG,CAAC,KAAK,CAAC;YAAE,qBAAqB,CAAC,GAAG,KAAK,EAAE,CAAC,CAAC;QAE3D,MAAM,GAAG,GAAiB,MAAM,OAAO,CAAC,IAAI,EAAE,CAAC;QAC/C,IAAI,GAAG,KAAK,IAAI;YAAE,MAAM;QAExB,OAAO,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;KAClB;IAED,mBAAmB,CAAC,KAAK,CAAC,CAAC;IAE3B,OAAO,CAAC,GAAG,CAAC,qDAAqD,CAAC,CAAC;IACnE,KAAK,MAAM,KAAK,IAAI,OAAO,EAAE;QAC5B,OAAO,CAAC,GAAG,CAAC,GAAG,KAAK,CAAC,GAAG,KAAK,KAAK,CAAC,KAAK,CAAC,UAAU,KAAK,KAAK,CAAC,KAAK,CAAC,SAAS,KAAK,KAAK,CAAC,KAAK,CAAC,KAAK,KAAK,KAAK,CAAC,KAAK,CAAC,IAAI,KAAK,KAAK,CAAC,KAAK,CAAC,GAAG,KAAK,KAAK,CAAC,KAAK,EAAE,CAAC,CAAC;KAChK;AACF,CAAC,CAAA,CAAC"}
|
|
@@ -1,198 +0,0 @@
|
|
|
1
|
-
var __awaiter = (this && this.__awaiter) || function (thisArg, _arguments, P, generator) {
|
|
2
|
-
function adopt(value) { return value instanceof P ? value : new P(function (resolve) { resolve(value); }); }
|
|
3
|
-
return new (P || (P = Promise))(function (resolve, reject) {
|
|
4
|
-
function fulfilled(value) { try { step(generator.next(value)); } catch (e) { reject(e); } }
|
|
5
|
-
function rejected(value) { try { step(generator["throw"](value)); } catch (e) { reject(e); } }
|
|
6
|
-
function step(result) { result.done ? resolve(result.value) : adopt(result.value).then(fulfilled, rejected); }
|
|
7
|
-
step((generator = generator.apply(thisArg, _arguments || [])).next());
|
|
8
|
-
});
|
|
9
|
-
};
|
|
10
|
-
import { commonsAsyncAbortTimeout, commonsAsyncTimeout } from 'tscommons-es-async';
|
|
11
|
-
import { EStatus } from 'hydra-crawler-ts-assets';
|
|
12
|
-
import { commonsOutputAlert, commonsOutputCompleted, commonsOutputDebug, commonsOutputDoing, commonsOutputProgress, commonsOutputStarting, commonsOutputSuccess } from 'nodecommons-es-cli';
|
|
13
|
-
import { commonsGracefulAbortAddCallback } from 'nodecommons-es-process';
|
|
14
|
-
import { Crawler } from '../classes/crawler';
|
|
15
|
-
import { EAvailableStrategy } from '../enums/eavailable-strategy';
|
|
16
|
-
export class CrawlServer {
|
|
17
|
-
set restrictTo(domains) {
|
|
18
|
-
this.domainRestrictTo = domains;
|
|
19
|
-
}
|
|
20
|
-
constructor(database, hydraConfig, crawlConfig, parsersConfig, robotsConfig, lists, tracker) {
|
|
21
|
-
this.database = database;
|
|
22
|
-
this.hydraConfig = hydraConfig;
|
|
23
|
-
this.crawlConfig = crawlConfig;
|
|
24
|
-
this.parsersConfig = parsersConfig;
|
|
25
|
-
this.robotsConfig = robotsConfig;
|
|
26
|
-
this.lists = lists;
|
|
27
|
-
this.tracker = tracker;
|
|
28
|
-
this.parsers = [];
|
|
29
|
-
this.isAborted = false;
|
|
30
|
-
this.preDelayIds = [];
|
|
31
|
-
this.isPaused = false;
|
|
32
|
-
this.domainRestrictTo = [];
|
|
33
|
-
this.crawlers = new Map();
|
|
34
|
-
this.strategies = new Map();
|
|
35
|
-
commonsGracefulAbortAddCallback(() => {
|
|
36
|
-
commonsOutputAlert('SIGINT abort flag is set. Aborting crawl server.');
|
|
37
|
-
this.abort();
|
|
38
|
-
for (const preDelayId of this.preDelayIds)
|
|
39
|
-
commonsAsyncAbortTimeout(preDelayId);
|
|
40
|
-
});
|
|
41
|
-
}
|
|
42
|
-
addParser(parser) {
|
|
43
|
-
this.parsers.push(parser);
|
|
44
|
-
}
|
|
45
|
-
listParsers() {
|
|
46
|
-
return this.parsers.slice();
|
|
47
|
-
}
|
|
48
|
-
pause() {
|
|
49
|
-
commonsOutputAlert('Pausing crawl server');
|
|
50
|
-
this.isPaused = true;
|
|
51
|
-
for (const domain of this.crawlers.keys()) {
|
|
52
|
-
this.pauseCrawl(domain);
|
|
53
|
-
}
|
|
54
|
-
}
|
|
55
|
-
resume() {
|
|
56
|
-
commonsOutputCompleted('Resuming crawl server');
|
|
57
|
-
this.isPaused = false;
|
|
58
|
-
for (const domain of this.crawlers.keys()) {
|
|
59
|
-
this.resumeCrawl(domain);
|
|
60
|
-
}
|
|
61
|
-
}
|
|
62
|
-
abort() {
|
|
63
|
-
this.isAborted = true;
|
|
64
|
-
commonsAsyncAbortTimeout('find-new-available');
|
|
65
|
-
}
|
|
66
|
-
terminate() {
|
|
67
|
-
return __awaiter(this, void 0, void 0, function* () {
|
|
68
|
-
this.abort();
|
|
69
|
-
yield this.database.close();
|
|
70
|
-
process.exit(0);
|
|
71
|
-
});
|
|
72
|
-
}
|
|
73
|
-
pauseCrawl(domain) {
|
|
74
|
-
if (!this.crawlers.has(domain))
|
|
75
|
-
return;
|
|
76
|
-
commonsOutputAlert(`Pausing crawler for ${domain}`);
|
|
77
|
-
this.crawlers.get(domain).pause();
|
|
78
|
-
}
|
|
79
|
-
resumeCrawl(domain) {
|
|
80
|
-
if (!this.crawlers.has(domain))
|
|
81
|
-
return;
|
|
82
|
-
commonsOutputCompleted(`Resuming crawler for ${domain}`);
|
|
83
|
-
this.crawlers.get(domain).resume();
|
|
84
|
-
}
|
|
85
|
-
start() {
|
|
86
|
-
return __awaiter(this, void 0, void 0, function* () {
|
|
87
|
-
yield this.database.resetActive();
|
|
88
|
-
const added = yield this.database.queue(this.hydraConfig.startUrl);
|
|
89
|
-
if (added)
|
|
90
|
-
this.tracker.delta(EStatus.QUEUED, 1);
|
|
91
|
-
while (!this.isAborted) {
|
|
92
|
-
if (!this.isPaused) {
|
|
93
|
-
const existing = [...this.crawlers.keys()];
|
|
94
|
-
const space = this.crawlConfig.maxCrawlers - existing.length;
|
|
95
|
-
if (space > 0) {
|
|
96
|
-
commonsOutputDebug(`Space for ${space} new crawls available`);
|
|
97
|
-
const largestStrategyDomains = existing
|
|
98
|
-
.filter((domain) => this.strategies.get(domain) === EAvailableStrategy.LARGEST);
|
|
99
|
-
const smallestStrategyDomains = existing
|
|
100
|
-
.filter((domain) => this.strategies.get(domain) === EAvailableStrategy.SMALLEST);
|
|
101
|
-
commonsOutputDebug(`Current crawl has LARGEST=${largestStrategyDomains.length}; SMALLEST=${smallestStrategyDomains.length}`);
|
|
102
|
-
let spaceForLargestDomains = 0;
|
|
103
|
-
let spaceForSmallestDomains = space;
|
|
104
|
-
if (largestStrategyDomains.length >= Math.floor(this.crawlConfig.maxCrawlers / 2)) {
|
|
105
|
-
// already 50% large crawling, so all remaining space goes to small crawls
|
|
106
|
-
}
|
|
107
|
-
else {
|
|
108
|
-
// allow a new large crawl, if enough space
|
|
109
|
-
if (space > 1) {
|
|
110
|
-
spaceForLargestDomains = 1;
|
|
111
|
-
spaceForSmallestDomains--;
|
|
112
|
-
}
|
|
113
|
-
}
|
|
114
|
-
commonsOutputDebug(`Space for LARGEST=${spaceForLargestDomains}; SMALLEST=${spaceForSmallestDomains}`);
|
|
115
|
-
const availablesLargest = yield this.database.available(EAvailableStrategy.LARGEST, this.crawlConfig.availableStrategyThreshold, spaceForLargestDomains, existing, this.domainRestrictTo);
|
|
116
|
-
existing.push(...availablesLargest);
|
|
117
|
-
const availablesSmallest = yield this.database.available(EAvailableStrategy.SMALLEST, this.crawlConfig.availableStrategyThreshold, spaceForSmallestDomains, existing, this.domainRestrictTo);
|
|
118
|
-
const availables = [
|
|
119
|
-
...availablesSmallest,
|
|
120
|
-
...availablesLargest
|
|
121
|
-
];
|
|
122
|
-
if (!this.isAborted) {
|
|
123
|
-
for (const domain of availables) {
|
|
124
|
-
commonsOutputStarting(`Creating new crawl head for ${domain}`);
|
|
125
|
-
const crawler = new Crawler(domain, this.database, this.crawlConfig, this.parsersConfig, this.robotsConfig, this.parsers, this.lists, this.tracker);
|
|
126
|
-
this.crawlers.set(domain, crawler);
|
|
127
|
-
if (availablesLargest.includes(domain)) {
|
|
128
|
-
this.strategies.set(domain, EAvailableStrategy.LARGEST);
|
|
129
|
-
}
|
|
130
|
-
else {
|
|
131
|
-
this.strategies.set(domain, EAvailableStrategy.SMALLEST);
|
|
132
|
-
}
|
|
133
|
-
// called without await in order to do parallel crawls
|
|
134
|
-
void (() => __awaiter(this, void 0, void 0, function* () {
|
|
135
|
-
try {
|
|
136
|
-
// delay randomly to prevent network socket request spikes
|
|
137
|
-
const preDelayId = `predelay_${domain}`;
|
|
138
|
-
this.preDelayIds.push(preDelayId);
|
|
139
|
-
try {
|
|
140
|
-
yield commonsAsyncTimeout(Math.random() * (this.crawlConfig.findNewAvailableDelay - 1000), preDelayId);
|
|
141
|
-
}
|
|
142
|
-
catch (e) {
|
|
143
|
-
if (e.message === 'abortTimeout called')
|
|
144
|
-
return;
|
|
145
|
-
throw e;
|
|
146
|
-
}
|
|
147
|
-
this.preDelayIds = this.preDelayIds
|
|
148
|
-
.filter((pid) => pid !== preDelayId);
|
|
149
|
-
if (this.isAborted)
|
|
150
|
-
return;
|
|
151
|
-
if (this.isPaused)
|
|
152
|
-
this.pauseCrawl(domain);
|
|
153
|
-
commonsOutputStarting(`Starting crawler for ${domain}`);
|
|
154
|
-
yield crawler.crawl();
|
|
155
|
-
}
|
|
156
|
-
catch (ex) {
|
|
157
|
-
commonsOutputDebug('debug position 6');
|
|
158
|
-
console.log(ex);
|
|
159
|
-
}
|
|
160
|
-
finally {
|
|
161
|
-
this.crawlers.delete(domain); // doesn't get called until after doCrawl() is called, so have to do it here if aborted
|
|
162
|
-
this.strategies.delete(domain);
|
|
163
|
-
}
|
|
164
|
-
}))();
|
|
165
|
-
}
|
|
166
|
-
}
|
|
167
|
-
}
|
|
168
|
-
}
|
|
169
|
-
try {
|
|
170
|
-
yield commonsAsyncTimeout(this.crawlConfig.findNewAvailableDelay, 'find-new-available');
|
|
171
|
-
}
|
|
172
|
-
catch (ex) {
|
|
173
|
-
// ignore
|
|
174
|
-
}
|
|
175
|
-
if (this.isAborted) {
|
|
176
|
-
commonsOutputAlert('SIGINT abort is set. Aborting new head loop.');
|
|
177
|
-
break;
|
|
178
|
-
}
|
|
179
|
-
}
|
|
180
|
-
});
|
|
181
|
-
}
|
|
182
|
-
shutdown() {
|
|
183
|
-
return __awaiter(this, void 0, void 0, function* () {
|
|
184
|
-
commonsOutputDoing('Waiting for all crawlers to abort');
|
|
185
|
-
while (this.crawlers.size > 0) {
|
|
186
|
-
commonsOutputProgress(this.crawlers.size);
|
|
187
|
-
try {
|
|
188
|
-
yield commonsAsyncTimeout(1000);
|
|
189
|
-
}
|
|
190
|
-
catch (ex) {
|
|
191
|
-
// ignore
|
|
192
|
-
}
|
|
193
|
-
}
|
|
194
|
-
commonsOutputSuccess();
|
|
195
|
-
});
|
|
196
|
-
}
|
|
197
|
-
}
|
|
198
|
-
//# sourceMappingURL=crawl.server.js.map
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"crawl.server.js","sourceRoot":"","sources":["../../src/servers/crawl.server.ts"],"names":[],"mappings":";;;;;;;;;AACA,OAAO,EAAE,wBAAwB,EAAE,mBAAmB,EAAE,MAAM,oBAAoB,CAAC;AAEnF,OAAO,EAAE,OAAO,EAAE,MAAM,yBAAyB,CAAC;AAElD,OAAO,EAAE,kBAAkB,EAAE,sBAAsB,EAAE,kBAAkB,EAAE,kBAAkB,EAAE,qBAAqB,EAAE,qBAAqB,EAAE,oBAAoB,EAAE,MAAM,oBAAoB,CAAC;AAC5L,OAAO,EAAE,+BAA+B,EAAE,MAAM,wBAAwB,CAAC;AAEzE,OAAO,EAAE,OAAO,EAAE,MAAM,oBAAoB,CAAC;AAa7C,OAAO,EAAE,kBAAkB,EAAE,MAAM,8BAA8B,CAAC;AAElE,MAAM,OAAO,WAAW;IAWvB,IAAW,UAAU,CAAC,OAAiB;QACtC,IAAI,CAAC,gBAAgB,GAAG,OAAO,CAAC;IACjC,CAAC;IAED,YACU,QAAyB,EACzB,WAAyB,EACzB,WAAyB,EACzB,aAAwC,EACxC,YAA2B,EAC3B,KAAY,EACZ,OAAgB;QANhB,aAAQ,GAAR,QAAQ,CAAiB;QACzB,gBAAW,GAAX,WAAW,CAAc;QACzB,gBAAW,GAAX,WAAW,CAAc;QACzB,kBAAa,GAAb,aAAa,CAA2B;QACxC,iBAAY,GAAZ,YAAY,CAAe;QAC3B,UAAK,GAAL,KAAK,CAAO;QACZ,YAAO,GAAP,OAAO,CAAS;QArBlB,YAAO,GAAkB,EAAE,CAAC;QAG5B,cAAS,GAAY,KAAK,CAAC;QAE3B,gBAAW,GAAa,EAAE,CAAC;QAE3B,aAAQ,GAAY,KAAK,CAAC;QAE1B,qBAAgB,GAAa,EAAE,CAAC;QAcvC,IAAI,CAAC,QAAQ,GAAG,IAAI,GAAG,EAAmB,CAAC;QAC3C,IAAI,CAAC,UAAU,GAAG,IAAI,GAAG,EAA8B,CAAC;QAExD,+BAA+B,CAAC,GAAS,EAAE;YAC1C,kBAAkB,CAAC,kDAAkD,CAAC,CAAC;YACvE,IAAI,CAAC,KAAK,EAAE,CAAC;YAEb,KAAK,MAAM,UAAU,IAAI,IAAI,CAAC,WAAW;gBAAE,wBAAwB,CAAC,UAAU,CAAC,CAAC;QACjF,CAAC,CAAC,CAAC;IACJ,CAAC;IAEM,SAAS,CAAC,MAAmB;QACnC,IAAI,CAAC,OAAO,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;IAC3B,CAAC;IAEM,WAAW;QACjB,OAAO,IAAI,CAAC,OAAO,CAAC,KAAK,EAAE,CAAC;IAC7B,CAAC;IAEM,KAAK;QACX,kBAAkB,CAAC,sBAAsB,CAAC,CAAC;QAE3C,IAAI,CAAC,QAAQ,GAAG,IAAI,CAAC;QAErB,KAAK,MAAM,MAAM,IAAI,IAAI,CAAC,QAAQ,CAAC,IAAI,EAAE,EAAE;YAC1C,IAAI,CAAC,UAAU,CAAC,MAAM,CAAC,CAAC;SACxB;IACF,CAAC;IAEM,MAAM;QACZ,sBAAsB,CAAC,uBAAuB,CAAC,CAAC;QAEhD,IAAI,CAAC,QAAQ,GAAG,KAAK,CAAC;QAEtB,KAAK,MAAM,MAAM,IAAI,IAAI,CAAC,QAAQ,CAAC,IAAI,EAAE,EAAE;YAC1C,IAAI,CAAC,WAAW,CAAC,MAAM,CAAC,CAAC;SACzB;IACF,CAAC;IAEO,KAAK;QACZ,IAAI,CAAC,SAAS,GAAG,IAAI,CAAC;QACtB,wBAAwB,CAAC,oBAAoB,CAAC,CAAC;IAChD,CAAC;IAEY,SAAS;;YACrB,IAAI,CAAC,KAAK,EAAE,CAAC;YAEb,MAAM,IAAI,CAAC,QAAQ,CAAC,KAAK,EAAE,CAAC;YAC5B,OAAO,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC;QACjB,CAAC;KAAA;IAEO,UAAU,CAAC,MAAc;QAChC,IAAI,CAAC,IAAI,CAAC,QAAQ,CAAC,GAAG,CAAC,MAAM,CAAC;YAAE,OAAO;QAEvC,kBAAkB,CAAC,uBAAuB,MAAM,EAAE,CAAC,CAAC;QAEpD,IAAI,CAAC,QAAQ,CAAC,GAAG,CAAC,MAAM,CAAE,CAAC,KAAK,EAAE,CAAC;IACpC,CAAC;IAEO,WAAW,CAAC,MAAc;QACjC,IAAI,CAAC,IAAI,CAAC,QAAQ,CAAC,GAAG,CAAC,MAAM,CAAC;YAAE,OAAO;QAEvC,sBAAsB,CAAC,wBAAwB,MAAM,EAAE,CAAC,CAAC;QAEzD,IAAI,CAAC,QAAQ,CAAC,GAAG,CAAC,MAAM,CAAE,CAAC,MAAM,EAAE,CAAC;IACrC,CAAC;IAEY,KAAK;;YACjB,MAAM,IAAI,CAAC,QAAQ,CAAC,WAAW,EAAE,CAAC;YAElC,MAAM,KAAK,GAAY,MAAM,IAAI,CAAC,QAAQ,CAAC,KAAK,CAAC,IAAI,CAAC,WAAW,CAAC,QAAQ,CAAC,CAAC;YAC5E,IAAI,KAAK;gBAAE,IAAI,CAAC,OAAO,CAAC,KAAK,CAAC,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC,CAAC;YAEjD,OAAO,CAAC,IAAI,CAAC,SAAS,EAAE;gBACvB,IAAI,CAAC,IAAI,CAAC,QAAQ,EAAE;oBACnB,MAAM,QAAQ,GAAa,CAAE,GAAG,IAAI,CAAC,QAAQ,CAAC,IAAI,EAAE,CAAE,CAAC;oBAEvD,MAAM,KAAK,GAAW,IAAI,CAAC,WAAW,CAAC,WAAW,GAAG,QAAQ,CAAC,MAAM,CAAC;oBAErE,IAAI,KAAK,GAAG,CAAC,EAAE;wBACd,kBAAkB,CAAC,aAAa,KAAK,uBAAuB,CAAC,CAAC;wBAE9D,MAAM,sBAAsB,GAAa,QAAQ;6BAC9C,MAAM,CAAC,CAAC,MAAc,EAAW,EAAE,CAAC,IAAI,CAAC,UAAU,CAAC,GAAG,CAAC,MAAM,CAAC,KAAK,kBAAkB,CAAC,OAAO,CAAC,CAAC;wBAEnG,MAAM,uBAAuB,GAAa,QAAQ;6BAC/C,MAAM,CAAC,CAAC,MAAc,EAAW,EAAE,CAAC,IAAI,CAAC,UAAU,CAAC,GAAG,CAAC,MAAM,CAAC,KAAK,kBAAkB,CAAC,QAAQ,CAAC,CAAC;wBAEpG,kBAAkB,CAAC,6BAA6B,sBAAsB,CAAC,MAAM,cAAc,uBAAuB,CAAC,MAAM,EAAE,CAAC,CAAC;wBAE7H,IAAI,sBAAsB,GAAW,CAAC,CAAC;wBACvC,IAAI,uBAAuB,GAAW,KAAK,CAAC;wBAE5C,IAAI,sBAAsB,CAAC,MAAM,IAAI,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,WAAW,CAAC,WAAW,GAAG,CAAC,CAAC,EAAE;4BAClF,0EAA0E;yBAC1E;6BAAM;4BACN,2CAA2C;4BAC3C,IAAI,KAAK,GAAG,CAAC,EAAE;gCACd,sBAAsB,GAAG,CAAC,CAAC;gCAC3B,uBAAuB,EAAE,CAAC;6BAC1B;yBACD;wBAED,kBAAkB,CAAC,qBAAqB,sBAAsB,cAAc,uBAAuB,EAAE,CAAC,CAAC;wBAEvG,MAAM,iBAAiB,GAAa,MAAM,IAAI,CAAC,QAAQ,CAAC,SAAS,CAC/D,kBAAkB,CAAC,OAAO,EAC1B,IAAI,CAAC,WAAW,CAAC,0BAA0B,EAC3C,sBAAsB,EACtB,QAAQ,EACR,IAAI,CAAC,gBAAgB,CACtB,CAAC;wBAEF,QAAQ,CAAC,IAAI,CAAC,GAAG,iBAAiB,CAAC,CAAC;wBAEpC,MAAM,kBAAkB,GAAa,MAAM,IAAI,CAAC,QAAQ,CAAC,SAAS,CAChE,kBAAkB,CAAC,QAAQ,EAC3B,IAAI,CAAC,WAAW,CAAC,0BAA0B,EAC3C,uBAAuB,EACvB,QAAQ,EACR,IAAI,CAAC,gBAAgB,CACtB,CAAC;wBAEF,MAAM,UAAU,GAAa;4BAC3B,GAAG,kBAAkB;4BACrB,GAAG,iBAAiB;yBACrB,CAAC;wBAEF,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE;4BACpB,KAAK,MAAM,MAAM,IAAI,UAAU,EAAE;gCAChC,qBAAqB,CAAC,+BAA+B,MAAM,EAAE,CAAC,CAAC;gCAE/D,MAAM,OAAO,GAAY,IAAI,OAAO,CAClC,MAAM,EACN,IAAI,CAAC,QAAQ,EACb,IAAI,CAAC,WAAW,EAChB,IAAI,CAAC,aAAa,EAClB,IAAI,CAAC,YAAY,EACjB,IAAI,CAAC,OAAO,EACZ,IAAI,CAAC,KAAK,EACV,IAAI,CAAC,OAAO,CACb,CAAC;gCAEF,IAAI,CAAC,QAAQ,CAAC,GAAG,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;gCAEnC,IAAI,iBAAiB,CAAC,QAAQ,CAAC,MAAM,CAAC,EAAE;oCACvC,IAAI,CAAC,UAAU,CAAC,GAAG,CAAC,MAAM,EAAE,kBAAkB,CAAC,OAAO,CAAC,CAAC;iCACxD;qCAAM;oCACN,IAAI,CAAC,UAAU,CAAC,GAAG,CAAC,MAAM,EAAE,kBAAkB,CAAC,QAAQ,CAAC,CAAC;iCACzD;gCAED,sDAAsD;gCACtD,KAAK,CAAC,GAAwB,EAAE;oCAC/B,IAAI;wCACH,0DAA0D;wCAC1D,MAAM,UAAU,GAAW,YAAY,MAAM,EAAE,CAAC;wCAChD,IAAI,CAAC,WAAW,CAAC,IAAI,CAAC,UAAU,CAAC,CAAC;wCAClC,IAAI;4CACH,MAAM,mBAAmB,CACvB,IAAI,CAAC,MAAM,EAAE,GAAG,CAAC,IAAI,CAAC,WAAW,CAAC,qBAAqB,GAAG,IAAI,CAAC,EAC/D,UAAU,CACX,CAAC;yCACF;wCAAC,OAAO,CAAC,EAAE;4CACX,IAAK,CAAW,CAAC,OAAO,KAAK,qBAAqB;gDAAE,OAAO;4CAC3D,MAAM,CAAC,CAAC;yCACR;wCAED,IAAI,CAAC,WAAW,GAAG,IAAI,CAAC,WAAW;6CAChC,MAAM,CAAC,CAAC,GAAW,EAAW,EAAE,CAAC,GAAG,KAAK,UAAU,CAAC,CAAC;wCAExD,IAAI,IAAI,CAAC,SAAS;4CAAE,OAAO;wCAC3B,IAAI,IAAI,CAAC,QAAQ;4CAAE,IAAI,CAAC,UAAU,CAAC,MAAM,CAAC,CAAC;wCAE3C,qBAAqB,CAAC,wBAAwB,MAAM,EAAE,CAAC,CAAC;wCACxD,MAAM,OAAO,CAAC,KAAK,EAAE,CAAC;qCACtB;oCAAC,OAAO,EAAE,EAAE;wCACZ,kBAAkB,CAAC,kBAAkB,CAAC,CAAC;wCACvC,OAAO,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;qCAChB;4CAAS;wCACT,IAAI,CAAC,QAAQ,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,uFAAuF;wCACrH,IAAI,CAAC,UAAU,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC;qCAC/B;gCACF,CAAC,CAAA,CAAC,EAAE,CAAC;6BACL;yBACD;qBACD;iBACD;gBAED,IAAI;oBACH,MAAM,mBAAmB,CAAC,IAAI,CAAC,WAAW,CAAC,qBAAqB,EAAE,oBAAoB,CAAC,CAAC;iBACxF;gBAAC,OAAO,EAAE,EAAE;oBACZ,SAAS;iBACT;gBAED,IAAI,IAAI,CAAC,SAAS,EAAE;oBACnB,kBAAkB,CAAC,8CAA8C,CAAC,CAAC;oBACnE,MAAM;iBACN;aACD;QACF,CAAC;KAAA;IAEY,QAAQ;;YACpB,kBAAkB,CAAC,mCAAmC,CAAC,CAAC;YACxD,OAAO,IAAI,CAAC,QAAQ,CAAC,IAAI,GAAG,CAAC,EAAE;gBAC9B,qBAAqB,CAAC,IAAI,CAAC,QAAQ,CAAC,IAAI,CAAC,CAAC;gBAE1C,IAAI;oBACH,MAAM,mBAAmB,CAAC,IAAI,CAAC,CAAC;iBAChC;gBAAC,OAAO,EAAE,EAAE;oBACZ,SAAS;iBACT;aACD;YACD,oBAAoB,EAAE,CAAC;QACxB,CAAC;KAAA;CACD"}
|
|
@@ -1,13 +0,0 @@
|
|
|
1
|
-
import { CommonsStrictExpressServer } from 'nodecommons-es-express';
|
|
2
|
-
import { commonsGracefulAbortAddCallback } from 'nodecommons-es-process';
|
|
3
|
-
import { commonsOutputAlert } from 'nodecommons-es-cli';
|
|
4
|
-
export class ExpressServer extends CommonsStrictExpressServer {
|
|
5
|
-
constructor(ex, server, config) {
|
|
6
|
-
super(ex, server, config.port);
|
|
7
|
-
commonsGracefulAbortAddCallback(() => {
|
|
8
|
-
commonsOutputAlert('SIGINT abort flag is set. Aborting Express server.');
|
|
9
|
-
super.close();
|
|
10
|
-
});
|
|
11
|
-
}
|
|
12
|
-
}
|
|
13
|
-
//# sourceMappingURL=express.server.js.map
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
{"version":3,"file":"express.server.js","sourceRoot":"","sources":["../../src/servers/express.server.ts"],"names":[],"mappings":"AAIA,OAAO,EAAE,0BAA0B,EAAE,MAAM,wBAAwB,CAAC;AAEpE,OAAO,EAAE,+BAA+B,EAAE,MAAM,wBAAwB,CAAC;AACzE,OAAO,EAAE,kBAAkB,EAAE,MAAM,oBAAoB,CAAC;AAExD,MAAM,OAAO,aAAc,SAAQ,0BAA0B;IAC5D,YACE,EAAmB,EACnB,MAAmB,EACnB,MAA6B;QAE9B,KAAK,CAAC,EAAE,EAAE,MAAM,EAAE,MAAM,CAAC,IAAI,CAAC,CAAC;QAE/B,+BAA+B,CAAC,GAAS,EAAE;YAC1C,kBAAkB,CAAC,oDAAoD,CAAC,CAAC;YACzE,KAAK,CAAC,KAAK,EAAE,CAAC;QACf,CAAC,CAAC,CAAC;IACJ,CAAC;CACD"}
|