hydra-crawler 2.8.3 → 3.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (468) hide show
  1. package/dist/apis/{autocomplete.api.d.ts → autocomplete.api.d.mts} +4 -4
  2. package/dist/apis/autocomplete.api.mjs +14 -0
  3. package/dist/apis/autocomplete.api.mjs.map +1 -0
  4. package/dist/apis/{bugs.api.d.ts → bugs.api.d.mts} +4 -4
  5. package/dist/apis/bugs.api.mjs +18 -0
  6. package/dist/apis/bugs.api.mjs.map +1 -0
  7. package/dist/apis/{crawl.api.d.ts → crawl.api.d.mts} +4 -4
  8. package/dist/apis/crawl.api.mjs +17 -0
  9. package/dist/apis/crawl.api.mjs.map +1 -0
  10. package/dist/apis/{domains.api.d.ts → domains.api.d.mts} +4 -4
  11. package/dist/apis/{domains.api.js → domains.api.mjs} +10 -18
  12. package/dist/apis/domains.api.mjs.map +1 -0
  13. package/dist/apis/{images.api.d.ts → images.api.d.mts} +4 -4
  14. package/dist/apis/images.api.mjs +19 -0
  15. package/dist/apis/images.api.mjs.map +1 -0
  16. package/dist/apis/{statistics.api.d.ts → statistics.api.d.mts} +4 -4
  17. package/dist/apis/statistics.api.mjs +33 -0
  18. package/dist/apis/statistics.api.mjs.map +1 -0
  19. package/dist/apis/{test.api.d.ts → test.api.d.mts} +3 -3
  20. package/dist/apis/test.api.mjs +10 -0
  21. package/dist/apis/test.api.mjs.map +1 -0
  22. package/dist/apis/{urls.api.d.ts → urls.api.d.mts} +4 -4
  23. package/dist/apis/urls.api.mjs +21 -0
  24. package/dist/apis/urls.api.mjs.map +1 -0
  25. package/dist/apps/{cleanup.app.d.ts → cleanup.app.d.mts} +5 -5
  26. package/dist/apps/cleanup.app.mjs +129 -0
  27. package/dist/apps/cleanup.app.mjs.map +1 -0
  28. package/dist/apps/{cross-populate-export.app.d.ts → cross-populate-export.app.d.mts} +3 -3
  29. package/dist/apps/cross-populate-export.app.mjs +61 -0
  30. package/dist/apps/cross-populate-export.app.mjs.map +1 -0
  31. package/dist/apps/{cross-populate-import.app.d.ts → cross-populate-import.app.d.mts} +3 -3
  32. package/dist/apps/cross-populate-import.app.mjs +61 -0
  33. package/dist/apps/cross-populate-import.app.mjs.map +1 -0
  34. package/dist/apps/{denylist.app.d.ts → denylist.app.d.mts} +5 -5
  35. package/dist/apps/denylist.app.mjs +122 -0
  36. package/dist/apps/denylist.app.mjs.map +1 -0
  37. package/dist/apps/{expire.app.d.ts → expire.app.d.mts} +8 -7
  38. package/dist/apps/expire.app.mjs +51 -0
  39. package/dist/apps/expire.app.mjs.map +1 -0
  40. package/dist/apps/{export-domain-urls.d.ts → export-domain-urls.d.mts} +3 -3
  41. package/dist/apps/export-domain-urls.mjs +85 -0
  42. package/dist/apps/export-domain-urls.mjs.map +1 -0
  43. package/dist/apps/{extract-text.app.d.ts → extract-text.app.d.mts} +2 -2
  44. package/dist/apps/extract-text.app.mjs +43 -0
  45. package/dist/apps/extract-text.app.mjs.map +1 -0
  46. package/dist/apps/{hydra.app.d.ts → hydra.app.d.mts} +10 -10
  47. package/dist/apps/hydra.app.mjs +222 -0
  48. package/dist/apps/hydra.app.mjs.map +1 -0
  49. package/dist/apps/{import.app.d.ts → import.app.d.mts} +3 -3
  50. package/dist/apps/import.app.mjs +48 -0
  51. package/dist/apps/import.app.mjs.map +1 -0
  52. package/dist/apps/{internal-hydra-common.app.d.ts → internal-hydra-common.app.d.mts} +6 -6
  53. package/dist/apps/{internal-hydra-common.app.js → internal-hydra-common.app.mjs} +1 -1
  54. package/dist/apps/internal-hydra-common.app.mjs.map +1 -0
  55. package/dist/apps/{move-to-archive.app.d.ts → move-to-archive.app.d.mts} +2 -2
  56. package/dist/apps/move-to-archive.app.mjs +31 -0
  57. package/dist/apps/move-to-archive.app.mjs.map +1 -0
  58. package/dist/apps/{prune-archive.app.d.ts → prune-archive.app.d.mts} +2 -2
  59. package/dist/apps/prune-archive.app.mjs +40 -0
  60. package/dist/apps/prune-archive.app.mjs.map +1 -0
  61. package/dist/apps/{query.app.d.ts → query.app.d.mts} +6 -6
  62. package/dist/apps/query.app.mjs +69 -0
  63. package/dist/apps/query.app.mjs.map +1 -0
  64. package/dist/apps/{reattempt.app.d.ts → reattempt.app.d.mts} +6 -6
  65. package/dist/apps/reattempt.app.mjs +74 -0
  66. package/dist/apps/reattempt.app.mjs.map +1 -0
  67. package/dist/apps/{requeue-domain.app.d.ts → requeue-domain.app.d.mts} +3 -3
  68. package/dist/apps/requeue-domain.app.mjs +52 -0
  69. package/dist/apps/requeue-domain.app.mjs.map +1 -0
  70. package/dist/apps/{seed.app.d.ts → seed.app.d.mts} +5 -5
  71. package/dist/apps/seed.app.mjs +59 -0
  72. package/dist/apps/seed.app.mjs.map +1 -0
  73. package/dist/apps/{startup.app.d.ts → startup.app.d.mts} +3 -3
  74. package/dist/apps/startup.app.mjs +55 -0
  75. package/dist/apps/startup.app.mjs.map +1 -0
  76. package/dist/apps/{unarchive-urls.app.d.ts → unarchive-urls.app.d.mts} +5 -5
  77. package/dist/apps/unarchive-urls.app.mjs +71 -0
  78. package/dist/apps/unarchive-urls.app.mjs.map +1 -0
  79. package/dist/classes/{cleaner.d.ts → cleaner.d.mts} +2 -2
  80. package/dist/classes/cleaner.mjs +257 -0
  81. package/dist/classes/cleaner.mjs.map +1 -0
  82. package/dist/classes/{crawler.d.ts → crawler.d.mts} +10 -12
  83. package/dist/classes/crawler.mjs +418 -0
  84. package/dist/classes/crawler.mjs.map +1 -0
  85. package/dist/classes/{dns.js → dns.mjs} +4 -4
  86. package/dist/classes/dns.mjs.map +1 -0
  87. package/dist/classes/{expirer.d.ts → expirer.d.mts} +2 -2
  88. package/dist/classes/expirer.mjs +117 -0
  89. package/dist/classes/expirer.mjs.map +1 -0
  90. package/dist/classes/{expiry.d.ts → expiry.d.mts} +1 -1
  91. package/dist/classes/{expiry.js → expiry.mjs} +7 -9
  92. package/dist/classes/expiry.mjs.map +1 -0
  93. package/dist/classes/{lists.d.ts → lists.d.mts} +2 -2
  94. package/dist/classes/{lists.js → lists.mjs} +4 -4
  95. package/dist/classes/lists.mjs.map +1 -0
  96. package/dist/classes/{robot.d.ts → robot.d.mts} +3 -3
  97. package/dist/classes/robot.mjs +74 -0
  98. package/dist/classes/robot.mjs.map +1 -0
  99. package/dist/classes/{tracker.d.ts → tracker.d.mts} +3 -3
  100. package/dist/classes/tracker.mjs +101 -0
  101. package/dist/classes/tracker.mjs.map +1 -0
  102. package/dist/{cli.js → cli.mjs} +46 -58
  103. package/dist/cli.mjs.map +1 -0
  104. package/dist/enums/{eavailable-strategy.js → eavailable-strategy.mjs} +1 -1
  105. package/dist/enums/eavailable-strategy.mjs.map +1 -0
  106. package/dist/enums/{elist.js → elist.mjs} +1 -1
  107. package/dist/enums/elist.mjs.map +1 -0
  108. package/dist/enums/{eserver.js → eserver.mjs} +1 -1
  109. package/dist/enums/eserver.mjs.map +1 -0
  110. package/dist/enums/{ex-powered-by.js → ex-powered-by.mjs} +1 -1
  111. package/dist/enums/ex-powered-by.mjs.map +1 -0
  112. package/dist/helpers/{matcher.d.ts → matcher.d.mts} +1 -1
  113. package/dist/helpers/{matcher.js → matcher.mjs} +1 -1
  114. package/dist/helpers/matcher.mjs.map +1 -0
  115. package/dist/helpers/{random.d.ts → random.d.mts} +1 -1
  116. package/dist/helpers/{random.js → random.mjs} +1 -1
  117. package/dist/helpers/random.mjs.map +1 -0
  118. package/dist/helpers/{utf-decoder.d.ts → utf-decoder.d.mts} +0 -1
  119. package/dist/helpers/{utf-decoder.js → utf-decoder.mjs} +3 -3
  120. package/dist/helpers/utf-decoder.mjs.map +1 -0
  121. package/dist/interfaces/{iexpiry.d.ts → iexpiry.d.mts} +1 -1
  122. package/dist/interfaces/{iexpiry.js → iexpiry.mjs} +3 -3
  123. package/dist/interfaces/iexpiry.mjs.map +1 -0
  124. package/dist/interfaces/{imatch.js → imatch.mjs} +2 -2
  125. package/dist/interfaces/imatch.mjs.map +1 -0
  126. package/dist/interfaces/{iparser-config.js → iparser-config.mjs} +2 -2
  127. package/dist/interfaces/iparser-config.mjs.map +1 -0
  128. package/dist/interfaces/{iparser.d.ts → iparser.d.mts} +1 -1
  129. package/dist/interfaces/iparser.mjs +2 -0
  130. package/dist/interfaces/iparser.mjs.map +1 -0
  131. package/dist/interfaces/{irequest-outcome.d.ts → irequest-outcome.d.mts} +0 -2
  132. package/dist/interfaces/irequest-outcome.mjs +2 -0
  133. package/dist/interfaces/irequest-outcome.mjs.map +1 -0
  134. package/dist/interfaces/iserver.mjs +2 -0
  135. package/dist/interfaces/iserver.mjs.map +1 -0
  136. package/dist/parsers/accessibility-metrics.parser.d.mts +11 -0
  137. package/dist/parsers/accessibility-metrics.parser.mjs +30 -0
  138. package/dist/parsers/accessibility-metrics.parser.mjs.map +1 -0
  139. package/dist/parsers/asp-error.parser.d.mts +12 -0
  140. package/dist/parsers/asp-error.parser.mjs +38 -0
  141. package/dist/parsers/asp-error.parser.mjs.map +1 -0
  142. package/dist/parsers/{bad-words.parser.d.ts → bad-words.parser.d.mts} +6 -6
  143. package/dist/parsers/bad-words.parser.mjs +17 -0
  144. package/dist/parsers/bad-words.parser.mjs.map +1 -0
  145. package/dist/parsers/complex-english.parser.d.mts +15 -0
  146. package/dist/parsers/complex-english.parser.mjs +52 -0
  147. package/dist/parsers/complex-english.parser.mjs.map +1 -0
  148. package/dist/parsers/data.parser.d.mts +13 -0
  149. package/dist/parsers/{data.parser.js → data.parser.mjs} +8 -7
  150. package/dist/parsers/data.parser.mjs.map +1 -0
  151. package/dist/parsers/{dictionary.parser.d.ts → dictionary.parser.d.mts} +6 -6
  152. package/dist/parsers/dictionary.parser.mjs +63 -0
  153. package/dist/parsers/dictionary.parser.mjs.map +1 -0
  154. package/dist/parsers/html.parser.d.mts +13 -0
  155. package/dist/parsers/{html.parser.js → html.parser.mjs} +4 -3
  156. package/dist/parsers/html.parser.mjs.map +1 -0
  157. package/dist/parsers/hyperlinks.parser.d.mts +20 -0
  158. package/dist/parsers/hyperlinks.parser.mjs +104 -0
  159. package/dist/parsers/hyperlinks.parser.mjs.map +1 -0
  160. package/dist/parsers/image-tags.parser.d.mts +19 -0
  161. package/dist/parsers/image-tags.parser.mjs +42 -0
  162. package/dist/parsers/image-tags.parser.mjs.map +1 -0
  163. package/dist/parsers/{interest.parser.d.ts → interest.parser.d.mts} +7 -7
  164. package/dist/parsers/interest.parser.mjs +60 -0
  165. package/dist/parsers/interest.parser.mjs.map +1 -0
  166. package/dist/parsers/jpeg.parser.d.mts +11 -0
  167. package/dist/parsers/jpeg.parser.mjs +29 -0
  168. package/dist/parsers/jpeg.parser.mjs.map +1 -0
  169. package/dist/parsers/{llama-guard.parser.d.ts → llama-guard.parser.d.mts} +7 -7
  170. package/dist/parsers/llama-guard.parser.mjs +56 -0
  171. package/dist/parsers/llama-guard.parser.mjs.map +1 -0
  172. package/dist/parsers/{offence.parser.d.ts → offence.parser.d.mts} +7 -7
  173. package/dist/parsers/offence.parser.mjs +60 -0
  174. package/dist/parsers/offence.parser.mjs.map +1 -0
  175. package/dist/parsers/{ollama.parser.d.ts → ollama.parser.d.mts} +6 -6
  176. package/dist/parsers/ollama.parser.mjs +43 -0
  177. package/dist/parsers/ollama.parser.mjs.map +1 -0
  178. package/dist/parsers/{paragraphs.parser.d.ts → paragraphs.parser.d.mts} +5 -5
  179. package/dist/parsers/paragraphs.parser.mjs +38 -0
  180. package/dist/parsers/paragraphs.parser.mjs.map +1 -0
  181. package/dist/parsers/{parser.d.ts → parser.d.mts} +6 -6
  182. package/dist/parsers/parser.mjs +45 -0
  183. package/dist/parsers/parser.mjs.map +1 -0
  184. package/dist/parsers/php-error.parser.d.mts +12 -0
  185. package/dist/parsers/php-error.parser.mjs +42 -0
  186. package/dist/parsers/php-error.parser.mjs.map +1 -0
  187. package/dist/parsers/{phrase.parser.d.ts → phrase.parser.d.mts} +3 -3
  188. package/dist/parsers/phrase.parser.mjs +15 -0
  189. package/dist/parsers/phrase.parser.mjs.map +1 -0
  190. package/dist/parsers/{regex.parser.d.ts → regex.parser.d.mts} +3 -3
  191. package/dist/parsers/regex.parser.mjs +29 -0
  192. package/dist/parsers/regex.parser.mjs.map +1 -0
  193. package/dist/parsers/server.parser.d.mts +11 -0
  194. package/dist/parsers/server.parser.mjs +57 -0
  195. package/dist/parsers/server.parser.mjs.map +1 -0
  196. package/dist/parsers/{spelling.parser.d.ts → spelling.parser.d.mts} +6 -6
  197. package/dist/parsers/spelling.parser.mjs +17 -0
  198. package/dist/parsers/spelling.parser.mjs.map +1 -0
  199. package/dist/parsers/string.parser.d.mts +8 -0
  200. package/dist/parsers/{string.parser.js → string.parser.mjs} +5 -4
  201. package/dist/parsers/string.parser.mjs.map +1 -0
  202. package/dist/parsers/{text.parser.d.ts → text.parser.d.mts} +3 -3
  203. package/dist/parsers/text.parser.mjs +30 -0
  204. package/dist/parsers/text.parser.mjs.map +1 -0
  205. package/dist/parsers/{words.parser.d.ts → words.parser.d.mts} +3 -3
  206. package/dist/parsers/words.parser.mjs +29 -0
  207. package/dist/parsers/words.parser.mjs.map +1 -0
  208. package/dist/queries/complex-english.query.d.mts +2 -0
  209. package/dist/queries/{complex-english.query.js → complex-english.query.mjs} +18 -27
  210. package/dist/queries/complex-english.query.mjs.map +1 -0
  211. package/dist/queries/flash-content.query.d.mts +2 -0
  212. package/dist/queries/flash-content.query.mjs +80 -0
  213. package/dist/queries/flash-content.query.mjs.map +1 -0
  214. package/dist/queries/linking-to-domains.query.d.mts +2 -0
  215. package/dist/queries/linking-to-domains.query.mjs +128 -0
  216. package/dist/queries/linking-to-domains.query.mjs.map +1 -0
  217. package/dist/queries/llamaguard-unsafe-content.query.d.mts +2 -0
  218. package/dist/queries/llamaguard-unsafe-content.query.mjs +90 -0
  219. package/dist/queries/llamaguard-unsafe-content.query.mjs.map +1 -0
  220. package/dist/queries/readability-score.query.d.mts +2 -0
  221. package/dist/queries/{readability-score.query.js → readability-score.query.mjs} +11 -20
  222. package/dist/queries/readability-score.query.mjs.map +1 -0
  223. package/dist/servers/{crawl.server.d.ts → crawl.server.d.mts} +10 -10
  224. package/dist/servers/crawl.server.mjs +192 -0
  225. package/dist/servers/crawl.server.mjs.map +1 -0
  226. package/dist/servers/{express.server.d.ts → express.server.d.mts} +2 -3
  227. package/dist/servers/express.server.mjs +13 -0
  228. package/dist/servers/express.server.mjs.map +1 -0
  229. package/dist/servers/{maintenance.server.d.ts → maintenance.server.d.mts} +5 -5
  230. package/dist/servers/maintenance.server.mjs +97 -0
  231. package/dist/servers/maintenance.server.mjs.map +1 -0
  232. package/dist/servers/{rest.server.d.ts → rest.server.d.mts} +4 -4
  233. package/dist/servers/rest.server.mjs +62 -0
  234. package/dist/servers/rest.server.mjs.map +1 -0
  235. package/dist/servers/{socket-io.server.d.ts → socket-io.server.d.mts} +4 -4
  236. package/dist/servers/socket-io.server.mjs +22 -0
  237. package/dist/servers/socket-io.server.mjs.map +1 -0
  238. package/dist/services/{database.service.d.ts → database.service.d.mts} +12 -12
  239. package/dist/services/database.service.mjs +645 -0
  240. package/dist/services/database.service.mjs.map +1 -0
  241. package/dist/services/{ollama-rest.service.d.ts → ollama-rest.service.d.mts} +2 -2
  242. package/dist/services/ollama-rest.service.mjs +27 -0
  243. package/dist/services/ollama-rest.service.mjs.map +1 -0
  244. package/dist/services/{rig-llama-guard.service.d.ts → rig-llama-guard.service.d.mts} +2 -2
  245. package/dist/services/{rig-llama-guard.service.js → rig-llama-guard.service.mjs} +33 -43
  246. package/dist/services/rig-llama-guard.service.mjs.map +1 -0
  247. package/dist/services/{rig-queue-length.service.d.ts → rig-queue-length.service.d.mts} +1 -1
  248. package/dist/services/rig-queue-length.service.mjs +12 -0
  249. package/dist/services/rig-queue-length.service.mjs.map +1 -0
  250. package/dist/services/{rig-subjectivity-scale.service.d.ts → rig-subjectivity-scale.service.d.mts} +2 -2
  251. package/dist/services/rig-subjectivity-scale.service.mjs +82 -0
  252. package/dist/services/rig-subjectivity-scale.service.mjs.map +1 -0
  253. package/dist/services/{rig-ticket-rest.service.d.ts → rig-ticket-rest.service.d.mts} +3 -3
  254. package/dist/services/rig-ticket-rest.service.mjs +15 -0
  255. package/dist/services/rig-ticket-rest.service.mjs.map +1 -0
  256. package/dist/services/{rig-ticketed-promise.service.d.ts → rig-ticketed-promise.service.d.mts} +4 -6
  257. package/dist/services/{rig-ticketed-promise.service.js → rig-ticketed-promise.service.mjs} +7 -6
  258. package/dist/services/rig-ticketed-promise.service.mjs.map +1 -0
  259. package/dist/types/{tcrawl-config.js → tcrawl-config.mjs} +2 -2
  260. package/dist/types/tcrawl-config.mjs.map +1 -0
  261. package/dist/types/{thydra-config.js → thydra-config.mjs} +2 -2
  262. package/dist/types/thydra-config.mjs.map +1 -0
  263. package/dist/types/tparser-ctor.d.mts +7 -0
  264. package/dist/types/tparser-ctor.mjs +2 -0
  265. package/dist/types/tparser-ctor.mjs.map +1 -0
  266. package/dist/types/tquery.d.mts +7 -0
  267. package/dist/types/tquery.mjs +2 -0
  268. package/dist/types/tquery.mjs.map +1 -0
  269. package/dist/types/tqueue-length.mjs +2 -0
  270. package/dist/types/tqueue-length.mjs.map +1 -0
  271. package/dist/types/{trobots-config.js → trobots-config.mjs} +2 -2
  272. package/dist/types/trobots-config.mjs.map +1 -0
  273. package/package.json +37 -43
  274. package/dist/apis/autocomplete.api.js +0 -22
  275. package/dist/apis/autocomplete.api.js.map +0 -1
  276. package/dist/apis/bugs.api.js +0 -26
  277. package/dist/apis/bugs.api.js.map +0 -1
  278. package/dist/apis/crawl.api.js +0 -25
  279. package/dist/apis/crawl.api.js.map +0 -1
  280. package/dist/apis/domains.api.js.map +0 -1
  281. package/dist/apis/images.api.js +0 -27
  282. package/dist/apis/images.api.js.map +0 -1
  283. package/dist/apis/statistics.api.js +0 -41
  284. package/dist/apis/statistics.api.js.map +0 -1
  285. package/dist/apis/test.api.js +0 -19
  286. package/dist/apis/test.api.js.map +0 -1
  287. package/dist/apis/urls.api.js +0 -29
  288. package/dist/apis/urls.api.js.map +0 -1
  289. package/dist/apps/cleanup.app.js +0 -141
  290. package/dist/apps/cleanup.app.js.map +0 -1
  291. package/dist/apps/cross-populate-export.app.js +0 -75
  292. package/dist/apps/cross-populate-export.app.js.map +0 -1
  293. package/dist/apps/cross-populate-import.app.js +0 -100
  294. package/dist/apps/cross-populate-import.app.js.map +0 -1
  295. package/dist/apps/denylist.app.js +0 -132
  296. package/dist/apps/denylist.app.js.map +0 -1
  297. package/dist/apps/expire.app.js +0 -63
  298. package/dist/apps/expire.app.js.map +0 -1
  299. package/dist/apps/export-domain-urls.js +0 -99
  300. package/dist/apps/export-domain-urls.js.map +0 -1
  301. package/dist/apps/extract-text.app.js +0 -55
  302. package/dist/apps/extract-text.app.js.map +0 -1
  303. package/dist/apps/hydra.app.js +0 -218
  304. package/dist/apps/hydra.app.js.map +0 -1
  305. package/dist/apps/import.app.js +0 -57
  306. package/dist/apps/import.app.js.map +0 -1
  307. package/dist/apps/internal-hydra-common.app.js.map +0 -1
  308. package/dist/apps/move-to-archive.app.js +0 -46
  309. package/dist/apps/move-to-archive.app.js.map +0 -1
  310. package/dist/apps/prune-archive.app.js +0 -55
  311. package/dist/apps/prune-archive.app.js.map +0 -1
  312. package/dist/apps/query.app.js +0 -80
  313. package/dist/apps/query.app.js.map +0 -1
  314. package/dist/apps/reattempt.app.js +0 -83
  315. package/dist/apps/reattempt.app.js.map +0 -1
  316. package/dist/apps/requeue-domain.app.js +0 -64
  317. package/dist/apps/requeue-domain.app.js.map +0 -1
  318. package/dist/apps/seed.app.js +0 -69
  319. package/dist/apps/seed.app.js.map +0 -1
  320. package/dist/apps/startup.app.js +0 -64
  321. package/dist/apps/startup.app.js.map +0 -1
  322. package/dist/apps/unarchive-urls.app.js +0 -83
  323. package/dist/apps/unarchive-urls.app.js.map +0 -1
  324. package/dist/classes/cleaner.js +0 -266
  325. package/dist/classes/cleaner.js.map +0 -1
  326. package/dist/classes/crawler.js +0 -422
  327. package/dist/classes/crawler.js.map +0 -1
  328. package/dist/classes/dns.js.map +0 -1
  329. package/dist/classes/expirer.js +0 -121
  330. package/dist/classes/expirer.js.map +0 -1
  331. package/dist/classes/expiry.js.map +0 -1
  332. package/dist/classes/lists.js.map +0 -1
  333. package/dist/classes/robot.js +0 -82
  334. package/dist/classes/robot.js.map +0 -1
  335. package/dist/classes/tracker.js +0 -120
  336. package/dist/classes/tracker.js.map +0 -1
  337. package/dist/cli.js.map +0 -1
  338. package/dist/enums/eavailable-strategy.js.map +0 -1
  339. package/dist/enums/elist.js.map +0 -1
  340. package/dist/enums/eserver.js.map +0 -1
  341. package/dist/enums/ex-powered-by.js.map +0 -1
  342. package/dist/helpers/matcher.js.map +0 -1
  343. package/dist/helpers/random.js.map +0 -1
  344. package/dist/helpers/utf-decoder.js.map +0 -1
  345. package/dist/interfaces/iexpiry.js.map +0 -1
  346. package/dist/interfaces/imatch.js.map +0 -1
  347. package/dist/interfaces/iparser-config.js.map +0 -1
  348. package/dist/interfaces/iparser.js +0 -2
  349. package/dist/interfaces/iparser.js.map +0 -1
  350. package/dist/interfaces/irequest-outcome.js +0 -2
  351. package/dist/interfaces/irequest-outcome.js.map +0 -1
  352. package/dist/interfaces/iserver.js +0 -2
  353. package/dist/interfaces/iserver.js.map +0 -1
  354. package/dist/parsers/accessibility-metrics.parser.d.ts +0 -11
  355. package/dist/parsers/accessibility-metrics.parser.js +0 -40
  356. package/dist/parsers/accessibility-metrics.parser.js.map +0 -1
  357. package/dist/parsers/asp-error.parser.d.ts +0 -12
  358. package/dist/parsers/asp-error.parser.js +0 -48
  359. package/dist/parsers/asp-error.parser.js.map +0 -1
  360. package/dist/parsers/bad-words.parser.js +0 -27
  361. package/dist/parsers/bad-words.parser.js.map +0 -1
  362. package/dist/parsers/complex-english.parser.d.ts +0 -15
  363. package/dist/parsers/complex-english.parser.js +0 -61
  364. package/dist/parsers/complex-english.parser.js.map +0 -1
  365. package/dist/parsers/data.parser.d.ts +0 -14
  366. package/dist/parsers/data.parser.js.map +0 -1
  367. package/dist/parsers/dictionary.parser.js +0 -73
  368. package/dist/parsers/dictionary.parser.js.map +0 -1
  369. package/dist/parsers/html.parser.d.ts +0 -13
  370. package/dist/parsers/html.parser.js.map +0 -1
  371. package/dist/parsers/hyperlinks.parser.d.ts +0 -20
  372. package/dist/parsers/hyperlinks.parser.js +0 -115
  373. package/dist/parsers/hyperlinks.parser.js.map +0 -1
  374. package/dist/parsers/image-tags.parser.d.ts +0 -19
  375. package/dist/parsers/image-tags.parser.js +0 -52
  376. package/dist/parsers/image-tags.parser.js.map +0 -1
  377. package/dist/parsers/interest.parser.js +0 -69
  378. package/dist/parsers/interest.parser.js.map +0 -1
  379. package/dist/parsers/jpeg.parser.d.ts +0 -11
  380. package/dist/parsers/jpeg.parser.js +0 -39
  381. package/dist/parsers/jpeg.parser.js.map +0 -1
  382. package/dist/parsers/llama-guard.parser.js +0 -65
  383. package/dist/parsers/llama-guard.parser.js.map +0 -1
  384. package/dist/parsers/offence.parser.js +0 -69
  385. package/dist/parsers/offence.parser.js.map +0 -1
  386. package/dist/parsers/ollama.parser.js +0 -51
  387. package/dist/parsers/ollama.parser.js.map +0 -1
  388. package/dist/parsers/paragraphs.parser.js +0 -49
  389. package/dist/parsers/paragraphs.parser.js.map +0 -1
  390. package/dist/parsers/parser.js +0 -57
  391. package/dist/parsers/parser.js.map +0 -1
  392. package/dist/parsers/php-error.parser.d.ts +0 -12
  393. package/dist/parsers/php-error.parser.js +0 -52
  394. package/dist/parsers/php-error.parser.js.map +0 -1
  395. package/dist/parsers/phrase.parser.js +0 -26
  396. package/dist/parsers/phrase.parser.js.map +0 -1
  397. package/dist/parsers/regex.parser.js +0 -43
  398. package/dist/parsers/regex.parser.js.map +0 -1
  399. package/dist/parsers/server.parser.d.ts +0 -11
  400. package/dist/parsers/server.parser.js +0 -67
  401. package/dist/parsers/server.parser.js.map +0 -1
  402. package/dist/parsers/spelling.parser.js +0 -27
  403. package/dist/parsers/spelling.parser.js.map +0 -1
  404. package/dist/parsers/string.parser.d.ts +0 -8
  405. package/dist/parsers/string.parser.js.map +0 -1
  406. package/dist/parsers/text.parser.js +0 -41
  407. package/dist/parsers/text.parser.js.map +0 -1
  408. package/dist/parsers/words.parser.js +0 -40
  409. package/dist/parsers/words.parser.js.map +0 -1
  410. package/dist/queries/complex-english.query.d.ts +0 -2
  411. package/dist/queries/complex-english.query.js.map +0 -1
  412. package/dist/queries/flash-content.query.d.ts +0 -2
  413. package/dist/queries/flash-content.query.js +0 -82
  414. package/dist/queries/flash-content.query.js.map +0 -1
  415. package/dist/queries/linking-to-domains.query.d.ts +0 -2
  416. package/dist/queries/linking-to-domains.query.js +0 -130
  417. package/dist/queries/linking-to-domains.query.js.map +0 -1
  418. package/dist/queries/llamaguard-unsafe-content.query.d.ts +0 -2
  419. package/dist/queries/llamaguard-unsafe-content.query.js +0 -92
  420. package/dist/queries/llamaguard-unsafe-content.query.js.map +0 -1
  421. package/dist/queries/readability-score.query.d.ts +0 -2
  422. package/dist/queries/readability-score.query.js.map +0 -1
  423. package/dist/servers/crawl.server.js +0 -198
  424. package/dist/servers/crawl.server.js.map +0 -1
  425. package/dist/servers/express.server.js +0 -13
  426. package/dist/servers/express.server.js.map +0 -1
  427. package/dist/servers/maintenance.server.js +0 -103
  428. package/dist/servers/maintenance.server.js.map +0 -1
  429. package/dist/servers/rest.server.js +0 -46
  430. package/dist/servers/rest.server.js.map +0 -1
  431. package/dist/servers/socket-io.server.js +0 -61
  432. package/dist/servers/socket-io.server.js.map +0 -1
  433. package/dist/services/database.service.js +0 -795
  434. package/dist/services/database.service.js.map +0 -1
  435. package/dist/services/ollama-rest.service.js +0 -46
  436. package/dist/services/ollama-rest.service.js.map +0 -1
  437. package/dist/services/rig-llama-guard.service.js.map +0 -1
  438. package/dist/services/rig-queue-length.service.js +0 -22
  439. package/dist/services/rig-queue-length.service.js.map +0 -1
  440. package/dist/services/rig-subjectivity-scale.service.js +0 -96
  441. package/dist/services/rig-subjectivity-scale.service.js.map +0 -1
  442. package/dist/services/rig-ticket-rest.service.js +0 -29
  443. package/dist/services/rig-ticket-rest.service.js.map +0 -1
  444. package/dist/services/rig-ticketed-promise.service.js.map +0 -1
  445. package/dist/types/tcrawl-config.js.map +0 -1
  446. package/dist/types/thydra-config.js.map +0 -1
  447. package/dist/types/tparser-ctor.d.ts +0 -7
  448. package/dist/types/tparser-ctor.js +0 -2
  449. package/dist/types/tparser-ctor.js.map +0 -1
  450. package/dist/types/tquery.d.ts +0 -7
  451. package/dist/types/tquery.js +0 -2
  452. package/dist/types/tquery.js.map +0 -1
  453. package/dist/types/tqueue-length.js +0 -2
  454. package/dist/types/tqueue-length.js.map +0 -1
  455. package/dist/types/trobots-config.js.map +0 -1
  456. /package/dist/classes/{dns.d.ts → dns.d.mts} +0 -0
  457. /package/dist/{cli.d.ts → cli.d.mts} +0 -0
  458. /package/dist/enums/{eavailable-strategy.d.ts → eavailable-strategy.d.mts} +0 -0
  459. /package/dist/enums/{elist.d.ts → elist.d.mts} +0 -0
  460. /package/dist/enums/{eserver.d.ts → eserver.d.mts} +0 -0
  461. /package/dist/enums/{ex-powered-by.d.ts → ex-powered-by.d.mts} +0 -0
  462. /package/dist/interfaces/{imatch.d.ts → imatch.d.mts} +0 -0
  463. /package/dist/interfaces/{iparser-config.d.ts → iparser-config.d.mts} +0 -0
  464. /package/dist/interfaces/{iserver.d.ts → iserver.d.mts} +0 -0
  465. /package/dist/types/{tcrawl-config.d.ts → tcrawl-config.d.mts} +0 -0
  466. /package/dist/types/{thydra-config.d.ts → thydra-config.d.mts} +0 -0
  467. /package/dist/types/{tqueue-length.d.ts → tqueue-length.d.mts} +0 -0
  468. /package/dist/types/{trobots-config.d.ts → trobots-config.d.mts} +0 -0
@@ -0,0 +1,418 @@
1
+ import { URL } from 'url';
2
+ import * as http from 'http';
3
+ import * as https from 'https';
4
+ import { commonsMapToObject, commonsTypeHasPropertyString } from 'tscommons-esm-core';
5
+ import { commonsAsyncAbortTimeout, commonsAsyncTimeout } from 'tscommons-esm-async';
6
+ import { EStatus } from 'hydra-crawler-esm-assets';
7
+ import { commonsLogAlert, commonsLogDebug, commonsLogError, commonsLogInfo } from 'nodecommons-esm-log';
8
+ import { commonsGracefulAbortAddCallback, commonsGracefulAbortRemoveCallback } from 'nodecommons-esm-process';
9
+ import { commonsHashMd5 } from 'nodecommons-esm-security';
10
+ import { Robot } from '../classes/robot.mjs';
11
+ import { Random } from '../helpers/random.mjs';
12
+ import { EList } from '../enums/elist.mjs';
13
+ import { Dns } from './dns.mjs';
14
+ export class Crawler {
15
+ domain;
16
+ database;
17
+ crawlConfig;
18
+ parsersConfig;
19
+ robotsConfig;
20
+ parsers;
21
+ lists;
22
+ tracker;
23
+ static applyMasqueradeHeaders(request) {
24
+ request.setHeader('Accept', 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8');
25
+ request.setHeader('Accept-Encoding', 'identity');
26
+ request.setHeader('Connection', 'close');
27
+ request.setHeader('User-Agent', 'Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Ubuntu Chromium/68.0.3440.106 Chrome/68.0.3440.106 Safari/537.36 (UoM Hydra)');
28
+ }
29
+ static request(handler, url, connectTimeout, maxFileSize, tracker) {
30
+ return new Promise((resolve, reject) => {
31
+ const start = new Date().getTime();
32
+ let exceeded = false;
33
+ let completed = false;
34
+ let timedOut = false;
35
+ const timedOutMessage = `Timeout on crawl of ${url}`;
36
+ const secondaryTimeoutId = `crawler_${url}_secondary_timeout`;
37
+ commonsAsyncTimeout(connectTimeout + 60000, secondaryTimeoutId)
38
+ .then(() => {
39
+ if (timedOut || completed)
40
+ return;
41
+ commonsLogDebug(`Secondary timeout for ${url}`);
42
+ timedOut = true;
43
+ reject(new Error(timedOutMessage));
44
+ return;
45
+ })
46
+ .catch((e) => {
47
+ if (e.message === 'abortTimeout called')
48
+ return;
49
+ commonsLogDebug('debug position 10');
50
+ console.log(e);
51
+ throw e;
52
+ });
53
+ const req = handler.request(url, (res) => {
54
+ // likely unnecessary due to doing it below, but doesn't hurt to do it twice
55
+ req.setTimeout(connectTimeout);
56
+ res.setTimeout(connectTimeout);
57
+ const end = new Date().getTime();
58
+ const latency = end - start;
59
+ // always check for a body, even in 4xx 3xx etc.
60
+ let read = 0;
61
+ const data = [];
62
+ res.on('data', (chunk) => {
63
+ if (read > maxFileSize) {
64
+ if (!exceeded) {
65
+ exceeded = true;
66
+ res.destroy();
67
+ commonsLogAlert(`Exceeded maxFileSize for URL: ${url}`);
68
+ }
69
+ return;
70
+ }
71
+ data.push(chunk);
72
+ read += chunk.length;
73
+ if (tracker)
74
+ tracker.bandwidth(chunk.length);
75
+ });
76
+ res.on('end', () => {
77
+ if (timedOut || completed)
78
+ return;
79
+ completed = true;
80
+ commonsAsyncAbortTimeout(secondaryTimeoutId);
81
+ resolve({
82
+ latency: latency,
83
+ // eslint-disable-next-line @typescript-eslint/no-unsafe-assignment
84
+ ip: res['remoteIp'],
85
+ statusCode: res.statusCode || 599,
86
+ headers: res.headers,
87
+ data: Buffer.concat(data),
88
+ exceeded: exceeded
89
+ });
90
+ });
91
+ // not sure if this event actually occurs, as opposed to req error below
92
+ res.on('error', (err) => {
93
+ if (timedOut || completed)
94
+ return;
95
+ commonsAsyncAbortTimeout(secondaryTimeoutId);
96
+ reject(err);
97
+ });
98
+ });
99
+ req.setTimeout(connectTimeout);
100
+ Crawler.applyMasqueradeHeaders(req);
101
+ req.on('timeout', () => {
102
+ if (timedOut || completed)
103
+ return;
104
+ timedOut = true;
105
+ req.destroy();
106
+ commonsAsyncAbortTimeout(secondaryTimeoutId);
107
+ reject(new Error(timedOutMessage));
108
+ });
109
+ req.on('response', (res) => {
110
+ res['remoteIp'] = res.connection.remoteAddress;
111
+ });
112
+ req.on('error', (err) => {
113
+ if (timedOut || completed)
114
+ return;
115
+ commonsAsyncAbortTimeout(secondaryTimeoutId);
116
+ reject(err);
117
+ });
118
+ req.on('socket', (socket) => {
119
+ socket.setTimeout(connectTimeout);
120
+ socket.on('timeout', () => {
121
+ if (timedOut || completed)
122
+ return;
123
+ commonsAsyncAbortTimeout(secondaryTimeoutId);
124
+ timedOut = true;
125
+ req.destroy();
126
+ reject(new Error(timedOutMessage));
127
+ });
128
+ });
129
+ req.end();
130
+ });
131
+ }
132
+ static pruneHeaders(headers, keepHeaders) {
133
+ const map = new Map();
134
+ const keys = [];
135
+ for (const k of keepHeaders) {
136
+ const kt = k.split(':');
137
+ keys.push({ key: kt[0], type: kt[1] });
138
+ }
139
+ for (const key of keys) {
140
+ if (!Object.keys(headers).includes(key.key))
141
+ continue;
142
+ if (!commonsTypeHasPropertyString(headers, key.key))
143
+ continue;
144
+ const value = headers[key.key];
145
+ switch (key.type) {
146
+ case 'string':
147
+ map.set(key.key, value.toString());
148
+ break;
149
+ case 'number':
150
+ map.set(key.key, parseInt(value, 10));
151
+ break;
152
+ case 'date':
153
+ map.set(key.key, new Date(value));
154
+ break;
155
+ default: throw new Error('unknown header key type');
156
+ }
157
+ }
158
+ return map;
159
+ }
160
+ isPaused = false;
161
+ isAborted = false;
162
+ constructor(domain, database, crawlConfig, parsersConfig, robotsConfig, parsers, lists, tracker) {
163
+ this.domain = domain;
164
+ this.database = database;
165
+ this.crawlConfig = crawlConfig;
166
+ this.parsersConfig = parsersConfig;
167
+ this.robotsConfig = robotsConfig;
168
+ this.parsers = parsers;
169
+ this.lists = lists;
170
+ this.tracker = tracker;
171
+ }
172
+ abort() {
173
+ this.isAborted = true;
174
+ commonsAsyncAbortTimeout(`crawl_${this.domain}`);
175
+ }
176
+ pause() {
177
+ commonsLogAlert(`Pausing crawler for ${this.domain}`);
178
+ this.isPaused = true;
179
+ }
180
+ resume() {
181
+ commonsLogInfo(`Resuming crawler for ${this.domain}`);
182
+ this.isPaused = false;
183
+ }
184
+ async fetch(url, setDomainIp) {
185
+ commonsLogInfo(`Fetching ${url}`);
186
+ const whatwg = new URL(url);
187
+ let handler;
188
+ switch (whatwg.protocol) {
189
+ case 'http:':
190
+ handler = http;
191
+ break;
192
+ case 'https:':
193
+ handler = https;
194
+ break;
195
+ default:
196
+ throw new Error(`unable to handle protocol ${whatwg.protocol}`);
197
+ }
198
+ let outcome;
199
+ // eslint-disable-next-line no-useless-catch
200
+ try {
201
+ outcome = await Crawler.request(handler, url, this.crawlConfig.connectTimeout, this.crawlConfig.maxFileSize, this.tracker);
202
+ }
203
+ catch (ex) {
204
+ //if (!/^Timeout on crawl of/.test(ex.message)) console.error(ex);
205
+ throw ex;
206
+ }
207
+ if (setDomainIp) {
208
+ await this.database.domain(whatwg.hostname, outcome.ip);
209
+ if (this.tracker)
210
+ this.tracker.domain();
211
+ }
212
+ await this.database.setStatusCode(url, outcome.statusCode);
213
+ const headers = Crawler.pruneHeaders(outcome.headers, this.crawlConfig.keepHeaders);
214
+ if (!headers.has('content-length') && outcome.data !== undefined)
215
+ headers.set('content-length', outcome.data.length);
216
+ await this.database.setHeaders(url, commonsMapToObject(headers));
217
+ const outgoing = [];
218
+ if (outcome.statusCode >= 300
219
+ && outcome.statusCode < 400
220
+ && headers.has('location')
221
+ && this.lists.match(EList.ALLOW, url) // only queue redirects for allowlist urls
222
+ ) {
223
+ // redirect codes
224
+ const location = new URL(headers.get('location'), url);
225
+ if (location.protocol.match(/^http(s?):$/)) {
226
+ const added = await this.database.queue(location.toString(), this.lists.match(EList.DENY, location.toString()));
227
+ if (added && this.tracker)
228
+ this.tracker.delta(this.lists.match(EList.DENY, location.toString()) ? EStatus.DENY : EStatus.QUEUED, 1);
229
+ if (location.toString() !== url)
230
+ outgoing.push(location.toString());
231
+ }
232
+ }
233
+ if (outcome.data) {
234
+ const hash = commonsHashMd5(outcome.data);
235
+ const existing = await this.database.getHash(url);
236
+ if (hash !== existing)
237
+ await this.database.setHash(url, hash);
238
+ }
239
+ if (outcome.data && outcome.data.length && headers.has('content-type')) {
240
+ const contentType = headers.get('content-type');
241
+ const isAllow = this.lists.match(EList.ALLOW, url);
242
+ for (const ctor of this.parsers) {
243
+ const parser = new ctor(url, outcome, this.parsersConfig);
244
+ if (!parser.isEnabled())
245
+ continue;
246
+ if (!parser.supports(contentType, isAllow))
247
+ continue;
248
+ try {
249
+ await parser.parse(this.database);
250
+ }
251
+ catch (ex) {
252
+ commonsLogDebug('debug position 3');
253
+ console.log(ex);
254
+ }
255
+ if (isAllow) {
256
+ try {
257
+ const links = await parser.links();
258
+ if (links.length === 0)
259
+ continue;
260
+ for (const link of links) {
261
+ if (link === url)
262
+ continue;
263
+ try {
264
+ outgoing.push(link);
265
+ }
266
+ catch (_ex) { /* do nothing */ }
267
+ }
268
+ }
269
+ catch (ex) {
270
+ commonsLogDebug('debug position 2');
271
+ console.log(ex);
272
+ }
273
+ }
274
+ }
275
+ }
276
+ for (const link of outgoing) {
277
+ const added = await this.database.queue(link, this.lists.match(EList.DENY, link));
278
+ if (added && this.tracker)
279
+ this.tracker.delta(this.lists.match(EList.DENY, link) ? EStatus.DENY : EStatus.QUEUED, 1);
280
+ }
281
+ await this.database.link(url, outgoing);
282
+ if (this.tracker)
283
+ this.tracker.link(outgoing.length);
284
+ return outcome.statusCode;
285
+ }
286
+ async crawl() {
287
+ const gracefulAbortId = commonsGracefulAbortAddCallback(() => {
288
+ commonsLogAlert(`SIGINT abort flag is set. Aborting crawler ${this.domain}.`);
289
+ this.abort();
290
+ });
291
+ try {
292
+ try {
293
+ await Dns.resolve(this.domain, this.crawlConfig.connectTimeout);
294
+ }
295
+ catch (ex) {
296
+ if (ex.message === 'DNS timeout' && !this.crawlConfig.treatTimeoutDnsAsDead) {
297
+ commonsLogError(`DNS timed out for ${this.domain}. Will allow reattempts`);
298
+ return;
299
+ }
300
+ commonsLogError(`Domain ${this.domain} is dead.`);
301
+ await this.database.markDead(this.domain);
302
+ return;
303
+ }
304
+ const robots = new Robot(this.domain, this.crawlConfig, this.robotsConfig, this.tracker);
305
+ await robots.load();
306
+ let tally = 0;
307
+ while (true) {
308
+ if (this.isAborted)
309
+ break;
310
+ if (this.isPaused) {
311
+ await commonsAsyncTimeout(1000);
312
+ continue;
313
+ }
314
+ const url = await this.database.next(this.domain);
315
+ if (!url) {
316
+ commonsLogInfo(`Crawl for ${this.domain} completed.`);
317
+ break;
318
+ }
319
+ await this.database.unsetFailReason(url);
320
+ if (this.tracker)
321
+ this.tracker.delta(EStatus.QUEUED, -1);
322
+ if (this.lists.match(EList.DENY, url)) {
323
+ await this.database.setStatus(url, EStatus.DENY);
324
+ await this.database.unsetTtl(url);
325
+ if (this.tracker)
326
+ this.tracker.delta(EStatus.DENY, 1);
327
+ // To get here, a url was queued but is now denylisted.
328
+ // It may have had outgoings, so remove any that were there.
329
+ await this.database.link(url, []);
330
+ continue;
331
+ }
332
+ if (robots.isDisallowed(url)) {
333
+ await this.database.setStatus(url, EStatus.DISALLOWED);
334
+ await this.database.unsetTtl(url);
335
+ if (this.tracker)
336
+ this.tracker.delta(EStatus.DISALLOWED, 1);
337
+ // To get here, a url was queued but is now disallowed.
338
+ // It may have had outgoings, so remove any that were there.
339
+ await this.database.link(url, []);
340
+ continue;
341
+ }
342
+ if (!await this.database.setStatus(url, EStatus.ACTIVE)) {
343
+ commonsLogError(`Unable to set status to active for ${url}. Aborting crawler.`);
344
+ break;
345
+ }
346
+ if (this.tracker)
347
+ this.tracker.delta(EStatus.ACTIVE, 1);
348
+ if (tally > 0) {
349
+ try {
350
+ const timeout = Random.randomise(this.crawlConfig.betweenFetchDelay, this.crawlConfig);
351
+ await commonsAsyncTimeout(timeout, `crawl_${this.domain}`);
352
+ while (this.isPaused && !this.isAborted) {
353
+ await commonsAsyncTimeout(1000);
354
+ }
355
+ }
356
+ catch (_ex) { /* ignore */ }
357
+ }
358
+ if (this.isAborted)
359
+ break;
360
+ if (this.tracker)
361
+ await this.tracker.fetching(url);
362
+ try {
363
+ const statusCode = await this.fetch(url, tally === 0);
364
+ if (this.tracker)
365
+ await this.tracker.done(url, statusCode);
366
+ await this.database.setStatus(url, EStatus.DONE);
367
+ await this.database.unsetTtl(url);
368
+ if (this.tracker)
369
+ this.tracker.delta(EStatus.DONE, 1);
370
+ }
371
+ catch (ex) {
372
+ if (this.tracker)
373
+ await this.tracker.failed(url);
374
+ const ttl = await this.database.getTtl(url) || 0;
375
+ if (ttl < this.crawlConfig.maxFailedTtl) {
376
+ await this.database.setTtl(url, ttl + 1);
377
+ await this.database.setStatus(url, EStatus.QUEUED);
378
+ if (this.tracker)
379
+ this.tracker.delta(EStatus.QUEUED, 1);
380
+ }
381
+ else {
382
+ await this.database.setStatus(url, EStatus.FAILED);
383
+ if (this.tracker)
384
+ this.tracker.delta(EStatus.FAILED, 1);
385
+ if (commonsTypeHasPropertyString(ex, 'code')) {
386
+ await this.database.setFailReason(url, ex.code);
387
+ }
388
+ else if (commonsTypeHasPropertyString(ex, 'message')) {
389
+ if (/^Timeout on crawl/.test(ex.message)) {
390
+ await this.database.setFailReason(url, 'TIMEOUT');
391
+ }
392
+ else {
393
+ await this.database.setFailReason(url, ex.message);
394
+ }
395
+ }
396
+ }
397
+ }
398
+ finally {
399
+ if (this.tracker)
400
+ this.tracker.delta(EStatus.ACTIVE, -1);
401
+ }
402
+ tally++;
403
+ if (tally >= this.crawlConfig.maxFetchesPerCrawl) {
404
+ commonsLogAlert(`Crawl for ${this.domain} reached the maximum permitted fetches for this session.`);
405
+ break;
406
+ }
407
+ }
408
+ }
409
+ catch (e) {
410
+ commonsLogDebug('debug position 1');
411
+ console.log(e);
412
+ }
413
+ finally {
414
+ commonsGracefulAbortRemoveCallback(gracefulAbortId);
415
+ }
416
+ }
417
+ }
418
+ //# sourceMappingURL=crawler.mjs.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"crawler.mjs","sourceRoot":"","sources":["../../src/classes/crawler.mts"],"names":[],"mappings":"AACA,OAAO,EAAE,GAAG,EAAE,MAAM,KAAK,CAAC;AAC1B,OAAO,KAAK,IAAI,MAAM,MAAM,CAAC;AAC7B,OAAO,KAAK,KAAK,MAAM,OAAO,CAAC;AAG/B,OAAO,EAAE,kBAAkB,EAAE,4BAA4B,EAAE,MAAM,oBAAoB,CAAC;AAEtF,OAAO,EAAE,wBAAwB,EAAE,mBAAmB,EAAE,MAAM,qBAAqB,CAAC;AAEpF,OAAO,EAAE,OAAO,EAAE,MAAM,0BAA0B,CAAC;AAEnD,OAAO,EAAE,eAAe,EAAE,eAAe,EAAE,eAAe,EAAE,cAAc,EAAE,MAAM,qBAAqB,CAAC;AACxG,OAAO,EAAE,+BAA+B,EAAE,kCAAkC,EAAE,MAAM,yBAAyB,CAAC;AAC9G,OAAO,EAAE,cAAc,EAAE,MAAM,0BAA0B,CAAC;AAG1D,OAAO,EAAE,KAAK,EAAE,MAAM,sBAAsB,CAAC;AAK7C,OAAO,EAAE,MAAM,EAAE,MAAM,uBAAuB,CAAC;AAU/C,OAAO,EAAE,KAAK,EAAE,MAAM,oBAAoB,CAAC;AAE3C,OAAO,EAAE,GAAG,EAAE,MAAM,WAAW,CAAC;AAEhC,MAAM,OAAO,OAAO;IAsMT;IACA;IACA;IACA;IACA;IACA;IACA;IACA;IA5MH,MAAM,CAAC,sBAAsB,CAAC,OAA2B;QAC/D,OAAO,CAAC,SAAS,CAAC,QAAQ,EAAE,uFAAuF,CAAC,CAAC;QACrH,OAAO,CAAC,SAAS,CAAC,iBAAiB,EAAE,UAAU,CAAC,CAAC;QACjD,OAAO,CAAC,SAAS,CAAC,YAAY,EAAE,OAAO,CAAC,CAAC;QACzC,OAAO,CAAC,SAAS,CAAC,YAAY,EAAE,qJAAqJ,CAAC,CAAC;IACxL,CAAC;IAEM,MAAM,CAAC,OAAO,CACnB,OAAiC,EACjC,GAAW,EACX,cAAsB,EACtB,WAAmB,EACnB,OAAiB;QAElB,OAAO,IAAI,OAAO,CAAkB,CAAC,OAAqC,EAAE,MAA0B,EAAQ,EAAE;YAC/G,MAAM,KAAK,GAAW,IAAI,IAAI,EAAE,CAAC,OAAO,EAAE,CAAC;YAC3C,IAAI,QAAQ,GAAY,KAAK,CAAC;YAE9B,IAAI,SAAS,GAAY,KAAK,CAAC;YAC/B,IAAI,QAAQ,GAAY,KAAK,CAAC;YAC9B,MAAM,eAAe,GAAW,uBAAuB,GAAG,EAAE,CAAC;YAE7D,MAAM,kBAAkB,GAAW,WAAW,GAAG,oBAAoB,CAAC;YACtE,mBAAmB,CACjB,cAAc,GAAG,KAAK,EACtB,kBAAkB,CACnB;iBACE,IAAI,CAAC,GAAS,EAAE;gBAChB,IAAI,QAAQ,IAAI,SAAS;oBAAE,OAAO;gBAElC,eAAe,CAAC,yBAAyB,GAAG,EAAE,CAAC,CAAC;gBAEhD,QAAQ,GAAG,IAAI,CAAC;gBAChB,MAAM,CAAC,IAAI,KAAK,CAAC,eAAe,CAAC,CAAC,CAAC;gBACnC,OAAO;YACR,CAAC,CAAC;iBACD,KAAK,CAAC,CAAC,CAAQ,EAAQ,EAAE;gBACzB,IAAI,CAAC,CAAC,OAAO,KAAK,qBAAqB;oBAAE,OAAO;gBAChD,eAAe,CAAC,mBAAmB,CAAC,CAAC;gBACrC,OAAO,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;gBACf,MAAM,CAAC,CAAC;YACT,CAAC,CAAC,CAAC;YAEL,MAAM,GAAG,GAAuB,OAAO,CAAC,OAAO,CAC7C,GAAG,EACH,CAAC,GAAyB,EAAQ,EAAE;gBACnC,4EAA4E;gBAC5E,GAAG,CAAC,UAAU,CAAC,cAAc,CAAC,CAAC;gBAE/B,GAAG,CAAC,UAAU,CAAC,cAAc,CAAC,CAAC;gBAE/B,MAAM,GAAG,GAAW,IAAI,IAAI,EAAE,CAAC,OAAO,EAAE,CAAC;gBACzC,MAAM,OAAO,GAAW,GAAG,GAAG,KAAK,CAAC;gBAEpC,gDAAgD;gBAEhD,IAAI,IAAI,GAAW,CAAC,CAAC;gBACrB,MAAM,IAAI,GAAa,EAAE,CAAC;gBAC1B,GAAG,CAAC,EAAE,CACJ,MAAM,EACN,CAAC,KAAa,EAAQ,EAAE;oBACvB,IAAI,IAAI,GAAG,WAAW,EAAE,CAAC;wBACxB,IAAI,CAAC,QAAQ,EAAE,CAAC;4BACf,QAAQ,GAAG,IAAI,CAAC;4BAChB,GAAG,CAAC,OAAO,EAAE,CAAC;4BAEd,eAAe,CAAC,iCAAiC,GAAG,EAAE,CAAC,CAAC;wBACzD,CAAC;wBAED,OAAO;oBACR,CAAC;oBACD,IAAI,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;oBACjB,IAAI,IAAI,KAAK,CAAC,MAAM,CAAC;oBACrB,IAAI,OAAO;wBAAE,OAAO,CAAC,SAAS,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC;gBAC9C,CAAC,CACF,CAAC;gBACF,GAAG,CAAC,EAAE,CACJ,KAAK,EACL,GAAS,EAAE;oBACV,IAAI,QAAQ,IAAI,SAAS;wBAAE,OAAO;oBAElC,SAAS,GAAG,IAAI,CAAC;oBAEjB,wBAAwB,CAAC,kBAAkB,CAAC,CAAC;oBAE7C,OAAO,CAAC;wBACN,OAAO,EAAE,OAAO;wBAChB,mEAAmE;wBACnE,EAAE,EAAG,GAAuB,CAAC,UAAU,CAAC;wBACxC,UAAU,EAAE,GAAG,CAAC,UAAU,IAAI,GAAG;wBACjC,OAAO,EAAE,GAAG,CAAC,OAAO;wBACpB,IAAI,EAAE,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC;wBACzB,QAAQ,EAAE,QAAQ;qBACnB,CAAC,CAAC;gBACJ,CAAC,CACF,CAAC;gBAEF,wEAAwE;gBACxE,GAAG,CAAC,EAAE,CACJ,OAAO,EACP,CAAC,GAAU,EAAQ,EAAE;oBACpB,IAAI,QAAQ,IAAI,SAAS;wBAAE,OAAO;oBAElC,wBAAwB,CAAC,kBAAkB,CAAC,CAAC;oBAE7C,MAAM,CAAC,GAAG,CAAC,CAAC;gBACb,CAAC,CACF,CAAC;YACH,CAAC,CACF,CAAC;YAEF,GAAG,CAAC,UAAU,CAAC,cAAc,CAAC,CAAC;YAE/B,OAAO,CAAC,sBAAsB,CAAC,GAAG,CAAC,CAAC;YAEpC,GAAG,CAAC,EAAE,CAAC,SAAS,EAAE,GAAS,EAAE;gBAC5B,IAAI,QAAQ,IAAI,SAAS;oBAAE,OAAO;gBAElC,QAAQ,GAAG,IAAI,CAAC;gBAChB,GAAG,CAAC,OAAO,EAAE,CAAC;gBAEd,wBAAwB,CAAC,kBAAkB,CAAC,CAAC;gBAE7C,MAAM,CAAC,IAAI,KAAK,CAAC,eAAe,CAAC,CAAC,CAAC;YACpC,CAAC,CAAC,CAAC;YAEH,GAAG,CAAC,EAAE,CACJ,UAAU,EACV,CAAC,GAAyB,EAAQ,EAAE;gBAClC,GAAuB,CAAC,UAAU,CAAC,GAAG,GAAG,CAAC,UAAU,CAAC,aAAa,CAAC;YACrE,CAAC,CACF,CAAC;YAEF,GAAG,CAAC,EAAE,CACJ,OAAO,EACP,CAAC,GAAU,EAAQ,EAAE;gBACpB,IAAI,QAAQ,IAAI,SAAS;oBAAE,OAAO;gBAElC,wBAAwB,CAAC,kBAAkB,CAAC,CAAC;gBAE7C,MAAM,CAAC,GAAG,CAAC,CAAC;YACb,CAAC,CACF,CAAC;YAEF,GAAG,CAAC,EAAE,CACJ,QAAQ,EACR,CAAC,MAAc,EAAQ,EAAE;gBACxB,MAAM,CAAC,UAAU,CAAC,cAAc,CAAC,CAAC;gBAClC,MAAM,CAAC,EAAE,CACP,SAAS,EACT,GAAS,EAAE;oBACV,IAAI,QAAQ,IAAI,SAAS;wBAAE,OAAO;oBAElC,wBAAwB,CAAC,kBAAkB,CAAC,CAAC;oBAE7C,QAAQ,GAAG,IAAI,CAAC;oBAChB,GAAG,CAAC,OAAO,EAAE,CAAC;oBAEd,MAAM,CAAC,IAAI,KAAK,CAAC,eAAe,CAAC,CAAC,CAAC;gBACpC,CAAC,CACF,CAAC;YACH,CAAC,CACF,CAAC;YAEF,GAAG,CAAC,GAAG,EAAE,CAAC;QACX,CAAC,CAAC,CAAC;IACJ,CAAC;IAEO,MAAM,CAAC,YAAY,CAAC,OAA4B,EAAE,WAAqB;QAC9E,MAAM,GAAG,GAAoC,IAAI,GAAG,EAA8B,CAAC;QAEnF,MAAM,IAAI,GAAoC,EAAE,CAAC;QACjD,KAAK,MAAM,CAAC,IAAI,WAAW,EAAE,CAAC;YAC7B,MAAM,EAAE,GAAa,CAAC,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC;YAClC,IAAI,CAAC,IAAI,CAAC,EAAE,GAAG,EAAE,EAAE,CAAC,CAAC,CAAC,EAAE,IAAI,EAAE,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC;QACxC,CAAC;QAED,KAAK,MAAM,GAAG,IAAI,IAAI,EAAE,CAAC;YACxB,IAAI,CAAC,MAAM,CAAC,IAAI,CAAC,OAAO,CAAC,CAAC,QAAQ,CAAC,GAAG,CAAC,GAAG,CAAC;gBAAE,SAAS;YACtD,IAAI,CAAC,4BAA4B,CAAC,OAAO,EAAE,GAAG,CAAC,GAAG,CAAC;gBAAE,SAAS;YAE9D,MAAM,KAAK,GAAW,OAAO,CAAC,GAAG,CAAC,GAAG,CAAW,CAAC;YACjD,QAAQ,GAAG,CAAC,IAAI,EAAE,CAAC;gBAClB,KAAK,QAAQ;oBAAE,GAAG,CAAC,GAAG,CAAC,GAAG,CAAC,GAAG,EAAE,KAAK,CAAC,QAAQ,EAAE,CAAC,CAAC;oBAAC,MAAM;gBACzD,KAAK,QAAQ;oBAAE,GAAG,CAAC,GAAG,CAAC,GAAG,CAAC,GAAG,EAAE,QAAQ,CAAC,KAAK,EAAE,EAAE,CAAC,CAAC,CAAC;oBAAC,MAAM;gBAC5D,KAAK,MAAM;oBAAE,GAAG,CAAC,GAAG,CAAC,GAAG,CAAC,GAAG,EAAE,IAAI,IAAI,CAAC,KAAK,CAAC,CAAC,CAAC;oBAAC,MAAM;gBACtD,OAAO,CAAC,CAAC,MAAM,IAAI,KAAK,CAAC,yBAAyB,CAAC,CAAC;YACrD,CAAC;QACF,CAAC;QAED,OAAO,GAAG,CAAC;IACZ,CAAC;IAEO,QAAQ,GAAY,KAAK,CAAC;IAC1B,SAAS,GAAY,KAAK,CAAC;IAEnC,YACU,MAAc,EACd,QAAyB,EACzB,WAAyB,EACzB,aAA6C,EAC7C,YAA2B,EAC3B,OAAsB,EACtB,KAAY,EACZ,OAAiB;QAPjB,WAAM,GAAN,MAAM,CAAQ;QACd,aAAQ,GAAR,QAAQ,CAAiB;QACzB,gBAAW,GAAX,WAAW,CAAc;QACzB,kBAAa,GAAb,aAAa,CAAgC;QAC7C,iBAAY,GAAZ,YAAY,CAAe;QAC3B,YAAO,GAAP,OAAO,CAAe;QACtB,UAAK,GAAL,KAAK,CAAO;QACZ,YAAO,GAAP,OAAO,CAAU;IACxB,CAAC;IAEI,KAAK;QACZ,IAAI,CAAC,SAAS,GAAG,IAAI,CAAC;QACtB,wBAAwB,CAAC,SAAS,IAAI,CAAC,MAAM,EAAE,CAAC,CAAC;IAClD,CAAC;IAEM,KAAK;QACX,eAAe,CAAC,uBAAuB,IAAI,CAAC,MAAM,EAAE,CAAC,CAAC;QAEtD,IAAI,CAAC,QAAQ,GAAG,IAAI,CAAC;IACtB,CAAC;IAEM,MAAM;QACZ,cAAc,CAAC,wBAAwB,IAAI,CAAC,MAAM,EAAE,CAAC,CAAC;QAEtD,IAAI,CAAC,QAAQ,GAAG,KAAK,CAAC;IACvB,CAAC;IAEM,KAAK,CAAC,KAAK,CAAC,GAAW,EAAE,WAAoB;QACnD,cAAc,CAAC,YAAY,GAAG,EAAE,CAAC,CAAC;QAElC,MAAM,MAAM,GAAQ,IAAI,GAAG,CAAC,GAAG,CAAC,CAAC;QAEjC,IAAI,OAA2C,CAAC;QAChD,QAAQ,MAAM,CAAC,QAAQ,EAAE,CAAC;YACzB,KAAK,OAAO;gBAAE,OAAO,GAAG,IAAI,CAAC;gBAAC,MAAM;YACpC,KAAK,QAAQ;gBAAE,OAAO,GAAG,KAAK,CAAC;gBAAC,MAAM;YACtC;gBACC,MAAM,IAAI,KAAK,CAAC,6BAA6B,MAAM,CAAC,QAAQ,EAAE,CAAC,CAAC;QAClE,CAAC;QAED,IAAI,OAAwB,CAAC;QAC7B,4CAA4C;QAC5C,IAAI,CAAC;YACJ,OAAO,GAAG,MAAM,OAAO,CAAC,OAAO,CAC7B,OAAO,EACP,GAAG,EACH,IAAI,CAAC,WAAW,CAAC,cAAc,EAC/B,IAAI,CAAC,WAAW,CAAC,WAAW,EAC5B,IAAI,CAAC,OAAO,CACb,CAAC;QACH,CAAC;QAAC,OAAO,EAAE,EAAE,CAAC;YACb,kEAAkE;YAClE,MAAM,EAAE,CAAC;QACV,CAAC;QAED,IAAI,WAAW,EAAE,CAAC;YACjB,MAAM,IAAI,CAAC,QAAQ,CAAC,MAAM,CAAC,MAAM,CAAC,QAAQ,EAAE,OAAO,CAAC,EAAE,CAAC,CAAC;YACxD,IAAI,IAAI,CAAC,OAAO;gBAAE,IAAI,CAAC,OAAO,CAAC,MAAM,EAAE,CAAC;QACzC,CAAC;QAED,MAAM,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,GAAG,EAAE,OAAO,CAAC,UAAU,CAAC,CAAC;QAE3D,MAAM,OAAO,GAAoC,OAAO,CAAC,YAAY,CAAC,OAAO,CAAC,OAAO,EAAE,IAAI,CAAC,WAAW,CAAC,WAAW,CAAC,CAAC;QACrH,IAAI,CAAC,OAAO,CAAC,GAAG,CAAC,gBAAgB,CAAC,IAAI,OAAO,CAAC,IAAI,KAAK,SAAS;YAAE,OAAO,CAAC,GAAG,CAAC,gBAAgB,EAAE,OAAO,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;QACrH,MAAM,IAAI,CAAC,QAAQ,CAAC,UAAU,CAAC,GAAG,EAAE,kBAAkB,CAAC,OAAO,CAAC,CAAC,CAAC;QAEjE,MAAM,QAAQ,GAAa,EAAE,CAAC;QAE9B,IACC,OAAO,CAAC,UAAU,IAAI,GAAG;eACtB,OAAO,CAAC,UAAU,GAAG,GAAG;eACxB,OAAO,CAAC,GAAG,CAAC,UAAU,CAAC;eACvB,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,KAAK,CAAC,KAAK,EAAE,GAAG,CAAC,CAAC,0CAA0C;UAC/E,CAAC;YACF,iBAAiB;YACjB,MAAM,QAAQ,GAAQ,IAAI,GAAG,CAAC,OAAO,CAAC,GAAG,CAAC,UAAU,CAAY,EAAE,GAAG,CAAC,CAAC;YAEvE,IAAI,QAAQ,CAAC,QAAQ,CAAC,KAAK,CAAC,aAAa,CAAC,EAAE,CAAC;gBAC5C,MAAM,KAAK,GAAY,MAAM,IAAI,CAAC,QAAQ,CAAC,KAAK,CAAC,QAAQ,CAAC,QAAQ,EAAE,EAAE,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,KAAK,CAAC,IAAI,EAAE,QAAQ,CAAC,QAAQ,EAAE,CAAC,CAAC,CAAC;gBACzH,IAAI,KAAK,IAAI,IAAI,CAAC,OAAO;oBAAE,IAAI,CAAC,OAAO,CAAC,KAAK,CAAC,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,KAAK,CAAC,IAAI,EAAE,QAAQ,CAAC,QAAQ,EAAE,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,IAAI,CAAC,CAAC,CAAC,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC,CAAC;gBAEpI,IAAI,QAAQ,CAAC,QAAQ,EAAE,KAAK,GAAG;oBAAE,QAAQ,CAAC,IAAI,CAAC,QAAQ,CAAC,QAAQ,EAAE,CAAC,CAAC;YACrE,CAAC;QACF,CAAC;QAED,IAAI,OAAO,CAAC,IAAI,EAAE,CAAC;YAClB,MAAM,IAAI,GAAW,cAAc,CAAC,OAAO,CAAC,IAAI,CAAC,CAAC;YAClD,MAAM,QAAQ,GAAqB,MAAM,IAAI,CAAC,QAAQ,CAAC,OAAO,CAAC,GAAG,CAAC,CAAC;YAEpE,IAAI,IAAI,KAAK,QAAQ;gBAAE,MAAM,IAAI,CAAC,QAAQ,CAAC,OAAO,CAAC,GAAG,EAAE,IAAI,CAAC,CAAC;QAC/D,CAAC;QAED,IAAI,OAAO,CAAC,IAAI,IAAI,OAAO,CAAC,IAAI,CAAC,MAAM,IAAI,OAAO,CAAC,GAAG,CAAC,cAAc,CAAC,EAAE,CAAC;YACxE,MAAM,WAAW,GAAW,OAAO,CAAC,GAAG,CAAC,cAAc,CAAY,CAAC;YACnE,MAAM,OAAO,GAAY,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,KAAK,CAAC,KAAK,EAAE,GAAG,CAAC,CAAC;YAE5D,KAAK,MAAM,IAAI,IAAI,IAAI,CAAC,OAAO,EAAE,CAAC;gBACjC,MAAM,MAAM,GAAY,IAAI,IAAI,CAAC,GAAG,EAAE,OAAO,EAAE,IAAI,CAAC,aAAa,CAAC,CAAC;gBACnE,IAAI,CAAC,MAAM,CAAC,SAAS,EAAE;oBAAE,SAAS;gBAElC,IAAI,CAAC,MAAM,CAAC,QAAQ,CAAC,WAAW,EAAE,OAAO,CAAC;oBAAE,SAAS;gBAErD,IAAI,CAAC;oBACJ,MAAM,MAAM,CAAC,KAAK,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;gBACnC,CAAC;gBAAC,OAAO,EAAE,EAAE,CAAC;oBACb,eAAe,CAAC,kBAAkB,CAAC,CAAC;oBACpC,OAAO,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;gBACjB,CAAC;gBAED,IAAI,OAAO,EAAE,CAAC;oBACb,IAAI,CAAC;wBACJ,MAAM,KAAK,GAAa,MAAM,MAAM,CAAC,KAAK,EAAE,CAAC;wBAC7C,IAAI,KAAK,CAAC,MAAM,KAAK,CAAC;4BAAE,SAAS;wBAEjC,KAAK,MAAM,IAAI,IAAI,KAAK,EAAE,CAAC;4BAC1B,IAAI,IAAI,KAAK,GAAG;gCAAE,SAAS;4BAC3B,IAAI,CAAC;gCACJ,QAAQ,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;4BACrB,CAAC;4BAAC,OAAO,GAAG,EAAE,CAAC,CAAC,gBAAgB,CAAC,CAAC;wBACnC,CAAC;oBACF,CAAC;oBAAC,OAAO,EAAE,EAAE,CAAC;wBACb,eAAe,CAAC,kBAAkB,CAAC,CAAC;wBACpC,OAAO,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;oBACjB,CAAC;gBACF,CAAC;YACF,CAAC;QACF,CAAC;QAED,KAAK,MAAM,IAAI,IAAI,QAAQ,EAAE,CAAC;YAC7B,MAAM,KAAK,GAAY,MAAM,IAAI,CAAC,QAAQ,CAAC,KAAK,CAAC,IAAI,EAAE,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,KAAK,CAAC,IAAI,EAAE,IAAI,CAAC,CAAC,CAAC;YAC3F,IAAI,KAAK,IAAI,IAAI,CAAC,OAAO;gBAAE,IAAI,CAAC,OAAO,CAAC,KAAK,CAAC,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,KAAK,CAAC,IAAI,EAAE,IAAI,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,IAAI,CAAC,CAAC,CAAC,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC,CAAC;QACtH,CAAC;QACD,MAAM,IAAI,CAAC,QAAQ,CAAC,IAAI,CAAC,GAAG,EAAE,QAAQ,CAAC,CAAC;QAExC,IAAI,IAAI,CAAC,OAAO;YAAE,IAAI,CAAC,OAAO,CAAC,IAAI,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC;QAErD,OAAO,OAAO,CAAC,UAAU,CAAC;IAC3B,CAAC;IAEM,KAAK,CAAC,KAAK;QACjB,MAAM,eAAe,GAAW,+BAA+B,CAAC,GAAS,EAAE;YAC1E,eAAe,CAAC,8CAA8C,IAAI,CAAC,MAAM,GAAG,CAAC,CAAC;YAE9E,IAAI,CAAC,KAAK,EAAE,CAAC;QACd,CAAC,CAAC,CAAC;QAEH,IAAI,CAAC;YACJ,IAAI,CAAC;gBACJ,MAAM,GAAG,CAAC,OAAO,CAAC,IAAI,CAAC,MAAM,EAAE,IAAI,CAAC,WAAW,CAAC,cAAc,CAAC,CAAC;YACjE,CAAC;YAAC,OAAO,EAAE,EAAE,CAAC;gBACb,IAAK,EAAY,CAAC,OAAO,KAAK,aAAa,IAAI,CAAC,IAAI,CAAC,WAAW,CAAC,qBAAqB,EAAE,CAAC;oBACxF,eAAe,CAAC,qBAAqB,IAAI,CAAC,MAAM,yBAAyB,CAAC,CAAC;oBAC3E,OAAO;gBACR,CAAC;gBAED,eAAe,CAAC,UAAU,IAAI,CAAC,MAAM,WAAW,CAAC,CAAC;gBAClD,MAAM,IAAI,CAAC,QAAQ,CAAC,QAAQ,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;gBAC1C,OAAO;YACR,CAAC;YAED,MAAM,MAAM,GAAU,IAAI,KAAK,CAC7B,IAAI,CAAC,MAAM,EACX,IAAI,CAAC,WAAW,EAChB,IAAI,CAAC,YAAY,EACjB,IAAI,CAAC,OAAO,CACb,CAAC;YACF,MAAM,MAAM,CAAC,IAAI,EAAE,CAAC;YAEpB,IAAI,KAAK,GAAW,CAAC,CAAC;YACtB,OAAO,IAAI,EAAE,CAAC;gBACb,IAAI,IAAI,CAAC,SAAS;oBAAE,MAAM;gBAE1B,IAAI,IAAI,CAAC,QAAQ,EAAE,CAAC;oBACnB,MAAM,mBAAmB,CAAC,IAAI,CAAC,CAAC;oBAChC,SAAS;gBACV,CAAC;gBAED,MAAM,GAAG,GAAqB,MAAM,IAAI,CAAC,QAAQ,CAAC,IAAI,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;gBACpE,IAAI,CAAC,GAAG,EAAE,CAAC;oBACV,cAAc,CAAC,aAAa,IAAI,CAAC,MAAM,aAAa,CAAC,CAAC;oBACtD,MAAM;gBACP,CAAC;gBAED,MAAM,IAAI,CAAC,QAAQ,CAAC,eAAe,CAAC,GAAG,CAAC,CAAC;gBAEzC,IAAI,IAAI,CAAC,OAAO;oBAAE,IAAI,CAAC,OAAO,CAAC,KAAK,CAAC,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC,CAAC,CAAC;gBAEzD,IAAI,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,KAAK,CAAC,IAAI,EAAE,GAAG,CAAC,EAAE,CAAC;oBACvC,MAAM,IAAI,CAAC,QAAQ,CAAC,SAAS,CAAC,GAAG,EAAE,OAAO,CAAC,IAAI,CAAC,CAAC;oBACjD,MAAM,IAAI,CAAC,QAAQ,CAAC,QAAQ,CAAC,GAAG,CAAC,CAAC;oBAClC,IAAI,IAAI,CAAC,OAAO;wBAAE,IAAI,CAAC,OAAO,CAAC,KAAK,CAAC,OAAO,CAAC,IAAI,EAAE,CAAC,CAAC,CAAC;oBAEtD,uDAAuD;oBACvD,4DAA4D;oBAC5D,MAAM,IAAI,CAAC,QAAQ,CAAC,IAAI,CAAC,GAAG,EAAE,EAAE,CAAC,CAAC;oBAClC,SAAS;gBACV,CAAC;gBAED,IAAI,MAAM,CAAC,YAAY,CAAC,GAAG,CAAC,EAAE,CAAC;oBAC9B,MAAM,IAAI,CAAC,QAAQ,CAAC,SAAS,CAAC,GAAG,EAAE,OAAO,CAAC,UAAU,CAAC,CAAC;oBACvD,MAAM,IAAI,CAAC,QAAQ,CAAC,QAAQ,CAAC,GAAG,CAAC,CAAC;oBAClC,IAAI,IAAI,CAAC,OAAO;wBAAE,IAAI,CAAC,OAAO,CAAC,KAAK,CAAC,OAAO,CAAC,UAAU,EAAE,CAAC,CAAC,CAAC;oBAE5D,uDAAuD;oBACvD,4DAA4D;oBAC5D,MAAM,IAAI,CAAC,QAAQ,CAAC,IAAI,CAAC,GAAG,EAAE,EAAE,CAAC,CAAC;oBAClC,SAAS;gBACV,CAAC;gBAED,IAAI,CAAC,MAAM,IAAI,CAAC,QAAQ,CAAC,SAAS,CAAC,GAAG,EAAE,OAAO,CAAC,MAAM,CAAC,EAAE,CAAC;oBACzD,eAAe,CAAC,sCAAsC,GAAG,qBAAqB,CAAC,CAAC;oBAChF,MAAM;gBACP,CAAC;gBACD,IAAI,IAAI,CAAC,OAAO;oBAAE,IAAI,CAAC,OAAO,CAAC,KAAK,CAAC,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC,CAAC;gBAExD,IAAI,KAAK,GAAG,CAAC,EAAE,CAAC;oBACf,IAAI,CAAC;wBACJ,MAAM,OAAO,GAAW,MAAM,CAAC,SAAS,CAAC,IAAI,CAAC,WAAW,CAAC,iBAAiB,EAAE,IAAI,CAAC,WAAW,CAAC,CAAC;wBAE/F,MAAM,mBAAmB,CAAC,OAAO,EAAE,SAAS,IAAI,CAAC,MAAM,EAAE,CAAC,CAAC;wBAE3D,OAAO,IAAI,CAAC,QAAQ,IAAI,CAAC,IAAI,CAAC,SAAS,EAAE,CAAC;4BACzC,MAAM,mBAAmB,CAAC,IAAI,CAAC,CAAC;wBACjC,CAAC;oBACF,CAAC;oBAAC,OAAO,GAAG,EAAE,CAAC,CAAC,YAAY,CAAC,CAAC;gBAC/B,CAAC;gBACD,IAAI,IAAI,CAAC,SAAS;oBAAE,MAAM;gBAE1B,IAAI,IAAI,CAAC,OAAO;oBAAE,MAAM,IAAI,CAAC,OAAO,CAAC,QAAQ,CAAC,GAAG,CAAC,CAAC;gBACnD,IAAI,CAAC;oBACJ,MAAM,UAAU,GAAW,MAAM,IAAI,CAAC,KAAK,CAAC,GAAG,EAAE,KAAK,KAAK,CAAC,CAAC,CAAC;oBAE9D,IAAI,IAAI,CAAC,OAAO;wBAAE,MAAM,IAAI,CAAC,OAAO,CAAC,IAAI,CAAC,GAAG,EAAE,UAAU,CAAC,CAAC;oBAC3D,MAAM,IAAI,CAAC,QAAQ,CAAC,SAAS,CAAC,GAAG,EAAE,OAAO,CAAC,IAAI,CAAC,CAAC;oBACjD,MAAM,IAAI,CAAC,QAAQ,CAAC,QAAQ,CAAC,GAAG,CAAC,CAAC;oBAClC,IAAI,IAAI,CAAC,OAAO;wBAAE,IAAI,CAAC,OAAO,CAAC,KAAK,CAAC,OAAO,CAAC,IAAI,EAAE,CAAC,CAAC,CAAC;gBACvD,CAAC;gBAAC,OAAO,EAAE,EAAE,CAAC;oBACb,IAAI,IAAI,CAAC,OAAO;wBAAE,MAAM,IAAI,CAAC,OAAO,CAAC,MAAM,CAAC,GAAG,CAAC,CAAC;oBAEjD,MAAM,GAAG,GAAW,MAAM,IAAI,CAAC,QAAQ,CAAC,MAAM,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC;oBACzD,IAAI,GAAG,GAAG,IAAI,CAAC,WAAW,CAAC,YAAY,EAAE,CAAC;wBACzC,MAAM,IAAI,CAAC,QAAQ,CAAC,MAAM,CAAC,GAAG,EAAE,GAAG,GAAG,CAAC,CAAC,CAAC;wBACzC,MAAM,IAAI,CAAC,QAAQ,CAAC,SAAS,CAAC,GAAG,EAAE,OAAO,CAAC,MAAM,CAAC,CAAC;wBACnD,IAAI,IAAI,CAAC,OAAO;4BAAE,IAAI,CAAC,OAAO,CAAC,KAAK,CAAC,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC,CAAC;oBACzD,CAAC;yBAAM,CAAC;wBACP,MAAM,IAAI,CAAC,QAAQ,CAAC,SAAS,CAAC,GAAG,EAAE,OAAO,CAAC,MAAM,CAAC,CAAC;wBACnD,IAAI,IAAI,CAAC,OAAO;4BAAE,IAAI,CAAC,OAAO,CAAC,KAAK,CAAC,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC,CAAC;wBAExD,IAAI,4BAA4B,CAAC,EAAE,EAAE,MAAM,CAAC,EAAE,CAAC;4BAC9C,MAAM,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,GAAG,EAAG,EAAuB,CAAC,IAAI,CAAC,CAAC;wBACvE,CAAC;6BAAM,IAAI,4BAA4B,CAAC,EAAE,EAAE,SAAS,CAAC,EAAE,CAAC;4BACxD,IAAI,mBAAmB,CAAC,IAAI,CAAE,EAA0B,CAAC,OAAO,CAAC,EAAE,CAAC;gCACnE,MAAM,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,GAAG,EAAE,SAAS,CAAC,CAAC;4BACnD,CAAC;iCAAM,CAAC;gCACP,MAAM,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC,GAAG,EAAG,EAA0B,CAAC,OAAO,CAAC,CAAC;4BAC7E,CAAC;wBACF,CAAC;oBACF,CAAC;gBACF,CAAC;wBAAS,CAAC;oBACV,IAAI,IAAI,CAAC,OAAO;wBAAE,IAAI,CAAC,OAAO,CAAC,KAAK,CAAC,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC,CAAC,CAAC;gBAC1D,CAAC;gBAED,KAAK,EAAE,CAAC;gBACR,IAAI,KAAK,IAAI,IAAI,CAAC,WAAW,CAAC,kBAAkB,EAAE,CAAC;oBAClD,eAAe,CAAC,aAAa,IAAI,CAAC,MAAM,0DAA0D,CAAC,CAAC;oBACpG,MAAM;gBACP,CAAC;YACF,CAAC;QACF,CAAC;QAAC,OAAO,CAAC,EAAE,CAAC;YACZ,eAAe,CAAC,kBAAkB,CAAC,CAAC;YACpC,OAAO,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;QAChB,CAAC;gBAAS,CAAC;YACV,kCAAkC,CAAC,eAAe,CAAC,CAAC;QACrD,CAAC;IACF,CAAC;CACD"}
@@ -1,6 +1,6 @@
1
1
  import * as dns from 'dns';
2
- import { commonsAsyncAbortTimeout, commonsAsyncTimeout } from 'tscommons-es-async';
3
- import { commonsOutputDebug } from 'nodecommons-es-cli';
2
+ import { commonsAsyncAbortTimeout, commonsAsyncTimeout } from 'tscommons-esm-async';
3
+ import { commonsLogDebug } from 'nodecommons-esm-log';
4
4
  export class Dns {
5
5
  static resolve(domain, connectTimeout) {
6
6
  // try IP4 first, then IP6
@@ -15,7 +15,7 @@ export class Dns {
15
15
  .catch((e) => {
16
16
  if (e.message === 'abortTimeout called')
17
17
  return;
18
- commonsOutputDebug('debug position 4');
18
+ commonsLogDebug('debug position 4');
19
19
  console.log(e);
20
20
  reject(e);
21
21
  });
@@ -44,4 +44,4 @@ export class Dns {
44
44
  });
45
45
  }
46
46
  }
47
- //# sourceMappingURL=dns.js.map
47
+ //# sourceMappingURL=dns.mjs.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"dns.mjs","sourceRoot":"","sources":["../../src/classes/dns.mts"],"names":[],"mappings":"AAAA,OAAO,KAAK,GAAG,MAAM,KAAK,CAAC;AAE3B,OAAO,EAAE,wBAAwB,EAAE,mBAAmB,EAAE,MAAM,qBAAqB,CAAC;AAEpF,OAAO,EAAE,eAAe,EAAE,MAAM,qBAAqB,CAAC;AAEtD,MAAM,OAAgB,GAAG;IACjB,MAAM,CAAC,OAAO,CACnB,MAAc,EACd,cAAsB;QAEvB,0BAA0B;QAE1B,OAAO,IAAI,OAAO,CAAW,CAAC,OAA8B,EAAE,MAA0B,EAAQ,EAAE;YACjG,IAAI,QAAQ,GAAY,KAAK,CAAC;YAC9B,MAAM,SAAS,GAAW,OAAO,MAAM,UAAU,CAAC;YAElD,mBAAmB,CACjB,cAAc,EACd,SAAS,CACV;iBACE,IAAI,CAAC,GAAS,EAAE;gBAChB,QAAQ,GAAG,IAAI,CAAC;gBAChB,MAAM,CAAC,IAAI,KAAK,CAAC,aAAa,CAAC,CAAC,CAAC;YAClC,CAAC,CAAC;iBACD,KAAK,CAAC,CAAC,CAAQ,EAAQ,EAAE;gBACzB,IAAI,CAAC,CAAC,OAAO,KAAK,qBAAqB;oBAAE,OAAO;gBAChD,eAAe,CAAC,kBAAkB,CAAC,CAAC;gBACpC,OAAO,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;gBACf,MAAM,CAAC,CAAC,CAAC,CAAC;YACX,CAAC,CAAC,CAAC;YAEL,GAAG,CAAC,QAAQ,CAAC,MAAM,EAAE,CAAC,GAAe,EAAE,OAAiB,EAAQ,EAAE;gBACjE,IAAI,GAAG,EAAE,CAAC;oBACT,GAAG,CAAC,QAAQ,CAAC,MAAM,EAAE,CAAC,IAAgB,EAAE,QAAkB,EAAQ,EAAE;wBACnE,IAAI,IAAI,EAAE,CAAC;4BACV,IAAI,CAAC,QAAQ;gCAAE,wBAAwB,CAAC,SAAS,CAAC,CAAC;4BACnD,MAAM,CAAC,IAAI,CAAC,CAAC;4BACb,OAAO;wBACR,CAAC;wBACD,IAAI,CAAC,QAAQ,EAAE,CAAC;4BACf,wBAAwB,CAAC,SAAS,CAAC,CAAC;4BACpC,OAAO,CAAC,QAAQ,CAAC,CAAC;wBACnB,CAAC;wBACD,OAAO;oBACR,CAAC,CAAC,CAAC;oBACH,OAAO;gBACR,CAAC;gBACD,IAAI,CAAC,QAAQ,EAAE,CAAC;oBACf,wBAAwB,CAAC,SAAS,CAAC,CAAC;oBACpC,OAAO,CAAC,OAAO,CAAC,CAAC;gBAClB,CAAC;YACF,CAAC,CAAC,CAAC;QACJ,CAAC,CAAC,CAAC;IACJ,CAAC;CACD"}
@@ -1,5 +1,5 @@
1
- import { Expiry } from '../classes/expiry';
2
- import { DatabaseService } from '../services/database.service';
1
+ import { Expiry } from '../classes/expiry.mjs';
2
+ import { DatabaseService } from '../services/database.service.mjs';
3
3
  export declare class Expirer {
4
4
  private expiry;
5
5
  private database;
@@ -0,0 +1,117 @@
1
+ import mongodb from 'mongodb';
2
+ import { commonsArrayChunk, commonsDateDateToYmdHis, commonsTypeHasPropertyDate } from 'tscommons-esm-core';
3
+ import { EStatus } from 'hydra-crawler-esm-assets';
4
+ import { commonsLogAlert, commonsLogDoing } from 'nodecommons-esm-log';
5
+ import { isTMongoIdRow } from '../services/database.service.mjs';
6
+ export class Expirer {
7
+ expiry;
8
+ database;
9
+ constructor(expiry, database) {
10
+ this.expiry = expiry;
11
+ this.database = database;
12
+ }
13
+ async listQueuedAndActive() {
14
+ const log = commonsLogDoing('expirer', 'Enumering queued and active domains');
15
+ const results = this.database.getUrls().aggregate([
16
+ { $match: { status: { $in: [EStatus.QUEUED, EStatus.ACTIVE] } } },
17
+ { $group: { _id: '$domain' } }
18
+ ], { allowDiskUse: true });
19
+ const queued = await this.database.listQueryResults(results, isTMongoIdRow);
20
+ log.success(queued.length);
21
+ return queued
22
+ // eslint-disable-next-line no-underscore-dangle
23
+ .map((q) => q._id);
24
+ }
25
+ async expire(limit) {
26
+ commonsLogAlert('Running expiry thread');
27
+ const queued = await this.listQueuedAndActive();
28
+ const expired = [];
29
+ { // scope
30
+ const log = commonsLogDoing('expirer', 'Searching for expired URLs');
31
+ const results = this.database.getUrls().find({ $and: [
32
+ { status: { $nin: [
33
+ EStatus.ARCHIVED,
34
+ EStatus.QUEUED,
35
+ EStatus.ACTIVE
36
+ ] } },
37
+ { domain: { $nin: queued } },
38
+ { attempted: { $exists: true } }
39
+ ] }, {});
40
+ const now = new Date().getTime() / 1000;
41
+ let tally = 0;
42
+ let found = 0;
43
+ while (true) {
44
+ tally++;
45
+ if ((tally % 1000) === 0)
46
+ log.progress(`${tally}, ${found}`);
47
+ if (limit !== undefined && tally > limit)
48
+ break;
49
+ const row = await results.next();
50
+ if (row === null)
51
+ break;
52
+ const interval = this.expiry.getBestExpiry(row.url);
53
+ if (!commonsTypeHasPropertyDate(row, 'attempted'))
54
+ continue;
55
+ const attempted = row['attempted'].getTime() / 1000;
56
+ if ((attempted + interval) < now) {
57
+ // eslint-disable-next-line @typescript-eslint/no-unsafe-argument
58
+ expired.push(row['_id']);
59
+ found++;
60
+ }
61
+ }
62
+ log.success(found);
63
+ if (found === 0)
64
+ return false;
65
+ }
66
+ const batches = commonsArrayChunk(expired, 100);
67
+ { // scope
68
+ const log = commonsLogDoing('expirer', 'Re-queuing expired');
69
+ let tally = 0;
70
+ for (const batch of batches) {
71
+ const batchIds = batch
72
+ .map((id) => new mongodb.ObjectId(id));
73
+ await this.database.getUrls().updateMany({ _id: { $in: batchIds } }, {
74
+ $set: { status: EStatus.QUEUED },
75
+ $unset: { ttl: true }
76
+ });
77
+ tally += 100;
78
+ log.progress(tally);
79
+ }
80
+ log.success();
81
+ }
82
+ return true;
83
+ }
84
+ async expireFixed(threshold) {
85
+ commonsLogAlert('Running fixed date expiry thread');
86
+ const queued = await this.listQueuedAndActive();
87
+ { // scope
88
+ const log = commonsLogDoing('expirer', `Searching attempted before date ${commonsDateDateToYmdHis(threshold)}`);
89
+ const count = await this.database.getUrls().find({ $and: [
90
+ { status: { $ne: EStatus.ARCHIVED } },
91
+ { domain: { $nin: queued } },
92
+ { attempted: { $exists: true } },
93
+ { attempted: { $lt: threshold } }
94
+ ] }, {}).count();
95
+ log.success(count);
96
+ if (count === 0)
97
+ return false;
98
+ }
99
+ { // scope
100
+ const log = commonsLogDoing('expirer', 'Re-queuing expired');
101
+ await this.database.getUrls().updateMany({ $and: [
102
+ { status: { $ne: EStatus.ARCHIVED } },
103
+ { domain: { $nin: queued } },
104
+ { attempted: { $exists: true } },
105
+ { attempted: { $lt: threshold } }
106
+ ] }, {
107
+ $set: { status: EStatus.QUEUED },
108
+ $unset: { ttl: true }
109
+ });
110
+ log.success();
111
+ }
112
+ // ?
113
+ // const log: CommonsSubLoggable = commonsLogDoing('expirer', 'Searching for expired URLs');
114
+ return true;
115
+ }
116
+ }
117
+ //# sourceMappingURL=expirer.mjs.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"expirer.mjs","sourceRoot":"","sources":["../../src/classes/expirer.mts"],"names":[],"mappings":"AAAA,OAAO,OAAO,MAAM,SAAS,CAAC;AAE9B,OAAO,EAAE,iBAAiB,EAAE,uBAAuB,EAAE,0BAA0B,EAAmB,MAAM,oBAAoB,CAAC;AAE7H,OAAO,EAAE,OAAO,EAAE,MAAM,0BAA0B,CAAC;AAGnD,OAAO,EAAE,eAAe,EAAE,eAAe,EAAsB,MAAM,qBAAqB,CAAC;AAI3F,OAAO,EAAgC,aAAa,EAAE,MAAM,kCAAkC,CAAC;AAE/F,MAAM,OAAO,OAAO;IAET;IACA;IAFV,YACU,MAAc,EACd,QAAyB;QADzB,WAAM,GAAN,MAAM,CAAQ;QACd,aAAQ,GAAR,QAAQ,CAAiB;IAChC,CAAC;IAEI,KAAK,CAAC,mBAAmB;QAChC,MAAM,GAAG,GAAuB,eAAe,CAAC,SAAS,EAAE,qCAAqC,CAAC,CAAC;QAClG,MAAM,OAAO,GAA2C,IAAI,CAAC,QAAQ,CAAC,OAAO,EAAE,CAAC,SAAS,CAAc;YACrG,EAAE,MAAM,EAAE,EAAE,MAAM,EAAE,EAAE,GAAG,EAAE,CAAE,OAAO,CAAC,MAAM,EAAE,OAAO,CAAC,MAAM,CAAE,EAAE,EAAE,EAAE;YACnE,EAAE,MAAM,EAAE,EAAE,GAAG,EAAE,SAAS,EAAE,EAAE;SAC/B,EAAE,EAAE,YAAY,EAAE,IAAI,EAAE,CAAC,CAAC;QAE3B,MAAM,MAAM,GAAkB,MAAM,IAAI,CAAC,QAAQ,CAAC,gBAAgB,CAAC,OAAO,EAAE,aAAa,CAAC,CAAC;QAE3F,GAAG,CAAC,OAAO,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC;QAE3B,OAAO,MAAM;YACX,gDAAgD;aAC/C,GAAG,CAAC,CAAC,CAAc,EAAU,EAAE,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC;IAC3C,CAAC;IAEM,KAAK,CAAC,MAAM,CAAC,KAAc;QACjC,eAAe,CAAC,uBAAuB,CAAC,CAAC;QAEzC,MAAM,MAAM,GAAa,MAAM,IAAI,CAAC,mBAAmB,EAAE,CAAC;QAE1D,MAAM,OAAO,GAAa,EAAE,CAAC;QAC7B,CAAC,CAAC,QAAQ;YACT,MAAM,GAAG,GAAuB,eAAe,CAAC,SAAS,EAAE,4BAA4B,CAAC,CAAC;YAEzF,MAAM,OAAO,GAA6B,IAAI,CAAC,QAAQ,CAAC,OAAO,EAAE,CAAC,IAAI,CACpE,EAAE,IAAI,EAAE;oBACN,EAAE,MAAM,EAAE,EAAE,IAAI,EAAE;gCAChB,OAAO,CAAC,QAAQ;gCAChB,OAAO,CAAC,MAAM;gCACd,OAAO,CAAC,MAAM;6BACf,EAAE,EAAE;oBACL,EAAE,MAAM,EAAE,EAAE,IAAI,EAAE,MAAM,EAAE,EAAE;oBAC5B,EAAE,SAAS,EAAE,EAAE,OAAO,EAAE,IAAI,EAAE,EAAE;iBACjC,EAAC,EACF,EAAE,CACH,CAAC;YAEF,MAAM,GAAG,GAAW,IAAI,IAAI,EAAE,CAAC,OAAO,EAAE,GAAG,IAAI,CAAC;YAEhD,IAAI,KAAK,GAAW,CAAC,CAAC;YACtB,IAAI,KAAK,GAAW,CAAC,CAAC;YACtB,OAAO,IAAI,EAAE,CAAC;gBACb,KAAK,EAAE,CAAC;gBACR,IAAI,CAAC,KAAK,GAAG,IAAI,CAAC,KAAK,CAAC;oBAAE,GAAG,CAAC,QAAQ,CAAC,GAAG,KAAK,KAAK,KAAK,EAAE,CAAC,CAAC;gBAC7D,IAAI,KAAK,KAAK,SAAS,IAAI,KAAK,GAAG,KAAK;oBAAE,MAAM;gBAEhD,MAAM,GAAG,GAAc,MAAM,OAAO,CAAC,IAAI,EAAE,CAAC;gBAC5C,IAAI,GAAG,KAAK,IAAI;oBAAE,MAAM;gBAExB,MAAM,QAAQ,GAAW,IAAI,CAAC,MAAM,CAAC,aAAa,CAAC,GAAG,CAAC,GAAG,CAAC,CAAC;gBAE5D,IAAI,CAAC,0BAA0B,CAAC,GAAG,EAAE,WAAW,CAAC;oBAAE,SAAS;gBAE5D,MAAM,SAAS,GAAa,GAAuB,CAAC,WAAW,CAAU,CAAC,OAAO,EAAE,GAAG,IAAI,CAAC;gBAC3F,IAAI,CAAC,SAAS,GAAG,QAAQ,CAAC,GAAG,GAAG,EAAE,CAAC;oBAClC,iEAAiE;oBACjE,OAAO,CAAC,IAAI,CAAE,GAAuB,CAAC,KAAK,CAAC,CAAC,CAAC;oBAC9C,KAAK,EAAE,CAAC;gBACT,CAAC;YACF,CAAC;YACD,GAAG,CAAC,OAAO,CAAC,KAAK,CAAC,CAAC;YAEnB,IAAI,KAAK,KAAK,CAAC;gBAAE,OAAO,KAAK,CAAC;QAC/B,CAAC;QAED,MAAM,OAAO,GAAe,iBAAiB,CAAC,OAAO,EAAE,GAAG,CAAC,CAAC;QAE5D,CAAC,CAAC,QAAQ;YACT,MAAM,GAAG,GAAuB,eAAe,CAAC,SAAS,EAAE,oBAAoB,CAAC,CAAC;YACjF,IAAI,KAAK,GAAW,CAAC,CAAC;YACtB,KAAK,MAAM,KAAK,IAAI,OAAO,EAAE,CAAC;gBAC7B,MAAM,QAAQ,GAAuB,KAAK;qBACvC,GAAG,CAAC,CAAC,EAAU,EAAoB,EAAE,CAAC,IAAI,OAAO,CAAC,QAAQ,CAAC,EAAE,CAAC,CAAC,CAAC;gBAEnE,MAAM,IAAI,CAAC,QAAQ,CAAC,OAAO,EAAE,CAAC,UAAU,CACtC,EAAE,GAAG,EAAE,EAAE,GAAG,EAAE,QAAQ,EAAE,EAAE,EAC1B;oBACE,IAAI,EAAE,EAAE,MAAM,EAAE,OAAO,CAAC,MAAM,EAAE;oBAChC,MAAM,EAAE,EAAE,GAAG,EAAE,IAAI,EAAE;iBACtB,CACF,CAAC;gBAEF,KAAK,IAAI,GAAG,CAAC;gBACb,GAAG,CAAC,QAAQ,CAAC,KAAK,CAAC,CAAC;YACrB,CAAC;YACD,GAAG,CAAC,OAAO,EAAE,CAAC;QACf,CAAC;QAED,OAAO,IAAI,CAAC;IACb,CAAC;IAEM,KAAK,CAAC,WAAW,CAAC,SAAe;QACvC,eAAe,CAAC,kCAAkC,CAAC,CAAC;QAEpD,MAAM,MAAM,GAAa,MAAM,IAAI,CAAC,mBAAmB,EAAE,CAAC;QAE1D,CAAC,CAAC,QAAQ;YACT,MAAM,GAAG,GAAuB,eAAe,CAAC,SAAS,EAAE,mCAAmC,uBAAuB,CAAC,SAAS,CAAC,EAAE,CAAC,CAAC;YACpI,MAAM,KAAK,GAAW,MAAM,IAAI,CAAC,QAAQ,CAAC,OAAO,EAAE,CAAC,IAAI,CACtD,EAAE,IAAI,EAAE;oBACN,EAAE,MAAM,EAAE,EAAE,GAAG,EAAE,OAAO,CAAC,QAAQ,EAAE,EAAE;oBACrC,EAAE,MAAM,EAAE,EAAE,IAAI,EAAE,MAAM,EAAE,EAAE;oBAC5B,EAAE,SAAS,EAAE,EAAE,OAAO,EAAE,IAAI,EAAE,EAAE;oBAChC,EAAE,SAAS,EAAE,EAAE,GAAG,EAAE,SAAS,EAAE,EAAE;iBAClC,EAAC,EACF,EAAE,CACH,CAAC,KAAK,EAAE,CAAC;YACV,GAAG,CAAC,OAAO,CAAC,KAAK,CAAC,CAAC;YAEnB,IAAI,KAAK,KAAK,CAAC;gBAAE,OAAO,KAAK,CAAC;QAC/B,CAAC;QAED,CAAC,CAAC,QAAQ;YACT,MAAM,GAAG,GAAuB,eAAe,CAAC,SAAS,EAAE,oBAAoB,CAAC,CAAC;YACjF,MAAM,IAAI,CAAC,QAAQ,CAAC,OAAO,EAAE,CAAC,UAAU,CACtC,EAAE,IAAI,EAAE;oBACN,EAAE,MAAM,EAAE,EAAE,GAAG,EAAE,OAAO,CAAC,QAAQ,EAAE,EAAE;oBACrC,EAAE,MAAM,EAAE,EAAE,IAAI,EAAE,MAAM,EAAE,EAAE;oBAC5B,EAAE,SAAS,EAAE,EAAE,OAAO,EAAE,IAAI,EAAE,EAAE;oBAChC,EAAE,SAAS,EAAE,EAAE,GAAG,EAAE,SAAS,EAAE,EAAE;iBAClC,EAAC,EACF;gBACE,IAAI,EAAE,EAAE,MAAM,EAAE,OAAO,CAAC,MAAM,EAAE;gBAChC,MAAM,EAAE,EAAE,GAAG,EAAE,IAAI,EAAE;aACtB,CACF,CAAC;YACF,GAAG,CAAC,OAAO,EAAE,CAAC;QACf,CAAC;QAED,IAAI;QACJ,4FAA4F;QAE5F,OAAO,IAAI,CAAC;IACb,CAAC;CACD"}
@@ -1,4 +1,4 @@
1
- import { IExpiry } from '../interfaces/iexpiry';
1
+ import { IExpiry } from '../interfaces/iexpiry.mjs';
2
2
  export declare class Expiry {
3
3
  static loadFromFile(file: string): IExpiry[];
4
4
  private static getScore;
@@ -1,12 +1,9 @@
1
1
  import { URL } from 'url';
2
- import { commonsTypeHasPropertyString, commonsTypeIsArray, commonsTypeIsTArray } from 'tscommons-es-core';
3
- import { commonsFileReadJsonFile } from 'nodecommons-es-file';
4
- import { Matcher } from '../helpers/matcher';
5
- import { isIExpiry, toIExpiry } from '../interfaces/iexpiry';
2
+ import { commonsTypeHasPropertyString, commonsTypeIsArray, commonsTypeIsTArray } from 'tscommons-esm-core';
3
+ import { commonsFileReadJsonFile } from 'nodecommons-esm-file';
4
+ import { Matcher } from '../helpers/matcher.mjs';
5
+ import { isIExpiry, toIExpiry } from '../interfaces/iexpiry.mjs';
6
6
  export class Expiry {
7
- constructor() {
8
- this.expiries = [];
9
- }
10
7
  static loadFromFile(file) {
11
8
  const json = commonsFileReadJsonFile(file);
12
9
  if (!commonsTypeIsArray(json))
@@ -16,7 +13,7 @@ export class Expiry {
16
13
  try {
17
14
  return toIExpiry(entry);
18
15
  }
19
- catch (e) {
16
+ catch (_e) {
20
17
  return undefined;
21
18
  }
22
19
  });
@@ -37,6 +34,7 @@ export class Expiry {
37
34
  }
38
35
  return total;
39
36
  }
37
+ expiries = [];
40
38
  add(expiries) {
41
39
  for (const expiry of expiries) {
42
40
  this.expiries.push(expiry);
@@ -60,4 +58,4 @@ export class Expiry {
60
58
  return best.expiry;
61
59
  }
62
60
  }
63
- //# sourceMappingURL=expiry.js.map
61
+ //# sourceMappingURL=expiry.mjs.map