@staticn0va/wigolo 0.1.0 → 0.1.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (982)
  1. package/LICENSE +1 -1
  2. package/README.md +195 -73
  3. package/SKILL.md +382 -0
  4. package/assets/blocks/claude-code/CLAUDE.md.block +20 -0
  5. package/assets/blocks/claude-code/wigolo-command.md +40 -0
  6. package/assets/blocks/cursor/wigolo.mdc +46 -0
  7. package/assets/blocks/gemini-cli/GEMINI.md.block +18 -0
  8. package/assets/blocks/vscode/copilot-instructions.md.block +18 -0
  9. package/assets/skills/wigolo/SKILL.md +50 -0
  10. package/assets/skills/wigolo/rules/cache-first.md +30 -0
  11. package/assets/skills/wigolo/rules/synthesis.md +43 -0
  12. package/assets/skills/wigolo-agent/SKILL.md +73 -0
  13. package/assets/skills/wigolo-crawl/SKILL.md +60 -0
  14. package/assets/skills/wigolo-extract/SKILL.md +59 -0
  15. package/assets/skills/wigolo-fetch/SKILL.md +65 -0
  16. package/assets/skills/wigolo-find-similar/SKILL.md +72 -0
  17. package/assets/skills/wigolo-research/SKILL.md +77 -0
  18. package/assets/skills/wigolo-search/SKILL.md +78 -0
  19. package/dist/agent/executor.d.ts +33 -0
  20. package/dist/agent/executor.d.ts.map +1 -0
  21. package/dist/agent/executor.js +233 -0
  22. package/dist/agent/executor.js.map +1 -0
  23. package/dist/agent/pipeline.d.ts +5 -0
  24. package/dist/agent/pipeline.d.ts.map +1 -0
  25. package/dist/agent/pipeline.js +208 -0
  26. package/dist/agent/pipeline.js.map +1 -0
  27. package/dist/agent/planner.d.ts +13 -0
  28. package/dist/agent/planner.d.ts.map +1 -0
  29. package/dist/agent/planner.js +271 -0
  30. package/dist/agent/planner.js.map +1 -0
  31. package/dist/agent/relevance.d.ts +15 -0
  32. package/dist/agent/relevance.d.ts.map +1 -0
  33. package/dist/agent/relevance.js +60 -0
  34. package/dist/agent/relevance.js.map +1 -0
  35. package/dist/cache/backfill-embeddings.d.ts +23 -0
  36. package/dist/cache/backfill-embeddings.d.ts.map +1 -0
  37. package/dist/cache/backfill-embeddings.js +105 -0
  38. package/dist/cache/backfill-embeddings.js.map +1 -0
  39. package/dist/cache/change-detector.d.ts +7 -0
  40. package/dist/cache/change-detector.d.ts.map +1 -0
  41. package/dist/cache/change-detector.js +43 -0
  42. package/dist/cache/change-detector.js.map +1 -0
  43. package/dist/cache/db.d.ts +1 -0
  44. package/dist/cache/db.d.ts.map +1 -1
  45. package/dist/cache/db.js +94 -22
  46. package/dist/cache/db.js.map +1 -1
  47. package/dist/cache/diff-summary.d.ts +2 -0
  48. package/dist/cache/diff-summary.d.ts.map +1 -0
  49. package/dist/cache/diff-summary.js +82 -0
  50. package/dist/cache/diff-summary.js.map +1 -0
  51. package/dist/cache/migrations/runner.d.ts +29 -0
  52. package/dist/cache/migrations/runner.d.ts.map +1 -0
  53. package/dist/cache/migrations/runner.js +147 -0
  54. package/dist/cache/migrations/runner.js.map +1 -0
  55. package/dist/cache/sqlite-vec-store.d.ts +42 -0
  56. package/dist/cache/sqlite-vec-store.d.ts.map +1 -0
  57. package/dist/cache/sqlite-vec-store.js +176 -0
  58. package/dist/cache/sqlite-vec-store.js.map +1 -0
  59. package/dist/cache/store.d.ts +46 -1
  60. package/dist/cache/store.d.ts.map +1 -1
  61. package/dist/cache/store.js +362 -168
  62. package/dist/cache/store.js.map +1 -1
  63. package/dist/cli/agents/antigravity.d.ts +20 -0
  64. package/dist/cli/agents/antigravity.d.ts.map +1 -0
  65. package/dist/cli/agents/antigravity.js +49 -0
  66. package/dist/cli/agents/antigravity.js.map +1 -0
  67. package/dist/cli/agents/claude-code.d.ts +25 -0
  68. package/dist/cli/agents/claude-code.d.ts.map +1 -0
  69. package/dist/cli/agents/claude-code.js +111 -0
  70. package/dist/cli/agents/claude-code.js.map +1 -0
  71. package/dist/cli/agents/cursor.d.ts +21 -0
  72. package/dist/cli/agents/cursor.d.ts.map +1 -0
  73. package/dist/cli/agents/cursor.js +58 -0
  74. package/dist/cli/agents/cursor.js.map +1 -0
  75. package/dist/cli/agents/gemini-cli.d.ts +21 -0
  76. package/dist/cli/agents/gemini-cli.d.ts.map +1 -0
  77. package/dist/cli/agents/gemini-cli.js +55 -0
  78. package/dist/cli/agents/gemini-cli.js.map +1 -0
  79. package/dist/cli/agents/registry.d.ts +21 -0
  80. package/dist/cli/agents/registry.d.ts.map +1 -0
  81. package/dist/cli/agents/registry.js +27 -0
  82. package/dist/cli/agents/registry.js.map +1 -0
  83. package/dist/cli/agents/utils.d.ts +26 -0
  84. package/dist/cli/agents/utils.d.ts.map +1 -0
  85. package/dist/cli/agents/utils.js +136 -0
  86. package/dist/cli/agents/utils.js.map +1 -0
  87. package/dist/cli/agents/vscode.d.ts +21 -0
  88. package/dist/cli/agents/vscode.d.ts.map +1 -0
  89. package/dist/cli/agents/vscode.js +62 -0
  90. package/dist/cli/agents/vscode.js.map +1 -0
  91. package/dist/cli/auth.d.ts +2 -0
  92. package/dist/cli/auth.d.ts.map +1 -0
  93. package/dist/cli/auth.js +94 -0
  94. package/dist/cli/auth.js.map +1 -0
  95. package/dist/cli/backfill.d.ts +2 -0
  96. package/dist/cli/backfill.d.ts.map +1 -0
  97. package/dist/cli/backfill.js +58 -0
  98. package/dist/cli/backfill.js.map +1 -0
  99. package/dist/cli/daemon.d.ts +6 -1
  100. package/dist/cli/daemon.d.ts.map +1 -1
  101. package/dist/cli/daemon.js +61 -3
  102. package/dist/cli/daemon.js.map +1 -1
  103. package/dist/cli/doctor.d.ts +8 -0
  104. package/dist/cli/doctor.d.ts.map +1 -0
  105. package/dist/cli/doctor.js +318 -0
  106. package/dist/cli/doctor.js.map +1 -0
  107. package/dist/cli/health.d.ts +1 -1
  108. package/dist/cli/health.d.ts.map +1 -1
  109. package/dist/cli/health.js +42 -3
  110. package/dist/cli/health.js.map +1 -1
  111. package/dist/cli/help.d.ts +6 -0
  112. package/dist/cli/help.d.ts.map +1 -0
  113. package/dist/cli/help.js +63 -0
  114. package/dist/cli/help.js.map +1 -0
  115. package/dist/cli/index.d.ts +1 -1
  116. package/dist/cli/index.d.ts.map +1 -1
  117. package/dist/cli/index.js +35 -7
  118. package/dist/cli/index.js.map +1 -1
  119. package/dist/cli/init.d.ts +2 -0
  120. package/dist/cli/init.d.ts.map +1 -0
  121. package/dist/cli/init.js +201 -0
  122. package/dist/cli/init.js.map +1 -0
  123. package/dist/cli/plugin.d.ts +5 -0
  124. package/dist/cli/plugin.d.ts.map +1 -0
  125. package/dist/cli/plugin.js +185 -0
  126. package/dist/cli/plugin.js.map +1 -0
  127. package/dist/cli/setup-mcp.d.ts +2 -0
  128. package/dist/cli/setup-mcp.d.ts.map +1 -0
  129. package/dist/cli/setup-mcp.js +114 -0
  130. package/dist/cli/setup-mcp.js.map +1 -0
  131. package/dist/cli/shell.d.ts +2 -0
  132. package/dist/cli/shell.d.ts.map +1 -0
  133. package/dist/cli/shell.js +86 -0
  134. package/dist/cli/shell.js.map +1 -0
  135. package/dist/cli/status.d.ts +2 -0
  136. package/dist/cli/status.d.ts.map +1 -0
  137. package/dist/cli/status.js +31 -0
  138. package/dist/cli/status.js.map +1 -0
  139. package/dist/cli/telemetry.d.ts +10 -0
  140. package/dist/cli/telemetry.d.ts.map +1 -0
  141. package/dist/cli/telemetry.js +56 -0
  142. package/dist/cli/telemetry.js.map +1 -0
  143. package/dist/cli/tui/agents-types.d.ts +28 -0
  144. package/dist/cli/tui/agents-types.d.ts.map +1 -0
  145. package/dist/cli/tui/agents-types.js +1 -0
  146. package/dist/cli/tui/agents-types.js.map +1 -0
  147. package/dist/cli/tui/agents.d.ts +11 -0
  148. package/dist/cli/tui/agents.d.ts.map +1 -0
  149. package/dist/cli/tui/agents.js +93 -0
  150. package/dist/cli/tui/agents.js.map +1 -0
  151. package/dist/cli/tui/banner.d.ts +3 -0
  152. package/dist/cli/tui/banner.d.ts.map +1 -0
  153. package/dist/cli/tui/banner.js +30 -0
  154. package/dist/cli/tui/banner.js.map +1 -0
  155. package/dist/cli/tui/components/AgentSelect.d.ts +13 -0
  156. package/dist/cli/tui/components/AgentSelect.d.ts.map +1 -0
  157. package/dist/cli/tui/components/AgentSelect.js +116 -0
  158. package/dist/cli/tui/components/AgentSelect.js.map +1 -0
  159. package/dist/cli/tui/components/Banner.d.ts +6 -0
  160. package/dist/cli/tui/components/Banner.d.ts.map +1 -0
  161. package/dist/cli/tui/components/Banner.js +25 -0
  162. package/dist/cli/tui/components/Banner.js.map +1 -0
  163. package/dist/cli/tui/components/BrowserSelect.d.ts +7 -0
  164. package/dist/cli/tui/components/BrowserSelect.d.ts.map +1 -0
  165. package/dist/cli/tui/components/BrowserSelect.js +19 -0
  166. package/dist/cli/tui/components/BrowserSelect.js.map +1 -0
  167. package/dist/cli/tui/components/InstallProgress.d.ts +9 -0
  168. package/dist/cli/tui/components/InstallProgress.d.ts.map +1 -0
  169. package/dist/cli/tui/components/InstallProgress.js +67 -0
  170. package/dist/cli/tui/components/InstallProgress.js.map +1 -0
  171. package/dist/cli/tui/components/SkillInstall.d.ts +14 -0
  172. package/dist/cli/tui/components/SkillInstall.d.ts.map +1 -0
  173. package/dist/cli/tui/components/SkillInstall.js +94 -0
  174. package/dist/cli/tui/components/SkillInstall.js.map +1 -0
  175. package/dist/cli/tui/components/Summary.d.ts +22 -0
  176. package/dist/cli/tui/components/Summary.d.ts.map +1 -0
  177. package/dist/cli/tui/components/Summary.js +135 -0
  178. package/dist/cli/tui/components/Summary.js.map +1 -0
  179. package/dist/cli/tui/components/SystemCheck.d.ts +8 -0
  180. package/dist/cli/tui/components/SystemCheck.d.ts.map +1 -0
  181. package/dist/cli/tui/components/SystemCheck.js +71 -0
  182. package/dist/cli/tui/components/SystemCheck.js.map +1 -0
  183. package/dist/cli/tui/components/Verification.d.ts +8 -0
  184. package/dist/cli/tui/components/Verification.d.ts.map +1 -0
  185. package/dist/cli/tui/components/Verification.js +63 -0
  186. package/dist/cli/tui/components/Verification.js.map +1 -0
  187. package/dist/cli/tui/config-writer-cli.d.ts +12 -0
  188. package/dist/cli/tui/config-writer-cli.d.ts.map +1 -0
  189. package/dist/cli/tui/config-writer-cli.js +39 -0
  190. package/dist/cli/tui/config-writer-cli.js.map +1 -0
  191. package/dist/cli/tui/config-writer-json.d.ts +16 -0
  192. package/dist/cli/tui/config-writer-json.d.ts.map +1 -0
  193. package/dist/cli/tui/config-writer-json.js +86 -0
  194. package/dist/cli/tui/config-writer-json.js.map +1 -0
  195. package/dist/cli/tui/config-writer-toml.d.ts +16 -0
  196. package/dist/cli/tui/config-writer-toml.d.ts.map +1 -0
  197. package/dist/cli/tui/config-writer-toml.js +83 -0
  198. package/dist/cli/tui/config-writer-toml.js.map +1 -0
  199. package/dist/cli/tui/config-writer.d.ts +25 -0
  200. package/dist/cli/tui/config-writer.d.ts.map +1 -0
  201. package/dist/cli/tui/config-writer.js +101 -0
  202. package/dist/cli/tui/config-writer.js.map +1 -0
  203. package/dist/cli/tui/detect-helpers.d.ts +6 -0
  204. package/dist/cli/tui/detect-helpers.d.ts.map +1 -0
  205. package/dist/cli/tui/detect-helpers.js +45 -0
  206. package/dist/cli/tui/detect-helpers.js.map +1 -0
  207. package/dist/cli/tui/extras-prompt.d.ts +7 -0
  208. package/dist/cli/tui/extras-prompt.d.ts.map +1 -0
  209. package/dist/cli/tui/extras-prompt.js +42 -0
  210. package/dist/cli/tui/extras-prompt.js.map +1 -0
  211. package/dist/cli/tui/flags-types.d.ts +19 -0
  212. package/dist/cli/tui/flags-types.d.ts.map +1 -0
  213. package/dist/cli/tui/flags-types.js +23 -0
  214. package/dist/cli/tui/flags-types.js.map +1 -0
  215. package/dist/cli/tui/flags.d.ts +5 -0
  216. package/dist/cli/tui/flags.d.ts.map +1 -0
  217. package/dist/cli/tui/flags.js +132 -0
  218. package/dist/cli/tui/flags.js.map +1 -0
  219. package/dist/cli/tui/format.d.ts +14 -0
  220. package/dist/cli/tui/format.d.ts.map +1 -0
  221. package/dist/cli/tui/format.js +37 -0
  222. package/dist/cli/tui/format.js.map +1 -0
  223. package/dist/cli/tui/hooks/useAgentDetect.d.ts +6 -0
  224. package/dist/cli/tui/hooks/useAgentDetect.d.ts.map +1 -0
  225. package/dist/cli/tui/hooks/useAgentDetect.js +19 -0
  226. package/dist/cli/tui/hooks/useAgentDetect.js.map +1 -0
  227. package/dist/cli/tui/hooks/useInstall.d.ts +14 -0
  228. package/dist/cli/tui/hooks/useInstall.d.ts.map +1 -0
  229. package/dist/cli/tui/hooks/useInstall.js +90 -0
  230. package/dist/cli/tui/hooks/useInstall.js.map +1 -0
  231. package/dist/cli/tui/hooks/useSystemCheck.d.ts +13 -0
  232. package/dist/cli/tui/hooks/useSystemCheck.d.ts.map +1 -0
  233. package/dist/cli/tui/hooks/useSystemCheck.js +95 -0
  234. package/dist/cli/tui/hooks/useSystemCheck.js.map +1 -0
  235. package/dist/cli/tui/hooks/useVerify.d.ts +14 -0
  236. package/dist/cli/tui/hooks/useVerify.d.ts.map +1 -0
  237. package/dist/cli/tui/hooks/useVerify.js +71 -0
  238. package/dist/cli/tui/hooks/useVerify.js.map +1 -0
  239. package/dist/cli/tui/ink-init.d.ts +2 -0
  240. package/dist/cli/tui/ink-init.d.ts.map +1 -0
  241. package/dist/cli/tui/ink-init.js +198 -0
  242. package/dist/cli/tui/ink-init.js.map +1 -0
  243. package/dist/cli/tui/reporter-auto.d.ts +7 -0
  244. package/dist/cli/tui/reporter-auto.d.ts.map +1 -0
  245. package/dist/cli/tui/reporter-auto.js +15 -0
  246. package/dist/cli/tui/reporter-auto.js.map +1 -0
  247. package/dist/cli/tui/reporter.d.ts +26 -0
  248. package/dist/cli/tui/reporter.d.ts.map +1 -0
  249. package/dist/cli/tui/reporter.js +32 -0
  250. package/dist/cli/tui/reporter.js.map +1 -0
  251. package/dist/cli/tui/run-command.d.ts +14 -0
  252. package/dist/cli/tui/run-command.d.ts.map +1 -0
  253. package/dist/cli/tui/run-command.js +72 -0
  254. package/dist/cli/tui/run-command.js.map +1 -0
  255. package/dist/cli/tui/select-agents.d.ts +6 -0
  256. package/dist/cli/tui/select-agents.d.ts.map +1 -0
  257. package/dist/cli/tui/select-agents.js +32 -0
  258. package/dist/cli/tui/select-agents.js.map +1 -0
  259. package/dist/cli/tui/status-agents.d.ts +11 -0
  260. package/dist/cli/tui/status-agents.d.ts.map +1 -0
  261. package/dist/cli/tui/status-agents.js +53 -0
  262. package/dist/cli/tui/status-agents.js.map +1 -0
  263. package/dist/cli/tui/status-cache.d.ts +6 -0
  264. package/dist/cli/tui/status-cache.d.ts.map +1 -0
  265. package/dist/cli/tui/status-cache.js +39 -0
  266. package/dist/cli/tui/status-cache.js.map +1 -0
  267. package/dist/cli/tui/status-format.d.ts +14 -0
  268. package/dist/cli/tui/status-format.d.ts.map +1 -0
  269. package/dist/cli/tui/status-format.js +41 -0
  270. package/dist/cli/tui/status-format.js.map +1 -0
  271. package/dist/cli/tui/status-python.d.ts +6 -0
  272. package/dist/cli/tui/status-python.d.ts.map +1 -0
  273. package/dist/cli/tui/status-python.js +30 -0
  274. package/dist/cli/tui/status-python.js.map +1 -0
  275. package/dist/cli/tui/system-check.d.ts +24 -0
  276. package/dist/cli/tui/system-check.d.ts.map +1 -0
  277. package/dist/cli/tui/system-check.js +103 -0
  278. package/dist/cli/tui/system-check.js.map +1 -0
  279. package/dist/cli/tui/tui-reporter.d.ts +19 -0
  280. package/dist/cli/tui/tui-reporter.d.ts.map +1 -0
  281. package/dist/cli/tui/tui-reporter.js +95 -0
  282. package/dist/cli/tui/tui-reporter.js.map +1 -0
  283. package/dist/cli/tui/utils/config-writer.d.ts +3 -0
  284. package/dist/cli/tui/utils/config-writer.d.ts.map +1 -0
  285. package/dist/cli/tui/utils/config-writer.js +22 -0
  286. package/dist/cli/tui/utils/config-writer.js.map +1 -0
  287. package/dist/cli/tui/utils/suppress-logs.d.ts +3 -0
  288. package/dist/cli/tui/utils/suppress-logs.d.ts.map +1 -0
  289. package/dist/cli/tui/utils/suppress-logs.js +11 -0
  290. package/dist/cli/tui/utils/suppress-logs.js.map +1 -0
  291. package/dist/cli/tui/verify-suggestions.d.ts +5 -0
  292. package/dist/cli/tui/verify-suggestions.d.ts.map +1 -0
  293. package/dist/cli/tui/verify-suggestions.js +20 -0
  294. package/dist/cli/tui/verify-suggestions.js.map +1 -0
  295. package/dist/cli/tui/verify.d.ts +14 -0
  296. package/dist/cli/tui/verify.d.ts.map +1 -0
  297. package/dist/cli/tui/verify.js +101 -0
  298. package/dist/cli/tui/verify.js.map +1 -0
  299. package/dist/cli/tui/version.d.ts +2 -0
  300. package/dist/cli/tui/version.d.ts.map +1 -0
  301. package/dist/cli/tui/version.js +14 -0
  302. package/dist/cli/tui/version.js.map +1 -0
  303. package/dist/cli/uninstall.d.ts +2 -0
  304. package/dist/cli/uninstall.d.ts.map +1 -0
  305. package/dist/cli/uninstall.js +57 -0
  306. package/dist/cli/uninstall.js.map +1 -0
  307. package/dist/cli/warmup.d.ts +10 -2
  308. package/dist/cli/warmup.d.ts.map +1 -1
  309. package/dist/cli/warmup.js +226 -93
  310. package/dist/cli/warmup.js.map +1 -1
  311. package/dist/config.d.ts +28 -2
  312. package/dist/config.d.ts.map +1 -1
  313. package/dist/config.js +106 -56
  314. package/dist/config.js.map +1 -1
  315. package/dist/crawl/crawler.d.ts +6 -0
  316. package/dist/crawl/crawler.d.ts.map +1 -1
  317. package/dist/crawl/crawler.js +210 -209
  318. package/dist/crawl/crawler.js.map +1 -1
  319. package/dist/crawl/dedup.d.ts +1 -0
  320. package/dist/crawl/dedup.d.ts.map +1 -1
  321. package/dist/crawl/dedup.js +124 -81
  322. package/dist/crawl/dedup.js.map +1 -1
  323. package/dist/crawl/etag-incremental.d.ts +43 -0
  324. package/dist/crawl/etag-incremental.d.ts.map +1 -0
  325. package/dist/crawl/etag-incremental.js +94 -0
  326. package/dist/crawl/etag-incremental.js.map +1 -0
  327. package/dist/crawl/index-to-vec.d.ts +10 -0
  328. package/dist/crawl/index-to-vec.d.ts.map +1 -0
  329. package/dist/crawl/index-to-vec.js +44 -0
  330. package/dist/crawl/index-to-vec.js.map +1 -0
  331. package/dist/crawl/mapper.js +136 -164
  332. package/dist/crawl/mapper.js.map +1 -1
  333. package/dist/crawl/rate-limiter.js +63 -66
  334. package/dist/crawl/rate-limiter.js.map +1 -1
  335. package/dist/crawl/robots.js +58 -57
  336. package/dist/crawl/robots.js.map +1 -1
  337. package/dist/crawl/sitemap-first.d.ts +12 -0
  338. package/dist/crawl/sitemap-first.d.ts.map +1 -0
  339. package/dist/crawl/sitemap-first.js +47 -0
  340. package/dist/crawl/sitemap-first.js.map +1 -0
  341. package/dist/crawl/sitemap.js +33 -32
  342. package/dist/crawl/sitemap.js.map +1 -1
  343. package/dist/crawl/url-utils.d.ts +1 -0
  344. package/dist/crawl/url-utils.d.ts.map +1 -1
  345. package/dist/crawl/url-utils.js +49 -37
  346. package/dist/crawl/url-utils.js.map +1 -1
  347. package/dist/daemon/health-check.d.ts +16 -0
  348. package/dist/daemon/health-check.d.ts.map +1 -0
  349. package/dist/daemon/health-check.js +33 -0
  350. package/dist/daemon/health-check.js.map +1 -0
  351. package/dist/daemon/http-server.d.ts +26 -0
  352. package/dist/daemon/http-server.d.ts.map +1 -0
  353. package/dist/daemon/http-server.js +275 -0
  354. package/dist/daemon/http-server.js.map +1 -0
  355. package/dist/daemon/proxy.d.ts +10 -0
  356. package/dist/daemon/proxy.d.ts.map +1 -0
  357. package/dist/daemon/proxy.js +93 -0
  358. package/dist/daemon/proxy.js.map +1 -0
  359. package/dist/embedding/embed.d.ts +59 -0
  360. package/dist/embedding/embed.d.ts.map +1 -0
  361. package/dist/embedding/embed.js +233 -0
  362. package/dist/embedding/embed.js.map +1 -0
  363. package/dist/embedding/fastembed-provider.d.ts +19 -0
  364. package/dist/embedding/fastembed-provider.d.ts.map +1 -0
  365. package/dist/embedding/fastembed-provider.js +51 -0
  366. package/dist/embedding/fastembed-provider.js.map +1 -0
  367. package/dist/embedding/key-terms.d.ts +12 -0
  368. package/dist/embedding/key-terms.d.ts.map +1 -0
  369. package/dist/embedding/key-terms.js +234 -0
  370. package/dist/embedding/key-terms.js.map +1 -0
  371. package/dist/extraction/boilerplate.d.ts +15 -0
  372. package/dist/extraction/boilerplate.d.ts.map +1 -0
  373. package/dist/extraction/boilerplate.js +52 -0
  374. package/dist/extraction/boilerplate.js.map +1 -0
  375. package/dist/extraction/defuddle.d.ts.map +1 -1
  376. package/dist/extraction/defuddle.js +27 -23
  377. package/dist/extraction/defuddle.js.map +1 -1
  378. package/dist/extraction/extract.d.ts.map +1 -1
  379. package/dist/extraction/extract.js +76 -76
  380. package/dist/extraction/extract.js.map +1 -1
  381. package/dist/extraction/jsonld.js +50 -54
  382. package/dist/extraction/jsonld.js.map +1 -1
  383. package/dist/extraction/lang-hints.d.ts +2 -0
  384. package/dist/extraction/lang-hints.d.ts.map +1 -0
  385. package/dist/extraction/lang-hints.js +30 -0
  386. package/dist/extraction/lang-hints.js.map +1 -0
  387. package/dist/extraction/llm-fallback.d.ts +17 -0
  388. package/dist/extraction/llm-fallback.d.ts.map +1 -0
  389. package/dist/extraction/llm-fallback.js +130 -0
  390. package/dist/extraction/llm-fallback.js.map +1 -0
  391. package/dist/extraction/markdown-sanitize.d.ts +2 -0
  392. package/dist/extraction/markdown-sanitize.d.ts.map +1 -0
  393. package/dist/extraction/markdown-sanitize.js +151 -0
  394. package/dist/extraction/markdown-sanitize.js.map +1 -0
  395. package/dist/extraction/markdown.d.ts +11 -0
  396. package/dist/extraction/markdown.d.ts.map +1 -1
  397. package/dist/extraction/markdown.js +195 -91
  398. package/dist/extraction/markdown.js.map +1 -1
  399. package/dist/extraction/pipeline.d.ts +8 -0
  400. package/dist/extraction/pipeline.d.ts.map +1 -1
  401. package/dist/extraction/pipeline.js +57 -91
  402. package/dist/extraction/pipeline.js.map +1 -1
  403. package/dist/extraction/readability.d.ts +1 -1
  404. package/dist/extraction/readability.d.ts.map +1 -1
  405. package/dist/extraction/readability.js +28 -29
  406. package/dist/extraction/readability.js.map +1 -1
  407. package/dist/extraction/schema.d.ts +12 -0
  408. package/dist/extraction/schema.d.ts.map +1 -1
  409. package/dist/extraction/schema.js +135 -72
  410. package/dist/extraction/schema.js.map +1 -1
  411. package/dist/extraction/site-extractors/docs-generic.d.ts.map +1 -1
  412. package/dist/extraction/site-extractors/docs-generic.js +81 -91
  413. package/dist/extraction/site-extractors/docs-generic.js.map +1 -1
  414. package/dist/extraction/site-extractors/github.d.ts.map +1 -1
  415. package/dist/extraction/site-extractors/github.js +87 -95
  416. package/dist/extraction/site-extractors/github.js.map +1 -1
  417. package/dist/extraction/site-extractors/mdn.d.ts.map +1 -1
  418. package/dist/extraction/site-extractors/mdn.js +46 -54
  419. package/dist/extraction/site-extractors/mdn.js.map +1 -1
  420. package/dist/extraction/site-extractors/stackoverflow.d.ts.map +1 -1
  421. package/dist/extraction/site-extractors/stackoverflow.js +71 -80
  422. package/dist/extraction/site-extractors/stackoverflow.js.map +1 -1
  423. package/dist/extraction/structured-data.d.ts +4 -0
  424. package/dist/extraction/structured-data.d.ts.map +1 -0
  425. package/dist/extraction/structured-data.js +173 -0
  426. package/dist/extraction/structured-data.js.map +1 -0
  427. package/dist/extraction/structured.d.ts +4 -0
  428. package/dist/extraction/structured.d.ts.map +1 -0
  429. package/dist/extraction/structured.js +163 -0
  430. package/dist/extraction/structured.js.map +1 -0
  431. package/dist/extraction/v1/classifier.d.ts +3 -0
  432. package/dist/extraction/v1/classifier.d.ts.map +1 -0
  433. package/dist/extraction/v1/classifier.js +110 -0
  434. package/dist/extraction/v1/classifier.js.map +1 -0
  435. package/dist/extraction/v1/extract-provider.d.ts +16 -0
  436. package/dist/extraction/v1/extract-provider.d.ts.map +1 -0
  437. package/dist/extraction/v1/extract-provider.js +43 -0
  438. package/dist/extraction/v1/extract-provider.js.map +1 -0
  439. package/dist/extraction/v1/local-llm.d.ts +8 -0
  440. package/dist/extraction/v1/local-llm.d.ts.map +1 -0
  441. package/dist/extraction/v1/local-llm.js +58 -0
  442. package/dist/extraction/v1/local-llm.js.map +1 -0
  443. package/dist/extraction/v1/news.d.ts +3 -0
  444. package/dist/extraction/v1/news.d.ts.map +1 -0
  445. package/dist/extraction/v1/news.js +61 -0
  446. package/dist/extraction/v1/news.js.map +1 -0
  447. package/dist/extraction/v1/product.d.ts +3 -0
  448. package/dist/extraction/v1/product.d.ts.map +1 -0
  449. package/dist/extraction/v1/product.js +166 -0
  450. package/dist/extraction/v1/product.js.map +1 -0
  451. package/dist/extraction/v1/recipe.d.ts +3 -0
  452. package/dist/extraction/v1/recipe.d.ts.map +1 -0
  453. package/dist/extraction/v1/recipe.js +136 -0
  454. package/dist/extraction/v1/recipe.js.map +1 -0
  455. package/dist/extraction/v1/routed.d.ts +17 -0
  456. package/dist/extraction/v1/routed.d.ts.map +1 -0
  457. package/dist/extraction/v1/routed.js +68 -0
  458. package/dist/extraction/v1/routed.js.map +1 -0
  459. package/dist/extraction/v1/schemas/Article.d.ts +11 -0
  460. package/dist/extraction/v1/schemas/Article.d.ts.map +1 -0
  461. package/dist/extraction/v1/schemas/Article.js +23 -0
  462. package/dist/extraction/v1/schemas/Article.js.map +1 -0
  463. package/dist/extraction/v1/schemas/CodeSnippet.d.ts +9 -0
  464. package/dist/extraction/v1/schemas/CodeSnippet.d.ts.map +1 -0
  465. package/dist/extraction/v1/schemas/CodeSnippet.js +90 -0
  466. package/dist/extraction/v1/schemas/CodeSnippet.js.map +1 -0
  467. package/dist/extraction/v1/schemas/EventListing.d.ts +10 -0
  468. package/dist/extraction/v1/schemas/EventListing.d.ts.map +1 -0
  469. package/dist/extraction/v1/schemas/EventListing.js +122 -0
  470. package/dist/extraction/v1/schemas/EventListing.js.map +1 -0
  471. package/dist/extraction/v1/schemas/Paper.d.ts +10 -0
  472. package/dist/extraction/v1/schemas/Paper.d.ts.map +1 -0
  473. package/dist/extraction/v1/schemas/Paper.js +156 -0
  474. package/dist/extraction/v1/schemas/Paper.js.map +1 -0
  475. package/dist/extraction/v1/schemas/Product.d.ts +17 -0
  476. package/dist/extraction/v1/schemas/Product.d.ts.map +1 -0
  477. package/dist/extraction/v1/schemas/Product.js +149 -0
  478. package/dist/extraction/v1/schemas/Product.js.map +1 -0
  479. package/dist/extraction/v1/schemas/Recipe.d.ts +14 -0
  480. package/dist/extraction/v1/schemas/Recipe.d.ts.map +1 -0
  481. package/dist/extraction/v1/schemas/Recipe.js +160 -0
  482. package/dist/extraction/v1/schemas/Recipe.js.map +1 -0
  483. package/dist/extraction/v1/schemas/index.d.ts +13 -0
  484. package/dist/extraction/v1/schemas/index.d.ts.map +1 -0
  485. package/dist/extraction/v1/schemas/index.js +44 -0
  486. package/dist/extraction/v1/schemas/index.js.map +1 -0
  487. package/dist/extraction/v1/site-extractors.d.ts +5 -0
  488. package/dist/extraction/v1/site-extractors.d.ts.map +1 -0
  489. package/dist/extraction/v1/site-extractors.js +31 -0
  490. package/dist/extraction/v1/site-extractors.js.map +1 -0
  491. package/dist/fetch/action-executor.d.ts +28 -0
  492. package/dist/fetch/action-executor.d.ts.map +1 -0
  493. package/dist/fetch/action-executor.js +88 -0
  494. package/dist/fetch/action-executor.js.map +1 -0
  495. package/dist/fetch/auth.d.ts +2 -1
  496. package/dist/fetch/auth.d.ts.map +1 -1
  497. package/dist/fetch/auth.js +56 -26
  498. package/dist/fetch/auth.js.map +1 -1
  499. package/dist/fetch/browser-pool.d.ts +30 -11
  500. package/dist/fetch/browser-pool.d.ts.map +1 -1
  501. package/dist/fetch/browser-pool.js +303 -127
  502. package/dist/fetch/browser-pool.js.map +1 -1
  503. package/dist/fetch/browser-selector.d.ts +17 -0
  504. package/dist/fetch/browser-selector.d.ts.map +1 -0
  505. package/dist/fetch/browser-selector.js +72 -0
  506. package/dist/fetch/browser-selector.js.map +1 -0
  507. package/dist/fetch/browser-types.d.ts +3 -0
  508. package/dist/fetch/browser-types.d.ts.map +1 -0
  509. package/dist/fetch/browser-types.js +45 -0
  510. package/dist/fetch/browser-types.js.map +1 -0
  511. package/dist/fetch/cdp-client.d.ts +9 -0
  512. package/dist/fetch/cdp-client.d.ts.map +1 -0
  513. package/dist/fetch/cdp-client.js +89 -0
  514. package/dist/fetch/cdp-client.js.map +1 -0
  515. package/dist/fetch/content-check.js +39 -46
  516. package/dist/fetch/content-check.js.map +1 -1
  517. package/dist/fetch/http-client.d.ts +4 -0
  518. package/dist/fetch/http-client.d.ts.map +1 -1
  519. package/dist/fetch/http-client.js +147 -128
  520. package/dist/fetch/http-client.js.map +1 -1
  521. package/dist/fetch/lightpanda.d.ts +28 -0
  522. package/dist/fetch/lightpanda.d.ts.map +1 -0
  523. package/dist/fetch/lightpanda.js +174 -0
  524. package/dist/fetch/lightpanda.js.map +1 -0
  525. package/dist/fetch/playwright-tier.d.ts +19 -0
  526. package/dist/fetch/playwright-tier.d.ts.map +1 -0
  527. package/dist/fetch/playwright-tier.js +76 -0
  528. package/dist/fetch/playwright-tier.js.map +1 -0
  529. package/dist/fetch/router.d.ts +49 -3
  530. package/dist/fetch/router.d.ts.map +1 -1
  531. package/dist/fetch/router.js +185 -81
  532. package/dist/fetch/router.js.map +1 -1
  533. package/dist/index.js +97 -17
  534. package/dist/index.js.map +1 -1
  535. package/dist/instructions.d.ts +31 -0
  536. package/dist/instructions.d.ts.map +1 -0
  537. package/dist/instructions.js +245 -0
  538. package/dist/instructions.js.map +1 -0
  539. package/dist/integrations/cloud/llm/anthropic.d.ts +3 -0
  540. package/dist/integrations/cloud/llm/anthropic.d.ts.map +1 -0
  541. package/dist/integrations/cloud/llm/anthropic.js +41 -0
  542. package/dist/integrations/cloud/llm/anthropic.js.map +1 -0
  543. package/dist/integrations/cloud/llm/cache.d.ts +5 -0
  544. package/dist/integrations/cloud/llm/cache.d.ts.map +1 -0
  545. package/dist/integrations/cloud/llm/cache.js +49 -0
  546. package/dist/integrations/cloud/llm/cache.js.map +1 -0
  547. package/dist/integrations/cloud/llm/gemini.d.ts +3 -0
  548. package/dist/integrations/cloud/llm/gemini.d.ts.map +1 -0
  549. package/dist/integrations/cloud/llm/gemini.js +37 -0
  550. package/dist/integrations/cloud/llm/gemini.js.map +1 -0
  551. package/dist/integrations/cloud/llm/groq.d.ts +3 -0
  552. package/dist/integrations/cloud/llm/groq.d.ts.map +1 -0
  553. package/dist/integrations/cloud/llm/groq.js +74 -0
  554. package/dist/integrations/cloud/llm/groq.js.map +1 -0
  555. package/dist/integrations/cloud/llm/hash.d.ts +3 -0
  556. package/dist/integrations/cloud/llm/hash.d.ts.map +1 -0
  557. package/dist/integrations/cloud/llm/hash.js +26 -0
  558. package/dist/integrations/cloud/llm/hash.js.map +1 -0
  559. package/dist/integrations/cloud/llm/openai.d.ts +3 -0
  560. package/dist/integrations/cloud/llm/openai.d.ts.map +1 -0
  561. package/dist/integrations/cloud/llm/openai.js +43 -0
  562. package/dist/integrations/cloud/llm/openai.js.map +1 -0
  563. package/dist/integrations/cloud/llm/select.d.ts +5 -0
  564. package/dist/integrations/cloud/llm/select.d.ts.map +1 -0
  565. package/dist/integrations/cloud/llm/select.js +30 -0
  566. package/dist/integrations/cloud/llm/select.js.map +1 -0
  567. package/dist/integrations/cloud/llm/types.d.ts +24 -0
  568. package/dist/integrations/cloud/llm/types.d.ts.map +1 -0
  569. package/dist/integrations/cloud/llm/types.js +1 -0
  570. package/dist/integrations/cloud/llm/types.js.map +1 -0
  571. package/dist/integrations/cloud/llm/validate.d.ts +6 -0
  572. package/dist/integrations/cloud/llm/validate.d.ts.map +1 -0
  573. package/dist/integrations/cloud/llm/validate.js +63 -0
  574. package/dist/integrations/cloud/llm/validate.js.map +1 -0
  575. package/dist/logger.d.ts +4 -1
  576. package/dist/logger.d.ts.map +1 -1
  577. package/dist/logger.js +71 -30
  578. package/dist/logger.js.map +1 -1
  579. package/dist/pdf-parse.d.js +1 -0
  580. package/dist/pdf-parse.d.js.map +1 -0
  581. package/dist/plugins/loader.d.ts +20 -0
  582. package/dist/plugins/loader.d.ts.map +1 -0
  583. package/dist/plugins/loader.js +157 -0
  584. package/dist/plugins/loader.js.map +1 -0
  585. package/dist/plugins/registry.d.ts +26 -0
  586. package/dist/plugins/registry.d.ts.map +1 -0
  587. package/dist/plugins/registry.js +71 -0
  588. package/dist/plugins/registry.js.map +1 -0
  589. package/dist/plugins/validate.d.ts +9 -0
  590. package/dist/plugins/validate.d.ts.map +1 -0
  591. package/dist/plugins/validate.js +79 -0
  592. package/dist/plugins/validate.js.map +1 -0
  593. package/dist/providers/embed-provider.d.ts +11 -0
  594. package/dist/providers/embed-provider.d.ts.map +1 -0
  595. package/dist/providers/embed-provider.js +24 -0
  596. package/dist/providers/embed-provider.js.map +1 -0
  597. package/dist/providers/extract-provider.d.ts +23 -0
  598. package/dist/providers/extract-provider.d.ts.map +1 -0
  599. package/dist/providers/extract-provider.js +25 -0
  600. package/dist/providers/extract-provider.js.map +1 -0
  601. package/dist/providers/rerank-provider.d.ts +16 -0
  602. package/dist/providers/rerank-provider.d.ts.map +1 -0
  603. package/dist/providers/rerank-provider.js +28 -0
  604. package/dist/providers/rerank-provider.js.map +1 -0
  605. package/dist/providers/search-provider.d.ts +25 -0
  606. package/dist/providers/search-provider.d.ts.map +1 -0
  607. package/dist/providers/search-provider.js +44 -0
  608. package/dist/providers/search-provider.js.map +1 -0
  609. package/dist/providers/vector-store.d.ts +27 -0
  610. package/dist/providers/vector-store.d.ts.map +1 -0
  611. package/dist/providers/vector-store.js +27 -0
  612. package/dist/providers/vector-store.js.map +1 -0
  613. package/dist/python-env.d.ts +9 -0
  614. package/dist/python-env.d.ts.map +1 -0
  615. package/dist/python-env.js +13 -0
  616. package/dist/python-env.js.map +1 -0
  617. package/dist/repl/commands/agent.d.ts +5 -0
  618. package/dist/repl/commands/agent.d.ts.map +1 -0
  619. package/dist/repl/commands/agent.js +62 -0
  620. package/dist/repl/commands/agent.js.map +1 -0
  621. package/dist/repl/commands/cache.d.ts +4 -0
  622. package/dist/repl/commands/cache.d.ts.map +1 -0
  623. package/dist/repl/commands/cache.js +43 -0
  624. package/dist/repl/commands/cache.js.map +1 -0
  625. package/dist/repl/commands/crawl.d.ts +7 -0
  626. package/dist/repl/commands/crawl.d.ts.map +1 -0
  627. package/dist/repl/commands/crawl.js +44 -0
  628. package/dist/repl/commands/crawl.js.map +1 -0
  629. package/dist/repl/commands/extract.d.ts +5 -0
  630. package/dist/repl/commands/extract.d.ts.map +1 -0
  631. package/dist/repl/commands/extract.js +47 -0
  632. package/dist/repl/commands/extract.js.map +1 -0
  633. package/dist/repl/commands/fetch.d.ts +5 -0
  634. package/dist/repl/commands/fetch.d.ts.map +1 -0
  635. package/dist/repl/commands/fetch.js +67 -0
  636. package/dist/repl/commands/fetch.js.map +1 -0
  637. package/dist/repl/commands/find-similar.d.ts +5 -0
  638. package/dist/repl/commands/find-similar.d.ts.map +1 -0
  639. package/dist/repl/commands/find-similar.js +74 -0
  640. package/dist/repl/commands/find-similar.js.map +1 -0
  641. package/dist/repl/commands/research.d.ts +5 -0
  642. package/dist/repl/commands/research.d.ts.map +1 -0
  643. package/dist/repl/commands/research.js +65 -0
  644. package/dist/repl/commands/research.js.map +1 -0
  645. package/dist/repl/commands/search.d.ts +5 -0
  646. package/dist/repl/commands/search.d.ts.map +1 -0
  647. package/dist/repl/commands/search.js +74 -0
  648. package/dist/repl/commands/search.js.map +1 -0
  649. package/dist/repl/commands/types.d.ts +9 -0
  650. package/dist/repl/commands/types.d.ts.map +1 -0
  651. package/dist/repl/commands/types.js +1 -0
  652. package/dist/repl/commands/types.js.map +1 -0
  653. package/dist/repl/formatters.d.ts +13 -0
  654. package/dist/repl/formatters.d.ts.map +1 -0
  655. package/dist/repl/formatters.js +283 -0
  656. package/dist/repl/formatters.js.map +1 -0
  657. package/dist/repl/parser.d.ts +9 -0
  658. package/dist/repl/parser.d.ts.map +1 -0
  659. package/dist/repl/parser.js +86 -0
  660. package/dist/repl/parser.js.map +1 -0
  661. package/dist/repl/shell.d.ts +8 -0
  662. package/dist/repl/shell.d.ts.map +1 -0
  663. package/dist/repl/shell.js +184 -0
  664. package/dist/repl/shell.js.map +1 -0
  665. package/dist/research/branch-exploration.d.ts +14 -0
  666. package/dist/research/branch-exploration.d.ts.map +1 -0
  667. package/dist/research/branch-exploration.js +100 -0
  668. package/dist/research/branch-exploration.js.map +1 -0
  669. package/dist/research/brief.d.ts +5 -0
  670. package/dist/research/brief.d.ts.map +1 -0
  671. package/dist/research/brief.js +242 -0
  672. package/dist/research/brief.js.map +1 -0
  673. package/dist/research/citation-graph.d.ts +9 -0
  674. package/dist/research/citation-graph.d.ts.map +1 -0
  675. package/dist/research/citation-graph.js +114 -0
  676. package/dist/research/citation-graph.js.map +1 -0
  677. package/dist/research/decompose.d.ts +14 -0
  678. package/dist/research/decompose.d.ts.map +1 -0
  679. package/dist/research/decompose.js +439 -0
  680. package/dist/research/decompose.js.map +1 -0
  681. package/dist/research/pipeline.d.ts +5 -0
  682. package/dist/research/pipeline.d.ts.map +1 -0
  683. package/dist/research/pipeline.js +269 -0
  684. package/dist/research/pipeline.js.map +1 -0
  685. package/dist/research/synthesis-local.d.ts +16 -0
  686. package/dist/research/synthesis-local.d.ts.map +1 -0
  687. package/dist/research/synthesis-local.js +73 -0
  688. package/dist/research/synthesis-local.js.map +1 -0
  689. package/dist/research/synthesize.d.ts +10 -0
  690. package/dist/research/synthesize.d.ts.map +1 -0
  691. package/dist/research/synthesize.js +137 -0
  692. package/dist/research/synthesize.js.map +1 -0
  693. package/dist/search/answer-synthesis.d.ts +33 -0
  694. package/dist/search/answer-synthesis.d.ts.map +1 -0
  695. package/dist/search/answer-synthesis.js +244 -0
  696. package/dist/search/answer-synthesis.js.map +1 -0
  697. package/dist/search/context-formatter.d.ts +3 -0
  698. package/dist/search/context-formatter.d.ts.map +1 -0
  699. package/dist/search/context-formatter.js +56 -0
  700. package/dist/search/context-formatter.js.map +1 -0
  701. package/dist/search/dedup.d.ts +1 -0
  702. package/dist/search/dedup.d.ts.map +1 -1
  703. package/dist/search/dedup.js +40 -32
  704. package/dist/search/dedup.js.map +1 -1
  705. package/dist/search/engines/arxiv.d.ts +7 -0
  706. package/dist/search/engines/arxiv.d.ts.map +1 -0
  707. package/dist/search/engines/arxiv.js +70 -0
  708. package/dist/search/engines/arxiv.js.map +1 -0
  709. package/dist/search/engines/bing-news.d.ts +7 -0
  710. package/dist/search/engines/bing-news.d.ts.map +1 -0
  711. package/dist/search/engines/bing-news.js +97 -0
  712. package/dist/search/engines/bing-news.js.map +1 -0
  713. package/dist/search/engines/bing.d.ts +1 -0
  714. package/dist/search/engines/bing.d.ts.map +1 -1
  715. package/dist/search/engines/bing.js +100 -44
  716. package/dist/search/engines/bing.js.map +1 -1
  717. package/dist/search/engines/devdocs.d.ts +6 -0
  718. package/dist/search/engines/devdocs.d.ts.map +1 -0
  719. package/dist/search/engines/devdocs.js +56 -0
  720. package/dist/search/engines/devdocs.js.map +1 -0
  721. package/dist/search/engines/duckduckgo.d.ts.map +1 -1
  722. package/dist/search/engines/duckduckgo.js +56 -44
  723. package/dist/search/engines/duckduckgo.js.map +1 -1
  724. package/dist/search/engines/github-code.d.ts +7 -0
  725. package/dist/search/engines/github-code.d.ts.map +1 -0
  726. package/dist/search/engines/github-code.js +55 -0
  727. package/dist/search/engines/github-code.js.map +1 -0
  728. package/dist/search/engines/hn-algolia.d.ts +7 -0
  729. package/dist/search/engines/hn-algolia.d.ts.map +1 -0
  730. package/dist/search/engines/hn-algolia.js +76 -0
  731. package/dist/search/engines/hn-algolia.js.map +1 -0
  732. package/dist/search/engines/lobsters.d.ts +7 -0
  733. package/dist/search/engines/lobsters.d.ts.map +1 -0
  734. package/dist/search/engines/lobsters.js +83 -0
  735. package/dist/search/engines/lobsters.js.map +1 -0
  736. package/dist/search/engines/mdn.d.ts +7 -0
  737. package/dist/search/engines/mdn.d.ts.map +1 -0
  738. package/dist/search/engines/mdn.js +48 -0
  739. package/dist/search/engines/mdn.js.map +1 -0
  740. package/dist/search/engines/semantic-scholar.d.ts +7 -0
  741. package/dist/search/engines/semantic-scholar.d.ts.map +1 -0
  742. package/dist/search/engines/semantic-scholar.js +69 -0
  743. package/dist/search/engines/semantic-scholar.js.map +1 -0
  744. package/dist/search/engines/stackoverflow.d.ts +7 -0
  745. package/dist/search/engines/stackoverflow.d.ts.map +1 -0
  746. package/dist/search/engines/stackoverflow.js +73 -0
  747. package/dist/search/engines/stackoverflow.js.map +1 -0
  748. package/dist/search/engines/startpage.d.ts.map +1 -1
  749. package/dist/search/engines/startpage.js +65 -46
  750. package/dist/search/engines/startpage.js.map +1 -1
  751. package/dist/search/evidence.d.ts +25 -0
  752. package/dist/search/evidence.d.ts.map +1 -0
  753. package/dist/search/evidence.js +220 -0
  754. package/dist/search/evidence.js.map +1 -0
  755. package/dist/search/filters.js +49 -55
  756. package/dist/search/filters.js.map +1 -1
  757. package/dist/search/find-similar/crawl-rank.d.ts +9 -0
  758. package/dist/search/find-similar/crawl-rank.d.ts.map +1 -0
  759. package/dist/search/find-similar/crawl-rank.js +272 -0
  760. package/dist/search/find-similar/crawl-rank.js.map +1 -0
  761. package/dist/search/find-similar/mode.d.ts +4 -0
  762. package/dist/search/find-similar/mode.d.ts.map +1 -0
  763. package/dist/search/find-similar/mode.js +12 -0
  764. package/dist/search/find-similar/mode.js.map +1 -0
  765. package/dist/search/find-similar.d.ts +5 -0
  766. package/dist/search/find-similar.d.ts.map +1 -0
  767. package/dist/search/find-similar.js +509 -0
  768. package/dist/search/find-similar.js.map +1 -0
  769. package/dist/search/highlights.d.ts +19 -0
  770. package/dist/search/highlights.d.ts.map +1 -0
  771. package/dist/search/highlights.js +167 -0
  772. package/dist/search/highlights.js.map +1 -0
  773. package/dist/search/language-filter.d.ts +29 -0
  774. package/dist/search/language-filter.d.ts.map +1 -0
  775. package/dist/search/language-filter.js +126 -0
  776. package/dist/search/language-filter.js.map +1 -0
  777. package/dist/search/legacy/searxng-orchestrator.d.ts +4 -0
  778. package/dist/search/legacy/searxng-orchestrator.d.ts.map +1 -0
  779. package/dist/search/legacy/searxng-orchestrator.js +501 -0
  780. package/dist/search/legacy/searxng-orchestrator.js.map +1 -0
  781. package/dist/search/legacy/searxng-provider.d.ts +7 -0
  782. package/dist/search/legacy/searxng-provider.d.ts.map +1 -0
  783. package/dist/search/legacy/searxng-provider.js +11 -0
  784. package/dist/search/legacy/searxng-provider.js.map +1 -0
  785. package/dist/search/multi-query.d.ts +25 -0
  786. package/dist/search/multi-query.d.ts.map +1 -0
  787. package/dist/search/multi-query.js +228 -0
  788. package/dist/search/multi-query.js.map +1 -0
  789. package/dist/search/query.js +32 -34
  790. package/dist/search/query.js.map +1 -1
  791. package/dist/search/rerank.d.ts +3 -1
  792. package/dist/search/rerank.d.ts.map +1 -1
  793. package/dist/search/rerank.js +44 -35
  794. package/dist/search/rerank.js.map +1 -1
  795. package/dist/search/reranker/authority-boost.d.ts +3 -0
  796. package/dist/search/reranker/authority-boost.d.ts.map +1 -0
  797. package/dist/search/reranker/authority-boost.js +179 -0
  798. package/dist/search/reranker/authority-boost.js.map +1 -0
  799. package/dist/search/reranker/consensus-boost.d.ts +3 -0
  800. package/dist/search/reranker/consensus-boost.d.ts.map +1 -0
  801. package/dist/search/reranker/consensus-boost.js +27 -0
  802. package/dist/search/reranker/consensus-boost.js.map +1 -0
  803. package/dist/search/reranker/recency-boost.d.ts +3 -0
  804. package/dist/search/reranker/recency-boost.d.ts.map +1 -0
  805. package/dist/search/reranker/recency-boost.js +13 -0
  806. package/dist/search/reranker/recency-boost.js.map +1 -0
  807. package/dist/search/reranker/recency.d.ts +3 -0
  808. package/dist/search/reranker/recency.d.ts.map +1 -0
  809. package/dist/search/reranker/recency.js +23 -0
  810. package/dist/search/reranker/recency.js.map +1 -0
  811. package/dist/search/reranker/transformers-rerank-provider.d.ts +12 -0
  812. package/dist/search/reranker/transformers-rerank-provider.d.ts.map +1 -0
  813. package/dist/search/reranker/transformers-rerank-provider.js +78 -0
  814. package/dist/search/reranker/transformers-rerank-provider.js.map +1 -0
  815. package/dist/search/rrf.d.ts +17 -0
  816. package/dist/search/rrf.d.ts.map +1 -0
  817. package/dist/search/rrf.js +39 -0
  818. package/dist/search/rrf.js.map +1 -0
  819. package/dist/search/sampling.d.ts +25 -0
  820. package/dist/search/sampling.d.ts.map +1 -0
  821. package/dist/search/sampling.js +52 -0
  822. package/dist/search/sampling.js.map +1 -0
  823. package/dist/search/searxng.d.ts.map +1 -1
  824. package/dist/search/searxng.js +69 -79
  825. package/dist/search/searxng.js.map +1 -1
  826. package/dist/search/tokens.d.ts +3 -0
  827. package/dist/search/tokens.d.ts.map +1 -0
  828. package/dist/search/tokens.js +39 -0
  829. package/dist/search/tokens.js.map +1 -0
  830. package/dist/search/truncate.d.ts +6 -0
  831. package/dist/search/truncate.d.ts.map +1 -0
  832. package/dist/search/truncate.js +26 -0
  833. package/dist/search/truncate.js.map +1 -0
  834. package/dist/search/url-unwrap.d.ts +3 -0
  835. package/dist/search/url-unwrap.d.ts.map +1 -0
  836. package/dist/search/url-unwrap.js +43 -0
  837. package/dist/search/url-unwrap.js.map +1 -0
  838. package/dist/search/v1/context-rank.d.ts +13 -0
  839. package/dist/search/v1/context-rank.d.ts.map +1 -0
  840. package/dist/search/v1/context-rank.js +74 -0
  841. package/dist/search/v1/context-rank.js.map +1 -0
  842. package/dist/search/v1/engine-base.d.ts +27 -0
  843. package/dist/search/v1/engine-base.d.ts.map +1 -0
  844. package/dist/search/v1/engine-base.js +110 -0
  845. package/dist/search/v1/engine-base.js.map +1 -0
  846. package/dist/search/v1/intent-router.d.ts +22 -0
  847. package/dist/search/v1/intent-router.d.ts.map +1 -0
  848. package/dist/search/v1/intent-router.js +138 -0
  849. package/dist/search/v1/intent-router.js.map +1 -0
  850. package/dist/search/v1/orchestrator.d.ts +24 -0
  851. package/dist/search/v1/orchestrator.d.ts.map +1 -0
  852. package/dist/search/v1/orchestrator.js +163 -0
  853. package/dist/search/v1/orchestrator.js.map +1 -0
  854. package/dist/search/v1/recency-boost.d.ts +9 -0
  855. package/dist/search/v1/recency-boost.d.ts.map +1 -0
  856. package/dist/search/v1/recency-boost.js +37 -0
  857. package/dist/search/v1/recency-boost.js.map +1 -0
  858. package/dist/search/v1/recent-cache-dedup.d.ts +6 -0
  859. package/dist/search/v1/recent-cache-dedup.d.ts.map +1 -0
  860. package/dist/search/v1/recent-cache-dedup.js +85 -0
  861. package/dist/search/v1/recent-cache-dedup.js.map +1 -0
  862. package/dist/search/v1/rss/feed-config.d.ts +21 -0
  863. package/dist/search/v1/rss/feed-config.d.ts.map +1 -0
  864. package/dist/search/v1/rss/feed-config.js +90 -0
  865. package/dist/search/v1/rss/feed-config.js.map +1 -0
  866. package/dist/search/v1/rss/feed-parser.d.ts +14 -0
  867. package/dist/search/v1/rss/feed-parser.d.ts.map +1 -0
  868. package/dist/search/v1/rss/feed-parser.js +104 -0
  869. package/dist/search/v1/rss/feed-parser.js.map +1 -0
  870. package/dist/search/v1/rss/feed-poller.d.ts +22 -0
  871. package/dist/search/v1/rss/feed-poller.d.ts.map +1 -0
  872. package/dist/search/v1/rss/feed-poller.js +102 -0
  873. package/dist/search/v1/rss/feed-poller.js.map +1 -0
  874. package/dist/search/v1/rss/feed-store.d.ts +30 -0
  875. package/dist/search/v1/rss/feed-store.d.ts.map +1 -0
  876. package/dist/search/v1/rss/feed-store.js +134 -0
  877. package/dist/search/v1/rss/feed-store.js.map +1 -0
  878. package/dist/search/v1/rss/rss-engine.d.ts +6 -0
  879. package/dist/search/v1/rss/rss-engine.d.ts.map +1 -0
  880. package/dist/search/v1/rss/rss-engine.js +28 -0
  881. package/dist/search/v1/rss/rss-engine.js.map +1 -0
  882. package/dist/search/v1/v1-provider.d.ts +7 -0
  883. package/dist/search/v1/v1-provider.d.ts.map +1 -0
  884. package/dist/search/v1/v1-provider.js +68 -0
  885. package/dist/search/v1/v1-provider.js.map +1 -0
  886. package/dist/search/v1/verticals/code.d.ts +4 -0
  887. package/dist/search/v1/verticals/code.d.ts.map +1 -0
  888. package/dist/search/v1/verticals/code.js +20 -0
  889. package/dist/search/v1/verticals/code.js.map +1 -0
  890. package/dist/search/v1/verticals/docs.d.ts +4 -0
  891. package/dist/search/v1/verticals/docs.d.ts.map +1 -0
  892. package/dist/search/v1/verticals/docs.js +20 -0
  893. package/dist/search/v1/verticals/docs.js.map +1 -0
  894. package/dist/search/v1/verticals/general.d.ts +4 -0
  895. package/dist/search/v1/verticals/general.d.ts.map +1 -0
  896. package/dist/search/v1/verticals/general.js +22 -0
  897. package/dist/search/v1/verticals/general.js.map +1 -0
  898. package/dist/search/v1/verticals/news.d.ts +10 -0
  899. package/dist/search/v1/verticals/news.d.ts.map +1 -0
  900. package/dist/search/v1/verticals/news.js +52 -0
  901. package/dist/search/v1/verticals/news.js.map +1 -0
  902. package/dist/search/v1/verticals/papers.d.ts +4 -0
  903. package/dist/search/v1/verticals/papers.d.ts.map +1 -0
  904. package/dist/search/v1/verticals/papers.js +23 -0
  905. package/dist/search/v1/verticals/papers.js.map +1 -0
  906. package/dist/search/validator.js +31 -31
  907. package/dist/search/validator.js.map +1 -1
  908. package/dist/searxng/bootstrap.d.ts +30 -0
  909. package/dist/searxng/bootstrap.d.ts.map +1 -1
  910. package/dist/searxng/bootstrap.js +223 -85
  911. package/dist/searxng/bootstrap.js.map +1 -1
  912. package/dist/searxng/docker.d.ts.map +1 -1
  913. package/dist/searxng/docker.js +69 -60
  914. package/dist/searxng/docker.js.map +1 -1
  915. package/dist/searxng/process.d.ts +13 -1
  916. package/dist/searxng/process.d.ts.map +1 -1
  917. package/dist/searxng/process.js +231 -164
  918. package/dist/searxng/process.js.map +1 -1
  919. package/dist/server/backend-status.d.ts +13 -0
  920. package/dist/server/backend-status.d.ts.map +1 -0
  921. package/dist/server/backend-status.js +40 -0
  922. package/dist/server/backend-status.js.map +1 -0
  923. package/dist/server/tool-schemas.d.ts +549 -0
  924. package/dist/server/tool-schemas.d.ts.map +1 -0
  925. package/dist/server/tool-schemas.js +464 -0
  926. package/dist/server/tool-schemas.js.map +1 -0
  927. package/dist/server/warmup-on-start.d.ts +9 -0
  928. package/dist/server/warmup-on-start.d.ts.map +1 -0
  929. package/dist/server/warmup-on-start.js +55 -0
  930. package/dist/server/warmup-on-start.js.map +1 -0
  931. package/dist/server.d.ts +17 -0
  932. package/dist/server.d.ts.map +1 -1
  933. package/dist/server.js +454 -297
  934. package/dist/server.js.map +1 -1
  935. package/dist/tools/agent.d.ts +5 -0
  936. package/dist/tools/agent.d.ts.map +1 -0
  937. package/dist/tools/agent.js +128 -0
  938. package/dist/tools/agent.js.map +1 -0
  939. package/dist/tools/cache.d.ts +2 -1
  940. package/dist/tools/cache.d.ts.map +1 -1
  941. package/dist/tools/cache.js +175 -44
  942. package/dist/tools/cache.js.map +1 -1
  943. package/dist/tools/crawl.d.ts.map +1 -1
  944. package/dist/tools/crawl.js +171 -88
  945. package/dist/tools/crawl.js.map +1 -1
  946. package/dist/tools/extract.d.ts +2 -2
  947. package/dist/tools/extract.d.ts.map +1 -1
  948. package/dist/tools/extract.js +175 -59
  949. package/dist/tools/extract.js.map +1 -1
  950. package/dist/tools/fetch.d.ts +2 -2
  951. package/dist/tools/fetch.d.ts.map +1 -1
  952. package/dist/tools/fetch.js +161 -68
  953. package/dist/tools/fetch.js.map +1 -1
  954. package/dist/tools/find-similar.d.ts +5 -0
  955. package/dist/tools/find-similar.d.ts.map +1 -0
  956. package/dist/tools/find-similar.js +127 -0
  957. package/dist/tools/find-similar.js.map +1 -0
  958. package/dist/tools/research.d.ts +5 -0
  959. package/dist/tools/research.d.ts.map +1 -0
  960. package/dist/tools/research.js +107 -0
  961. package/dist/tools/research.js.map +1 -0
  962. package/dist/tools/search.d.ts +10 -2
  963. package/dist/tools/search.d.ts.map +1 -1
  964. package/dist/tools/search.js +13 -158
  965. package/dist/tools/search.js.map +1 -1
  966. package/dist/types.d.ts +350 -7
  967. package/dist/types.d.ts.map +1 -1
  968. package/dist/types.js +6 -1
  969. package/dist/types.js.map +1 -1
  970. package/dist/util/mode.d.ts +4 -0
  971. package/dist/util/mode.d.ts.map +1 -0
  972. package/dist/util/mode.js +34 -0
  973. package/dist/util/mode.js.map +1 -0
  974. package/package.json +78 -8
  975. package/dist/extraction/trafilatura.d.ts +0 -6
  976. package/dist/extraction/trafilatura.d.ts.map +0 -1
  977. package/dist/extraction/trafilatura.js +0 -105
  978. package/dist/extraction/trafilatura.js.map +0 -1
  979. package/dist/search/flashrank.d.ts +0 -12
  980. package/dist/search/flashrank.d.ts.map +0 -1
  981. package/dist/search/flashrank.js +0 -63
  982. package/dist/search/flashrank.js.map +0 -1
@@ -0,0 +1,25 @@
1
+ import type { Citation, EvidenceItem, SearchInput, SearchOutput, SearchResultItem, SourceSpan } from '../types.js';
2
/** Optional limits accepted by `buildEvidenceFromMarkdown`. */
export interface BuildEvidenceOptions {
    /** Token budget shared by all returned excerpts; when omitted, excerpts are not truncated. */
    maxTokensOut?: number;
    /** Maximum number of highlights turned into evidence items; the implementation defaults this to 1. */
    maxItems?: number;
}
/**
 * Builds evidence items from a single page's markdown.
 *
 * Resolves to an empty array when `markdown` is empty or when highlight
 * extraction throws (the failure is logged at debug level, not rethrown).
 */
export declare function buildEvidenceFromMarkdown(query: string, title: string, url: string, markdown: string, opts?: BuildEvidenceOptions): Promise<EvidenceItem[]>;
/**
 * Walks `items` in order and trims each non-empty body (read via `getBody`,
 * written back via `setBody`) against one shared token budget. Bodies reached
 * after the budget is spent are set to an empty string. Mutates through
 * `setBody`; returns nothing.
 */
export declare function applyAggregateMarkdownBudget<T>(items: T[], getBody: (item: T) => string, setBody: (item: T, body: string) => void, opts: {
    maxTokensOut?: number;
    maxChars?: number;
}): void;
/**
 * Returns copies of the leading `items` whose excerpts fit into
 * `maxTokensOut` tokens in total; the input items are not modified.
 * Returns an empty array when `maxTokensOut` is zero or negative.
 */
export declare function applyTokenBudget(items: EvidenceItem[], maxTokensOut: number): EvidenceItem[];
/** Returns the first 12 hex characters of the SHA-1 digest of `${url}#${start}`. */
export declare function stableCitationId(url: string, start: number): string;
/**
 * Assembles an evidence item from camelCase inputs, deriving its
 * `citation_id` from `url` and `sourceSpan.start`.
 */
export declare function buildEvidenceItem(input: {
    title: string;
    url: string;
    sectionHeading: string | null;
    excerpt: string;
    score: number;
    sourceSpan: SourceSpan;
}): EvidenceItem;
/**
 * Attaches evidence and citations to `output` for the given `results`.
 *
 * Mutates both arguments: `output` may gain `evidence`, `citations`,
 * `citations_xml` and `warning`; `results` have `markdown_content` cleared
 * unless `input.include_full_markdown` is set. Does nothing for empty `results`.
 */
export declare function applyEvidenceDefault(input: SearchInput, output: SearchOutput, results: SearchResultItem[], query: string): Promise<void>;
/**
 * Produces one citation per result, in result order. A base citation with the
 * same URL is copied when available; `citation_id` is set from the first
 * evidence item for that URL and removed when there is none.
 */
export declare function buildCitationsFromEvidence(results: SearchResultItem[], evidence: EvidenceItem[], baseCitations: Citation[]): Citation[];
/** Renders each citation as a `<source id="…">` element, joined with newlines. */
export declare function renderCitationsXml(citations: Citation[]): string;
/** Replaces `&`, `<`, `>`, `"` and `'` with their predefined XML entities. */
export declare function escapeXml(s: string): string;
25
+ //# sourceMappingURL=evidence.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"evidence.d.ts","sourceRoot":"","sources":["../../src/search/evidence.ts"],"names":[],"mappings":"AACA,OAAO,KAAK,EACV,QAAQ,EAER,YAAY,EACZ,WAAW,EACX,YAAY,EACZ,gBAAgB,EAChB,UAAU,EACX,MAAM,aAAa,CAAC;AAYrB,MAAM,WAAW,oBAAoB;IACnC,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB,QAAQ,CAAC,EAAE,MAAM,CAAC;CACnB;AAMD,wBAAsB,yBAAyB,CAC7C,KAAK,EAAE,MAAM,EACb,KAAK,EAAE,MAAM,EACb,GAAG,EAAE,MAAM,EACX,QAAQ,EAAE,MAAM,EAChB,IAAI,GAAE,oBAAyB,GAC9B,OAAO,CAAC,YAAY,EAAE,CAAC,CA+CzB;AAMD,wBAAgB,4BAA4B,CAAC,CAAC,EAC5C,KAAK,EAAE,CAAC,EAAE,EACV,OAAO,EAAE,CAAC,IAAI,EAAE,CAAC,KAAK,MAAM,EAC5B,OAAO,EAAE,CAAC,IAAI,EAAE,CAAC,EAAE,IAAI,EAAE,MAAM,KAAK,IAAI,EACxC,IAAI,EAAE;IAAE,YAAY,CAAC,EAAE,MAAM,CAAC;IAAC,QAAQ,CAAC,EAAE,MAAM,CAAA;CAAE,GACjD,IAAI,CAoBN;AAKD,wBAAgB,gBAAgB,CAAC,KAAK,EAAE,YAAY,EAAE,EAAE,YAAY,EAAE,MAAM,GAAG,YAAY,EAAE,CAa5F;AAED,wBAAgB,gBAAgB,CAAC,GAAG,EAAE,MAAM,EAAE,KAAK,EAAE,MAAM,GAAG,MAAM,CAEnE;AAED,wBAAgB,iBAAiB,CAAC,KAAK,EAAE;IACvC,KAAK,EAAE,MAAM,CAAC;IACd,GAAG,EAAE,MAAM,CAAC;IACZ,cAAc,EAAE,MAAM,GAAG,IAAI,CAAC;IAC9B,OAAO,EAAE,MAAM,CAAC;IAChB,KAAK,EAAE,MAAM,CAAC;IACd,UAAU,EAAE,UAAU,CAAC;CACxB,GAAG,YAAY,CAUf;AAED,wBAAsB,oBAAoB,CACxC,KAAK,EAAE,WAAW,EAClB,MAAM,EAAE,YAAY,EACpB,OAAO,EAAE,gBAAgB,EAAE,EAC3B,KAAK,EAAE,MAAM,GACZ,OAAO,CAAC,IAAI,CAAC,CAsFf;AAED,wBAAgB,0BAA0B,CACxC,OAAO,EAAE,gBAAgB,EAAE,EAC3B,QAAQ,EAAE,YAAY,EAAE,EACxB,aAAa,EAAE,QAAQ,EAAE,GACxB,QAAQ,EAAE,CAkCZ;AAED,wBAAgB,kBAAkB,CAAC,SAAS,EAAE,QAAQ,EAAE,GAAG,MAAM,CAQhE;AAED,wBAAgB,SAAS,CAAC,CAAC,EAAE,MAAM,GAAG,MAAM,CAO3C"}
@@ -0,0 +1,220 @@
1
+ import { createHash } from "node:crypto";
2
+ import { extractHighlights } from "./highlights.js";
3
+ import { countTokens, truncateByTokens } from "./tokens.js";
4
+ import { applyOutputBudget } from "./truncate.js";
5
+ import { createLogger } from "../logger.js";
6
// Module-scoped logger, created under the "search" name.
const log = createLogger("search");
// Fallback token budget used by applyEvidenceDefault when input.max_tokens_out is not set.
const DEFAULT_MAX_TOKENS_OUT = 4e3;
// Number of passages applyEvidenceDefault requests from extractHighlights.
const MAX_EVIDENCE_PASSAGES = 20;
// buildEvidenceFromMarkdown stops when a truncated excerpt, once trimmed, equals this text.
// NOTE(review): presumably this is the marker truncateByTokens appends when it cuts content — confirm against tokens.js.
const TRUNCATION_MARKER = "[... content truncated]";
10
/**
 * Build evidence items from a single page's markdown.
 *
 * The page is wrapped in a one-element synthetic result list and handed to
 * `extractHighlights`; the returned highlights are ordered by descending
 * `relevance_score`, capped at `opts.maxItems` (default 1) and, when
 * `opts.maxTokensOut` is given, truncated against that shared token budget.
 *
 * @param query    Query the highlights are extracted for.
 * @param title    Fallback title when a highlight carries no `source_title`.
 * @param url      Fallback URL when a highlight carries no `source_url`.
 * @param markdown Page body; an empty value yields `[]`.
 * @param opts     Optional `maxItems` / `maxTokensOut` limits.
 * @returns Evidence items; `[]` when there is nothing to extract, when the
 *          item cap is not positive, or when highlight extraction throws.
 */
async function buildEvidenceFromMarkdown(query, title, url, markdown, opts = {}) {
  if (!markdown) return [];
  const maxItems = opts.maxItems ?? 1;
  // A zero, negative or NaN cap can never produce items. Bail out before the
  // (potentially expensive) extraction rather than relying on
  // slice(0, maxItems), where a negative end index drops items from the tail
  // instead of returning nothing.
  if (!(maxItems > 0)) return [];
  const synthetic = [{
    title,
    url,
    snippet: "",
    markdown_content: markdown,
    relevance_score: 1
  }];
  let result;
  try {
    result = await extractHighlights(query, synthetic, Math.max(maxItems, 1));
  } catch (err) {
    // Best effort: a failed extraction degrades to "no evidence".
    log.debug("buildEvidenceFromMarkdown: extractHighlights failed", { error: String(err) });
    return [];
  }
  // Copy before sorting so the extractor's own array is left untouched.
  const ranked = result.highlights
    .slice()
    .sort((a, b) => b.relevance_score - a.relevance_score)
    .slice(0, maxItems);
  const out = [];
  let used = 0;
  const budget = opts.maxTokensOut;
  for (const h of ranked) {
    let excerpt = h.text;
    if (budget !== void 0) {
      const remaining = budget - used;
      if (remaining <= 0) break;
      excerpt = truncateByTokens(h.text, remaining);
      // Stop once truncation leaves nothing but the marker (or nothing at all).
      if (!excerpt || excerpt.trim() === TRUNCATION_MARKER) break;
    }
    // Highlights without a span fall back to one covering the excerpt itself.
    const span = h.source_span ?? { start: 0, end: excerpt.length };
    out.push(buildEvidenceItem({
      title: h.source_title || title,
      url: h.source_url || url,
      sectionHeading: h.section_heading ?? null,
      excerpt,
      score: h.relevance_score,
      sourceSpan: span
    }));
    if (budget !== void 0) used += countTokens(excerpt);
  }
  return out;
}
52
/**
 * Cap the body text of each item against one shared token budget.
 *
 * Items are visited in order. Empty bodies are skipped. Without a token
 * budget every body is only passed through `applyOutputBudget` with the
 * character cap; with one, each body is trimmed to the tokens still
 * available and bodies reached after the budget is spent are cleared to "".
 *
 * @param items   Items whose bodies should be trimmed.
 * @param getBody Reads the body text of an item.
 * @param setBody Writes the trimmed body back to an item.
 * @param opts    `maxTokensOut` (shared budget) and `maxChars` (per-body cap), both optional.
 */
function applyAggregateMarkdownBudget(items, getBody, setBody, opts) {
  const tokenBudget = opts.maxTokensOut;
  const unlimitedTokens = tokenBudget === void 0;
  let spent = 0;
  for (const entry of items) {
    const text = getBody(entry);
    if (!text) continue;

    if (unlimitedTokens) {
      setBody(entry, applyOutputBudget(text, { maxChars: opts.maxChars }));
      continue;
    }

    const left = tokenBudget - spent;
    if (left <= 0) {
      // Budget already consumed by earlier items.
      setBody(entry, "");
      continue;
    }

    const clipped = applyOutputBudget(text, { maxTokensOut: left, maxChars: opts.maxChars });
    setBody(entry, clipped);
    spent += countTokens(clipped);
  }
}
73
/**
 * Keep as many leading evidence items as fit into `maxTokensOut` tokens.
 *
 * Each kept item is a shallow copy whose `excerpt` has been truncated to the
 * tokens still available; the input items are not modified.
 *
 * @param items        Evidence items, in priority order.
 * @param maxTokensOut Total token budget for all excerpts.
 * @returns The items that fit; `[]` when the budget is not a positive number.
 */
function applyTokenBudget(items, maxTokensOut) {
  // Also rejects NaN, which would otherwise slip past a `<= 0` comparison.
  if (!(maxTokensOut > 0)) return [];
  const out = [];
  let used = 0;
  for (const item of items) {
    const remaining = maxTokensOut - used;
    if (remaining <= 0) break;
    const excerpt = truncateByTokens(item.excerpt, remaining);
    // Same stop condition as buildEvidenceFromMarkdown: an excerpt that is
    // empty or only the truncation marker carries no evidence.
    if (!excerpt || excerpt.trim() === TRUNCATION_MARKER) break;
    out.push({ ...item, excerpt });
    used += countTokens(excerpt);
  }
  return out;
}
87
/**
 * Derive a deterministic citation id from a URL and a span start offset.
 *
 * @param url   Source URL.
 * @param start Start offset of the cited span.
 * @returns The first 12 hex characters of the SHA-1 digest of `${url}#${start}`.
 */
function stableCitationId(url, start) {
  const hasher = createHash("sha1");
  hasher.update(`${url}#${start}`);
  const hexDigest = hasher.digest("hex");
  return hexDigest.slice(0, 12);
}
90
/**
 * Assemble an evidence item (snake_case output) from camelCase inputs.
 *
 * @param input `title`, `url`, `sectionHeading`, `excerpt`, `score` and `sourceSpan`.
 * @returns The evidence item; its `citation_id` is derived from `url` and
 *          `sourceSpan.start` via `stableCitationId`.
 */
function buildEvidenceItem(input) {
  const { title, url, sectionHeading, excerpt, score, sourceSpan } = input;
  const citationId = stableCitationId(url, sourceSpan.start);
  return {
    title,
    url,
    section_heading: sectionHeading,
    excerpt,
    score,
    citation_id: citationId,
    source_span: sourceSpan
  };
}
101
/**
 * Attach evidence excerpts and citations to a search output.
 *
 * Mutates its arguments:
 * - `output.evidence` is set when at least one excerpt fits the budget;
 * - `output.citations` (and `output.citations_xml` for the
 *   "anthropic_tags" format) are set from the results and evidence;
 * - `output.warning` is extended when highlight extraction fails;
 * - each result's `markdown_content` is cleared unless
 *   `input.include_full_markdown` is set, in which case it is trimmed
 *   against `input.max_tokens_out` when that is provided.
 *
 * @param input   Search input; reads `include_full_markdown`, `citation_format`, `max_tokens_out`.
 * @param output  Search output to decorate in place.
 * @param results Result items; nothing happens when the list is empty.
 * @param query   Query the highlights are extracted for.
 */
async function applyEvidenceDefault(input, output, results, query) {
  if (results.length === 0) return;
  const includeFullMarkdown = input.include_full_markdown ?? false;
  const citationFormat = input.citation_format ?? "numbered";
  const maxTokensOut = input.max_tokens_out ?? DEFAULT_MAX_TOKENS_OUT;
  let highlightsResult;
  try {
    highlightsResult = await extractHighlights(query, results, MAX_EVIDENCE_PASSAGES);
  } catch (err) {
    // Best effort: surface a warning and continue without highlights.
    log.debug("evidence extraction failed", { error: String(err) });
    const msg = "evidence extraction failed; results returned without highlights";
    output.warning = output.warning ? `${output.warning}; ${msg}` : msg;
    highlightsResult = { highlights: [], citations: [], reranker_used: false };
  }
  const ranked = highlightsResult.highlights.slice().sort((a, b) => b.relevance_score - a.relevance_score);
  let evidenceBudget = maxTokensOut;
  if (input.max_tokens_out !== void 0) {
    // With an explicit budget, evidence only gets what is left after the rest
    // of the response. Measure the response as it will be emitted: when full
    // markdown is not requested, markdown_content is cleared from every result
    // further down, so counting it here would starve the evidence budget for
    // text that is never returned.
    const strippedLater = includeFullMarkdown ? null : new Set(results);
    // JSON.stringify calls the replacer with `this` bound to the object that
    // holds `key`, which lets us drop the field on result items only.
    const replacer = function (key, value) {
      if (strippedLater !== null && key === "markdown_content" && strippedLater.has(this)) return void 0;
      return value;
    };
    const skeleton = { ...output, citations: void 0, evidence: void 0, citations_xml: void 0 };
    const skeletonTokens = countTokens(JSON.stringify(skeleton, replacer));
    const resultsTokens = countTokens(JSON.stringify(results, replacer));
    const overhead = skeletonTokens + resultsTokens;
    evidenceBudget = Math.max(0, maxTokensOut - overhead);
  }
  const evidence = [];
  let usedTokens = 0;
  for (const h of ranked) {
    if (usedTokens >= evidenceBudget) break;
    const remaining = evidenceBudget - usedTokens;
    const excerpt = truncateByTokens(h.text, remaining);
    // Skip excerpts that are empty or consist solely of the truncation
    // marker (the same check buildEvidenceFromMarkdown applies).
    if (!excerpt || excerpt.trim() === TRUNCATION_MARKER) continue;
    // Highlights without a span fall back to one covering the excerpt itself.
    const span = h.source_span ?? { start: 0, end: excerpt.length };
    const item = buildEvidenceItem({
      title: h.source_title,
      url: h.source_url,
      sectionHeading: h.section_heading ?? null,
      excerpt,
      score: h.relevance_score,
      sourceSpan: span
    });
    evidence.push(item);
    usedTokens += countTokens(excerpt);
  }
  if (evidence.length > 0) {
    output.evidence = evidence;
  }
  const citations = buildCitationsFromEvidence(results, evidence, highlightsResult.citations);
  if (citationFormat === "numbered" || citationFormat === "json") {
    if (citations.length > 0) output.citations = citations;
  } else if (citationFormat === "anthropic_tags") {
    if (citations.length > 0) {
      output.citations = citations;
      output.citations_xml = renderCitationsXml(citations);
    }
  }
  if (!includeFullMarkdown) {
    for (const r of results) {
      if (r.markdown_content !== void 0) r.markdown_content = void 0;
    }
  } else if (input.max_tokens_out !== void 0) {
    applyAggregateMarkdownBudget(
      results,
      (r) => typeof r.markdown_content === "string" ? r.markdown_content : "",
      (r, body) => {
        r.markdown_content = body;
      },
      { maxTokensOut: input.max_tokens_out }
    );
  }
}
170
/**
 * Produce one citation per result, in result order.
 *
 * A base citation with the same URL is shallow-copied when available (the
 * last one wins if several share a URL); otherwise a citation is synthesized
 * from the result with a 1-based `index`. `citation_id` is taken from the
 * first evidence item for that URL and removed when there is none.
 *
 * @param results       Result items to cite.
 * @param evidence      Evidence items supplying `citation_id`s per URL.
 * @param baseCitations Existing citations to reuse by URL.
 * @returns A new array of citations; the inputs are not modified.
 */
function buildCitationsFromEvidence(results, evidence, baseCitations) {
  // First evidence item per URL decides the citation id.
  const firstEvidenceId = new Map();
  for (const item of evidence) {
    if (firstEvidenceId.has(item.url)) continue;
    firstEvidenceId.set(item.url, item.citation_id);
  }

  const existingByUrl = new Map();
  for (const known of baseCitations) {
    existingByUrl.set(known.url, known);
  }

  const citations = [];
  for (const [position, result] of results.entries()) {
    const known = existingByUrl.get(result.url);
    const entry = known
      ? { ...known }
      : {
          index: position + 1,
          url: result.url,
          title: result.title,
          snippet: result.snippet ?? ""
        };

    const evidenceId = firstEvidenceId.get(result.url);
    if (evidenceId === void 0) {
      // No evidence for this URL: drop any id inherited from the base citation.
      delete entry.citation_id;
    } else {
      entry.citation_id = evidenceId;
    }
    citations.push(entry);
  }
  return citations;
}
197
/**
 * Render citations as `<source id="…">…</source>` elements, one per line.
 *
 * The element body is the citation's title, URL and snippet on separate
 * lines, XML-escaped. The id is the citation's `citation_id`, falling back
 * to `stableCitationId(url, 0)`.
 *
 * @param citations Citations to render.
 * @returns The elements joined with "\n"; an empty string for an empty list.
 */
function renderCitationsXml(citations) {
  return citations.map((c) => {
    const id = c.citation_id ?? stableCitationId(c.url, 0);
    // Missing fields render as empty lines rather than the literal text
    // "undefined"/"null" that template interpolation would produce.
    const inner = escapeXml([c.title ?? "", c.url ?? "", c.snippet ?? ""].join("\n"));
    // The id sits inside a double-quoted attribute, so it must be escaped as
    // well; ids made of hex characters are unaffected.
    return `<source id="${escapeXml(String(id))}">${inner}</source>`;
  }).join("\n");
}
206
/**
 * Escape the five characters with predefined XML entities.
 *
 * @param s Text to escape.
 * @returns `s` with `&`, `<`, `>`, `"` and `'` replaced by
 *          `&amp;`, `&lt;`, `&gt;`, `&quot;` and `&apos;`.
 */
function escapeXml(s) {
  // Single pass: each special character is mapped exactly once, so the
  // ampersands introduced by the entities themselves are never re-escaped.
  return s.replace(/[&<>"']/g, (ch) => {
    switch (ch) {
      case "&":
        return "&amp;";
      case "<":
        return "&lt;";
      case ">":
        return "&gt;";
      case '"':
        return "&quot;";
      default:
        return "&apos;";
    }
  });
}
209
+ export {
210
+ applyAggregateMarkdownBudget,
211
+ applyEvidenceDefault,
212
+ applyTokenBudget,
213
+ buildCitationsFromEvidence,
214
+ buildEvidenceFromMarkdown,
215
+ buildEvidenceItem,
216
+ escapeXml,
217
+ renderCitationsXml,
218
+ stableCitationId
219
+ };
220
+ //# sourceMappingURL=evidence.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"sources":["../../src/search/evidence.ts"],"sourcesContent":["import { createHash } from 'node:crypto';\nimport type {\n Citation,\n CitationFormat,\n EvidenceItem,\n SearchInput,\n SearchOutput,\n SearchResultItem,\n SourceSpan,\n} from '../types.js';\nimport { extractHighlights } from './highlights.js';\nimport { countTokens, truncateByTokens } from './tokens.js';\nimport { applyOutputBudget } from './truncate.js';\nimport { createLogger } from '../logger.js';\n\nconst log = createLogger('search');\n\nconst DEFAULT_MAX_TOKENS_OUT = 4000;\nconst MAX_EVIDENCE_PASSAGES = 20;\nconst TRUNCATION_MARKER = '[... content truncated]';\n\nexport interface BuildEvidenceOptions {\n maxTokensOut?: number;\n maxItems?: number;\n}\n\n// Build evidence items from a single page's markdown. Used by per-page tools\n// (fetch, crawl pages, find_similar results, agent/research sources). The\n// returned list is already truncated to fit `maxTokensOut` if provided; pass\n// `maxItems` to cap how many highlights are projected.\nexport async function buildEvidenceFromMarkdown(\n query: string,\n title: string,\n url: string,\n markdown: string,\n opts: BuildEvidenceOptions = {},\n): Promise<EvidenceItem[]> {\n if (!markdown) return [];\n const maxItems = opts.maxItems ?? 
1;\n const synthetic: SearchResultItem[] = [{\n title,\n url,\n snippet: '',\n markdown_content: markdown,\n relevance_score: 1,\n }];\n\n let result;\n try {\n result = await extractHighlights(query, synthetic, Math.max(maxItems, 1));\n } catch (err) {\n log.debug('buildEvidenceFromMarkdown: extractHighlights failed', { error: String(err) });\n return [];\n }\n\n const ranked = result.highlights\n .slice()\n .sort((a, b) => b.relevance_score - a.relevance_score)\n .slice(0, maxItems);\n\n const out: EvidenceItem[] = [];\n let used = 0;\n const budget = opts.maxTokensOut;\n for (const h of ranked) {\n let excerpt = h.text;\n if (budget !== undefined) {\n const remaining = budget - used;\n if (remaining <= 0) break;\n excerpt = truncateByTokens(h.text, remaining);\n if (!excerpt || excerpt.trim() === TRUNCATION_MARKER) break;\n }\n const span = h.source_span ?? { start: 0, end: excerpt.length };\n out.push(buildEvidenceItem({\n title: h.source_title || title,\n url: h.source_url || url,\n sectionHeading: h.section_heading ?? null,\n excerpt,\n score: h.relevance_score,\n sourceSpan: span,\n }));\n if (budget !== undefined) used += countTokens(excerpt);\n }\n return out;\n}\n\n// Walk items in order, capping each item's body text against a shared token\n// budget. Bodies past the budget are cleared (set to ''). 
Used by all\n// multi-item tools (search markdown_content, find_similar, crawl, research,\n// agent) so per-tool max_tokens_out is an aggregate cap, not per-item.\nexport function applyAggregateMarkdownBudget<T>(\n items: T[],\n getBody: (item: T) => string,\n setBody: (item: T, body: string) => void,\n opts: { maxTokensOut?: number; maxChars?: number },\n): void {\n const budget = opts.maxTokensOut;\n let used = 0;\n for (const item of items) {\n const body = getBody(item);\n if (!body) continue;\n if (budget !== undefined) {\n const remaining = budget - used;\n if (remaining <= 0) {\n setBody(item, '');\n continue;\n }\n const trimmed = applyOutputBudget(body, { maxTokensOut: remaining, maxChars: opts.maxChars });\n setBody(item, trimmed);\n used += countTokens(trimmed);\n } else {\n const trimmed = applyOutputBudget(body, { maxChars: opts.maxChars });\n setBody(item, trimmed);\n }\n }\n}\n\n// Apply an aggregate token budget across an already-built list of evidence\n// items, truncating excerpts in order until the budget is exhausted. 
Items\n// past the budget are dropped.\nexport function applyTokenBudget(items: EvidenceItem[], maxTokensOut: number): EvidenceItem[] {\n if (maxTokensOut <= 0) return [];\n const out: EvidenceItem[] = [];\n let used = 0;\n for (const item of items) {\n const remaining = maxTokensOut - used;\n if (remaining <= 0) break;\n const excerpt = truncateByTokens(item.excerpt, remaining);\n if (!excerpt) break;\n out.push({ ...item, excerpt });\n used += countTokens(excerpt);\n }\n return out;\n}\n\nexport function stableCitationId(url: string, start: number): string {\n return createHash('sha1').update(`${url}#${start}`).digest('hex').slice(0, 12);\n}\n\nexport function buildEvidenceItem(input: {\n title: string;\n url: string;\n sectionHeading: string | null;\n excerpt: string;\n score: number;\n sourceSpan: SourceSpan;\n}): EvidenceItem {\n return {\n title: input.title,\n url: input.url,\n section_heading: input.sectionHeading,\n excerpt: input.excerpt,\n score: input.score,\n citation_id: stableCitationId(input.url, input.sourceSpan.start),\n source_span: input.sourceSpan,\n };\n}\n\nexport async function applyEvidenceDefault(\n input: SearchInput,\n output: SearchOutput,\n results: SearchResultItem[],\n query: string,\n): Promise<void> {\n if (results.length === 0) return;\n\n const includeFullMarkdown = input.include_full_markdown ?? false;\n const citationFormat: CitationFormat = input.citation_format ?? 'numbered';\n const maxTokensOut = input.max_tokens_out ?? DEFAULT_MAX_TOKENS_OUT;\n\n let highlightsResult;\n try {\n highlightsResult = await extractHighlights(query, results, MAX_EVIDENCE_PASSAGES);\n } catch (err) {\n log.debug('evidence extraction failed', { error: String(err) });\n const msg = 'evidence extraction failed; results returned without highlights';\n output.warning = output.warning ? 
`${output.warning}; ${msg}` : msg;\n highlightsResult = { highlights: [], citations: [], reranker_used: false };\n }\n\n const ranked = highlightsResult.highlights\n .slice()\n .sort((a, b) => b.relevance_score - a.relevance_score);\n\n // When the caller sets max_tokens_out explicitly, evidence shares the budget\n // with citations/results metadata. Reserve room for the structural overhead\n // so the total stringified output stays under the cap.\n // NOTE: this relies on JSON.stringify dropping `undefined` keys, and on\n // applyEvidenceDefault running before any post-evidence mutation that grows\n // the skeleton (e.g. output.warning); reserve overhead first, mutate later.\n let evidenceBudget = maxTokensOut;\n if (input.max_tokens_out !== undefined) {\n const skeleton: SearchOutput = { ...output, citations: undefined, evidence: undefined, citations_xml: undefined };\n const skeletonTokens = countTokens(JSON.stringify(skeleton));\n const resultsTokens = countTokens(JSON.stringify(results));\n const overhead = skeletonTokens + resultsTokens;\n evidenceBudget = Math.max(0, maxTokensOut - overhead);\n }\n\n const evidence: EvidenceItem[] = [];\n let usedTokens = 0;\n for (const h of ranked) {\n if (usedTokens >= evidenceBudget) break;\n const remaining = evidenceBudget - usedTokens;\n const excerpt = truncateByTokens(h.text, remaining);\n if (!excerpt) continue;\n const span = h.source_span ?? { start: 0, end: excerpt.length };\n const item = buildEvidenceItem({\n title: h.source_title,\n url: h.source_url,\n sectionHeading: h.section_heading ?? 
null,\n excerpt,\n score: h.relevance_score,\n sourceSpan: span,\n });\n evidence.push(item);\n usedTokens += countTokens(excerpt);\n }\n\n if (evidence.length > 0) {\n output.evidence = evidence;\n }\n\n const citations = buildCitationsFromEvidence(results, evidence, highlightsResult.citations);\n\n if (citationFormat === 'numbered' || citationFormat === 'json') {\n if (citations.length > 0) output.citations = citations;\n } else if (citationFormat === 'anthropic_tags') {\n if (citations.length > 0) {\n output.citations = citations;\n output.citations_xml = renderCitationsXml(citations);\n }\n }\n\n // Terminal mutation: applyEvidenceDefault is the last step before return.\n if (!includeFullMarkdown) {\n for (const r of results) {\n if (r.markdown_content !== undefined) r.markdown_content = undefined;\n }\n } else if (input.max_tokens_out !== undefined) {\n // Aggregate cap across all results in score order — sum of markdown_content\n // tokens stays under max_tokens_out; bodies past the budget are dropped.\n applyAggregateMarkdownBudget(\n results,\n (r) => (typeof r.markdown_content === 'string' ? r.markdown_content : ''),\n (r, body) => { r.markdown_content = body; },\n { maxTokensOut: input.max_tokens_out },\n );\n }\n}\n\nexport function buildCitationsFromEvidence(\n results: SearchResultItem[],\n evidence: EvidenceItem[],\n baseCitations: Citation[],\n): Citation[] {\n // Pick the primary citation_id per source: the first evidence item for that URL\n // (highest score after sort). 
Sources whose evidence was budget-cut have no\n // citation_id — consumers can interpret missing id as \"source-level citation,\n // no specific passage.\"\n const primaryByUrl = new Map<string, string>();\n for (const ev of evidence) {\n if (!primaryByUrl.has(ev.url)) primaryByUrl.set(ev.url, ev.citation_id);\n }\n const baseByUrl = new Map<string, Citation>();\n for (const c of baseCitations) baseByUrl.set(c.url, c);\n\n const out: Citation[] = [];\n for (let i = 0; i < results.length; i++) {\n const r = results[i];\n const base = baseByUrl.get(r.url);\n const citation: Citation = base\n ? { ...base }\n : {\n index: i + 1,\n url: r.url,\n title: r.title,\n snippet: r.snippet ?? '',\n };\n const primary = primaryByUrl.get(r.url);\n if (primary !== undefined) {\n citation.citation_id = primary;\n } else {\n // No surviving evidence passage for this source — leave citation_id absent.\n delete citation.citation_id;\n }\n out.push(citation);\n }\n return out;\n}\n\nexport function renderCitationsXml(citations: Citation[]): string {\n return citations\n .map((c) => {\n const id = c.citation_id ?? 
stableCitationId(c.url, 0);\n const inner = escapeXml(`${c.title}\\n${c.url}\\n${c.snippet}`);\n return `<source id=\"${id}\">${inner}</source>`;\n })\n .join('\\n');\n}\n\nexport function escapeXml(s: string): string {\n return s\n .replace(/&/g, '&amp;')\n .replace(/</g, '&lt;')\n .replace(/>/g, '&gt;')\n .replace(/\"/g, '&quot;')\n .replace(/'/g, '&apos;');\n}\n"],"mappings":"AAAA,SAAS,kBAAkB;AAU3B,SAAS,yBAAyB;AAClC,SAAS,aAAa,wBAAwB;AAC9C,SAAS,yBAAyB;AAClC,SAAS,oBAAoB;AAE7B,MAAM,MAAM,aAAa,QAAQ;AAEjC,MAAM,yBAAyB;AAC/B,MAAM,wBAAwB;AAC9B,MAAM,oBAAoB;AAW1B,eAAsB,0BACpB,OACA,OACA,KACA,UACA,OAA6B,CAAC,GACL;AACzB,MAAI,CAAC,SAAU,QAAO,CAAC;AACvB,QAAM,WAAW,KAAK,YAAY;AAClC,QAAM,YAAgC,CAAC;AAAA,IACrC;AAAA,IACA;AAAA,IACA,SAAS;AAAA,IACT,kBAAkB;AAAA,IAClB,iBAAiB;AAAA,EACnB,CAAC;AAED,MAAI;AACJ,MAAI;AACF,aAAS,MAAM,kBAAkB,OAAO,WAAW,KAAK,IAAI,UAAU,CAAC,CAAC;AAAA,EAC1E,SAAS,KAAK;AACZ,QAAI,MAAM,uDAAuD,EAAE,OAAO,OAAO,GAAG,EAAE,CAAC;AACvF,WAAO,CAAC;AAAA,EACV;AAEA,QAAM,SAAS,OAAO,WACnB,MAAM,EACN,KAAK,CAAC,GAAG,MAAM,EAAE,kBAAkB,EAAE,eAAe,EACpD,MAAM,GAAG,QAAQ;AAEpB,QAAM,MAAsB,CAAC;AAC7B,MAAI,OAAO;AACX,QAAM,SAAS,KAAK;AACpB,aAAW,KAAK,QAAQ;AACtB,QAAI,UAAU,EAAE;AAChB,QAAI,WAAW,QAAW;AACxB,YAAM,YAAY,SAAS;AAC3B,UAAI,aAAa,EAAG;AACpB,gBAAU,iBAAiB,EAAE,MAAM,SAAS;AAC5C,UAAI,CAAC,WAAW,QAAQ,KAAK,MAAM,kBAAmB;AAAA,IACxD;AACA,UAAM,OAAO,EAAE,eAAe,EAAE,OAAO,GAAG,KAAK,QAAQ,OAAO;AAC9D,QAAI,KAAK,kBAAkB;AAAA,MACzB,OAAO,EAAE,gBAAgB;AAAA,MACzB,KAAK,EAAE,cAAc;AAAA,MACrB,gBAAgB,EAAE,mBAAmB;AAAA,MACrC;AAAA,MACA,OAAO,EAAE;AAAA,MACT,YAAY;AAAA,IACd,CAAC,CAAC;AACF,QAAI,WAAW,OAAW,SAAQ,YAAY,OAAO;AAAA,EACvD;AACA,SAAO;AACT;AAMO,SAAS,6BACd,OACA,SACA,SACA,MACM;AACN,QAAM,SAAS,KAAK;AACpB,MAAI,OAAO;AACX,aAAW,QAAQ,OAAO;AACxB,UAAM,OAAO,QAAQ,IAAI;AACzB,QAAI,CAAC,KAAM;AACX,QAAI,WAAW,QAAW;AACxB,YAAM,YAAY,SAAS;AAC3B,UAAI,aAAa,GAAG;AAClB,gBAAQ,MAAM,EAAE;AAChB;AAAA,MACF;AACA,YAAM,UAAU,kBAAkB,MAAM,EAAE,cAAc,WAAW,UAAU,KAAK,SAAS,CAAC;AAC5F,cAAQ,MAAM,OAAO;AACrB,cAAQ,YAAY,OAAO;AAAA,IAC7B,OAAO;AACL,YAAM,UAAU,kBAAkB,MAAM,EAAE,UAAU,KAAK,SAAS,CA
AC;AACnE,cAAQ,MAAM,OAAO;AAAA,IACvB;AAAA,EACF;AACF;AAKO,SAAS,iBAAiB,OAAuB,cAAsC;AAC5F,MAAI,gBAAgB,EAAG,QAAO,CAAC;AAC/B,QAAM,MAAsB,CAAC;AAC7B,MAAI,OAAO;AACX,aAAW,QAAQ,OAAO;AACxB,UAAM,YAAY,eAAe;AACjC,QAAI,aAAa,EAAG;AACpB,UAAM,UAAU,iBAAiB,KAAK,SAAS,SAAS;AACxD,QAAI,CAAC,QAAS;AACd,QAAI,KAAK,EAAE,GAAG,MAAM,QAAQ,CAAC;AAC7B,YAAQ,YAAY,OAAO;AAAA,EAC7B;AACA,SAAO;AACT;AAEO,SAAS,iBAAiB,KAAa,OAAuB;AACnE,SAAO,WAAW,MAAM,EAAE,OAAO,GAAG,GAAG,IAAI,KAAK,EAAE,EAAE,OAAO,KAAK,EAAE,MAAM,GAAG,EAAE;AAC/E;AAEO,SAAS,kBAAkB,OAOjB;AACf,SAAO;AAAA,IACL,OAAO,MAAM;AAAA,IACb,KAAK,MAAM;AAAA,IACX,iBAAiB,MAAM;AAAA,IACvB,SAAS,MAAM;AAAA,IACf,OAAO,MAAM;AAAA,IACb,aAAa,iBAAiB,MAAM,KAAK,MAAM,WAAW,KAAK;AAAA,IAC/D,aAAa,MAAM;AAAA,EACrB;AACF;AAEA,eAAsB,qBACpB,OACA,QACA,SACA,OACe;AACf,MAAI,QAAQ,WAAW,EAAG;AAE1B,QAAM,sBAAsB,MAAM,yBAAyB;AAC3D,QAAM,iBAAiC,MAAM,mBAAmB;AAChE,QAAM,eAAe,MAAM,kBAAkB;AAE7C,MAAI;AACJ,MAAI;AACF,uBAAmB,MAAM,kBAAkB,OAAO,SAAS,qBAAqB;AAAA,EAClF,SAAS,KAAK;AACZ,QAAI,MAAM,8BAA8B,EAAE,OAAO,OAAO,GAAG,EAAE,CAAC;AAC9D,UAAM,MAAM;AACZ,WAAO,UAAU,OAAO,UAAU,GAAG,OAAO,OAAO,KAAK,GAAG,KAAK;AAChE,uBAAmB,EAAE,YAAY,CAAC,GAAG,WAAW,CAAC,GAAG,eAAe,MAAM;AAAA,EAC3E;AAEA,QAAM,SAAS,iBAAiB,WAC7B,MAAM,EACN,KAAK,CAAC,GAAG,MAAM,EAAE,kBAAkB,EAAE,eAAe;AAQvD,MAAI,iBAAiB;AACrB,MAAI,MAAM,mBAAmB,QAAW;AACtC,UAAM,WAAyB,EAAE,GAAG,QAAQ,WAAW,QAAW,UAAU,QAAW,eAAe,OAAU;AAChH,UAAM,iBAAiB,YAAY,KAAK,UAAU,QAAQ,CAAC;AAC3D,UAAM,gBAAgB,YAAY,KAAK,UAAU,OAAO,CAAC;AACzD,UAAM,WAAW,iBAAiB;AAClC,qBAAiB,KAAK,IAAI,GAAG,eAAe,QAAQ;AAAA,EACtD;AAEA,QAAM,WAA2B,CAAC;AAClC,MAAI,aAAa;AACjB,aAAW,KAAK,QAAQ;AACtB,QAAI,cAAc,eAAgB;AAClC,UAAM,YAAY,iBAAiB;AACnC,UAAM,UAAU,iBAAiB,EAAE,MAAM,SAAS;AAClD,QAAI,CAAC,QAAS;AACd,UAAM,OAAO,EAAE,eAAe,EAAE,OAAO,GAAG,KAAK,QAAQ,OAAO;AAC9D,UAAM,OAAO,kBAAkB;AAAA,MAC7B,OAAO,EAAE;AAAA,MACT,KAAK,EAAE;AAAA,MACP,gBAAgB,EAAE,mBAAmB;AAAA,MACrC;AAAA,MACA,OAAO,EAAE;AAAA,MACT,YAAY;AAAA,IACd,CAAC;AACD,aAAS,KAAK,IAAI;AAClB,kBAAc,YAAY,OAAO;AAAA,EACnC;AAEA,MAAI,SAAS,SAAS,GAAG;AACvB,WAAO,WAAW;AAAA,EACpB;AAEA,QAAM,YAAY,2BAA2B,SAAS,UAAU,iBAAiB,SAAS;AAE1F
,MAAI,mBAAmB,cAAc,mBAAmB,QAAQ;AAC9D,QAAI,UAAU,SAAS,EAAG,QAAO,YAAY;AAAA,EAC/C,WAAW,mBAAmB,kBAAkB;AAC9C,QAAI,UAAU,SAAS,GAAG;AACxB,aAAO,YAAY;AACnB,aAAO,gBAAgB,mBAAmB,SAAS;AAAA,IACrD;AAAA,EACF;AAGA,MAAI,CAAC,qBAAqB;AACxB,eAAW,KAAK,SAAS;AACvB,UAAI,EAAE,qBAAqB,OAAW,GAAE,mBAAmB;AAAA,IAC7D;AAAA,EACF,WAAW,MAAM,mBAAmB,QAAW;AAG7C;AAAA,MACE;AAAA,MACA,CAAC,MAAO,OAAO,EAAE,qBAAqB,WAAW,EAAE,mBAAmB;AAAA,MACtE,CAAC,GAAG,SAAS;AAAE,UAAE,mBAAmB;AAAA,MAAM;AAAA,MAC1C,EAAE,cAAc,MAAM,eAAe;AAAA,IACvC;AAAA,EACF;AACF;AAEO,SAAS,2BACd,SACA,UACA,eACY;AAKZ,QAAM,eAAe,oBAAI,IAAoB;AAC7C,aAAW,MAAM,UAAU;AACzB,QAAI,CAAC,aAAa,IAAI,GAAG,GAAG,EAAG,cAAa,IAAI,GAAG,KAAK,GAAG,WAAW;AAAA,EACxE;AACA,QAAM,YAAY,oBAAI,IAAsB;AAC5C,aAAW,KAAK,cAAe,WAAU,IAAI,EAAE,KAAK,CAAC;AAErD,QAAM,MAAkB,CAAC;AACzB,WAAS,IAAI,GAAG,IAAI,QAAQ,QAAQ,KAAK;AACvC,UAAM,IAAI,QAAQ,CAAC;AACnB,UAAM,OAAO,UAAU,IAAI,EAAE,GAAG;AAChC,UAAM,WAAqB,OACvB,EAAE,GAAG,KAAK,IACV;AAAA,MACE,OAAO,IAAI;AAAA,MACX,KAAK,EAAE;AAAA,MACP,OAAO,EAAE;AAAA,MACT,SAAS,EAAE,WAAW;AAAA,IACxB;AACJ,UAAM,UAAU,aAAa,IAAI,EAAE,GAAG;AACtC,QAAI,YAAY,QAAW;AACzB,eAAS,cAAc;AAAA,IACzB,OAAO;AAEL,aAAO,SAAS;AAAA,IAClB;AACA,QAAI,KAAK,QAAQ;AAAA,EACnB;AACA,SAAO;AACT;AAEO,SAAS,mBAAmB,WAA+B;AAChE,SAAO,UACJ,IAAI,CAAC,MAAM;AACV,UAAM,KAAK,EAAE,eAAe,iBAAiB,EAAE,KAAK,CAAC;AACrD,UAAM,QAAQ,UAAU,GAAG,EAAE,KAAK;AAAA,EAAK,EAAE,GAAG;AAAA,EAAK,EAAE,OAAO,EAAE;AAC5D,WAAO,eAAe,EAAE,KAAK,KAAK;AAAA,EACpC,CAAC,EACA,KAAK,IAAI;AACd;AAEO,SAAS,UAAU,GAAmB;AAC3C,SAAO,EACJ,QAAQ,MAAM,OAAO,EACrB,QAAQ,MAAM,MAAM,EACpB,QAAQ,MAAM,MAAM,EACpB,QAAQ,MAAM,QAAQ,EACtB,QAAQ,MAAM,QAAQ;AAC3B;","names":[]}
@@ -1,63 +1,57 @@
1
1
  function getDomain(url) {
2
- try {
3
- return new URL(url).hostname.toLowerCase();
4
- }
5
- catch {
6
- return '';
7
- }
2
+ try {
3
+ return new URL(url).hostname.toLowerCase();
4
+ } catch {
5
+ return "";
6
+ }
8
7
  }
9
8
  function normalizeDomain(domain) {
10
- return domain.replace(/\/+$/, '').toLowerCase();
9
+ return domain.replace(/\/+$/, "").toLowerCase();
11
10
  }
12
11
  function domainMatches(hostname, domain) {
13
- const normalized = normalizeDomain(domain);
14
- return hostname === normalized || hostname.endsWith('.' + normalized);
15
- }
16
- export function filterByDomains(results, includeDomains, excludeDomains) {
17
- if (!includeDomains?.length && !excludeDomains?.length)
18
- return results;
19
- return results.filter((r) => {
20
- const hostname = getDomain(r.url);
21
- if (!hostname) {
22
- return !includeDomains?.length;
23
- }
24
- if (includeDomains?.length) {
25
- if (!includeDomains.some((d) => domainMatches(hostname, d)))
26
- return false;
27
- }
28
- if (excludeDomains?.length) {
29
- if (excludeDomains.some((d) => domainMatches(hostname, d)))
30
- return false;
31
- }
32
- return true;
33
- });
12
+ const normalized = normalizeDomain(domain);
13
+ return hostname === normalized || hostname.endsWith("." + normalized);
14
+ }
15
+ function filterByDomains(results, includeDomains, excludeDomains) {
16
+ if (!includeDomains?.length && !excludeDomains?.length) return results;
17
+ return results.filter((r) => {
18
+ const hostname = getDomain(r.url);
19
+ if (!hostname) {
20
+ return !includeDomains?.length;
21
+ }
22
+ if (includeDomains?.length) {
23
+ if (!includeDomains.some((d) => domainMatches(hostname, d))) return false;
24
+ }
25
+ if (excludeDomains?.length) {
26
+ if (excludeDomains.some((d) => domainMatches(hostname, d))) return false;
27
+ }
28
+ return true;
29
+ });
34
30
  }
35
31
  function isValidIsoDate(dateStr) {
36
- const parsed = new Date(dateStr);
37
- return !isNaN(parsed.getTime()) && /^\d{4}-\d{2}-\d{2}$/.test(dateStr);
38
- }
39
- export function filterByDateRange(results, fromDate, toDate) {
40
- if (!fromDate && !toDate)
41
- return results;
42
- if (fromDate && !isValidIsoDate(fromDate))
43
- return results;
44
- if (toDate && !isValidIsoDate(toDate))
45
- return results;
46
- if (fromDate && toDate && new Date(fromDate) > new Date(toDate))
47
- return results;
48
- // Date filtering is best-effort on direct scraping engines.
49
- // SearXNG handles dates natively via time_range. For fallback engines,
50
- // snippet text doesn't reliably contain dates, so we keep all results.
51
- return results;
52
- }
53
- export function filterByCategory(results, _category) {
54
- // Category filtering is handled by SearXNG natively.
55
- return results;
56
- }
57
- export function applyAllFilters(results, options) {
58
- let filtered = filterByDomains(results, options.includeDomains, options.excludeDomains);
59
- filtered = filterByDateRange(filtered, options.fromDate, options.toDate);
60
- filtered = filterByCategory(filtered, options.category);
61
- return filtered;
62
- }
32
+ const parsed = new Date(dateStr);
33
+ return !isNaN(parsed.getTime()) && /^\d{4}-\d{2}-\d{2}$/.test(dateStr);
34
+ }
35
+ function filterByDateRange(results, fromDate, toDate) {
36
+ if (!fromDate && !toDate) return results;
37
+ if (fromDate && !isValidIsoDate(fromDate)) return results;
38
+ if (toDate && !isValidIsoDate(toDate)) return results;
39
+ if (fromDate && toDate && new Date(fromDate) > new Date(toDate)) return results;
40
+ return results;
41
+ }
42
+ function filterByCategory(results, _category) {
43
+ return results;
44
+ }
45
+ function applyAllFilters(results, options) {
46
+ let filtered = filterByDomains(results, options.includeDomains, options.excludeDomains);
47
+ filtered = filterByDateRange(filtered, options.fromDate, options.toDate);
48
+ filtered = filterByCategory(filtered, options.category);
49
+ return filtered;
50
+ }
51
+ export {
52
+ applyAllFilters,
53
+ filterByCategory,
54
+ filterByDateRange,
55
+ filterByDomains
56
+ };
63
57
  //# sourceMappingURL=filters.js.map
@@ -1 +1 @@
1
- {"version":3,"file":"filters.js","sourceRoot":"","sources":["../../src/search/filters.ts"],"names":[],"mappings":"AAAA,SAAS,SAAS,CAAC,GAAW;IAC5B,IAAI,CAAC;QACH,OAAO,IAAI,GAAG,CAAC,GAAG,CAAC,CAAC,QAAQ,CAAC,WAAW,EAAE,CAAC;IAC7C,CAAC;IAAC,MAAM,CAAC;QACP,OAAO,EAAE,CAAC;IACZ,CAAC;AACH,CAAC;AAED,SAAS,eAAe,CAAC,MAAc;IACrC,OAAO,MAAM,CAAC,OAAO,CAAC,MAAM,EAAE,EAAE,CAAC,CAAC,WAAW,EAAE,CAAC;AAClD,CAAC;AAED,SAAS,aAAa,CAAC,QAAgB,EAAE,MAAc;IACrD,MAAM,UAAU,GAAG,eAAe,CAAC,MAAM,CAAC,CAAC;IAC3C,OAAO,QAAQ,KAAK,UAAU,IAAI,QAAQ,CAAC,QAAQ,CAAC,GAAG,GAAG,UAAU,CAAC,CAAC;AACxE,CAAC;AAED,MAAM,UAAU,eAAe,CAC7B,OAAY,EACZ,cAAyB,EACzB,cAAyB;IAEzB,IAAI,CAAC,cAAc,EAAE,MAAM,IAAI,CAAC,cAAc,EAAE,MAAM;QAAE,OAAO,OAAO,CAAC;IAEvE,OAAO,OAAO,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE;QAC1B,MAAM,QAAQ,GAAG,SAAS,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC;QAClC,IAAI,CAAC,QAAQ,EAAE,CAAC;YACd,OAAO,CAAC,cAAc,EAAE,MAAM,CAAC;QACjC,CAAC;QACD,IAAI,cAAc,EAAE,MAAM,EAAE,CAAC;YAC3B,IAAI,CAAC,cAAc,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,aAAa,CAAC,QAAQ,EAAE,CAAC,CAAC,CAAC;gBAAE,OAAO,KAAK,CAAC;QAC5E,CAAC;QACD,IAAI,cAAc,EAAE,MAAM,EAAE,CAAC;YAC3B,IAAI,cAAc,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,aAAa,CAAC,QAAQ,EAAE,CAAC,CAAC,CAAC;gBAAE,OAAO,KAAK,CAAC;QAC3E,CAAC;QACD,OAAO,IAAI,CAAC;IACd,CAAC,CAAC,CAAC;AACL,CAAC;AAED,SAAS,cAAc,CAAC,OAAe;IACrC,MAAM,MAAM,GAAG,IAAI,IAAI,CAAC,OAAO,CAAC,CAAC;IACjC,OAAO,CAAC,KAAK,CAAC,MAAM,CAAC,OAAO,EAAE,CAAC,IAAI,qBAAqB,CAAC,IAAI,CAAC,OAAO,CAAC,CAAC;AACzE,CAAC;AAED,MAAM,UAAU,iBAAiB,CAC/B,OAAY,EACZ,QAAiB,EACjB,MAAe;IAEf,IAAI,CAAC,QAAQ,IAAI,CAAC,MAAM;QAAE,OAAO,OAAO,CAAC;IAEzC,IAAI,QAAQ,IAAI,CAAC,cAAc,CAAC,QAAQ,CAAC;QAAE,OAAO,OAAO,CAAC;IAC1D,IAAI,MAAM,IAAI,CAAC,cAAc,CAAC,MAAM,CAAC;QAAE,OAAO,OAAO,CAAC;IAEtD,IAAI,QAAQ,IAAI,MAAM,IAAI,IAAI,IAAI,CAAC,QAAQ,CAAC,GAAG,IAAI,IAAI,CAAC,MAAM,CAAC;QAAE,OAAO,OAAO,CAAC;IAEhF,4DAA4D;IAC5D,uEAAuE;IACvE,uEAAuE;IACvE,OAAO,OAAO,CAAC;AACjB,CAAC;AAED,MAAM,UAAU,gBAAgB,CAC9B,OAAY,EACZ,SAAkB;IAElB,qDAAqD;IACrD,OAAO,OAAO,CAAC;AACjB,CAAC;AAUD,MAAM,UAAU,eAAe,CAC7B,OAAY,EACZ,OAAsB;IAEtB,IAAI,QAAQ,GAAG,
eAAe,CAAC,OAAO,EAAE,OAAO,CAAC,cAAc,EAAE,OAAO,CAAC,cAAc,CAAC,CAAC;IACxF,QAAQ,GAAG,iBAAiB,CAAC,QAAQ,EAAE,OAAO,CAAC,QAAQ,EAAE,OAAO,CAAC,MAAM,CAAC,CAAC;IACzE,QAAQ,GAAG,gBAAgB,CAAC,QAAQ,EAAE,OAAO,CAAC,QAAQ,CAAC,CAAC;IACxD,OAAO,QAAQ,CAAC;AAClB,CAAC"}
1
+ {"version":3,"sources":["../../src/search/filters.ts"],"sourcesContent":["function getDomain(url: string): string {\n try {\n return new URL(url).hostname.toLowerCase();\n } catch {\n return '';\n }\n}\n\nfunction normalizeDomain(domain: string): string {\n return domain.replace(/\\/+$/, '').toLowerCase();\n}\n\nfunction domainMatches(hostname: string, domain: string): boolean {\n const normalized = normalizeDomain(domain);\n return hostname === normalized || hostname.endsWith('.' + normalized);\n}\n\nexport function filterByDomains<T extends { url: string }>(\n results: T[],\n includeDomains?: string[],\n excludeDomains?: string[],\n): T[] {\n if (!includeDomains?.length && !excludeDomains?.length) return results;\n\n return results.filter((r) => {\n const hostname = getDomain(r.url);\n if (!hostname) {\n return !includeDomains?.length;\n }\n if (includeDomains?.length) {\n if (!includeDomains.some((d) => domainMatches(hostname, d))) return false;\n }\n if (excludeDomains?.length) {\n if (excludeDomains.some((d) => domainMatches(hostname, d))) return false;\n }\n return true;\n });\n}\n\nfunction isValidIsoDate(dateStr: string): boolean {\n const parsed = new Date(dateStr);\n return !isNaN(parsed.getTime()) && /^\\d{4}-\\d{2}-\\d{2}$/.test(dateStr);\n}\n\nexport function filterByDateRange<T>(\n results: T[],\n fromDate?: string,\n toDate?: string,\n): T[] {\n if (!fromDate && !toDate) return results;\n\n if (fromDate && !isValidIsoDate(fromDate)) return results;\n if (toDate && !isValidIsoDate(toDate)) return results;\n\n if (fromDate && toDate && new Date(fromDate) > new Date(toDate)) return results;\n\n // Date filtering is best-effort on direct scraping engines.\n // SearXNG handles dates natively via time_range. 
For fallback engines,\n // snippet text doesn't reliably contain dates, so we keep all results.\n return results;\n}\n\nexport function filterByCategory<T>(\n results: T[],\n _category?: string,\n): T[] {\n // Category filtering is handled by SearXNG natively.\n return results;\n}\n\nexport interface FilterOptions {\n includeDomains?: string[];\n excludeDomains?: string[];\n fromDate?: string;\n toDate?: string;\n category?: string;\n}\n\nexport function applyAllFilters<T extends { url: string }>(\n results: T[],\n options: FilterOptions,\n): T[] {\n let filtered = filterByDomains(results, options.includeDomains, options.excludeDomains);\n filtered = filterByDateRange(filtered, options.fromDate, options.toDate);\n filtered = filterByCategory(filtered, options.category);\n return filtered;\n}\n"],"mappings":"AAAA,SAAS,UAAU,KAAqB;AACtC,MAAI;AACF,WAAO,IAAI,IAAI,GAAG,EAAE,SAAS,YAAY;AAAA,EAC3C,QAAQ;AACN,WAAO;AAAA,EACT;AACF;AAEA,SAAS,gBAAgB,QAAwB;AAC/C,SAAO,OAAO,QAAQ,QAAQ,EAAE,EAAE,YAAY;AAChD;AAEA,SAAS,cAAc,UAAkB,QAAyB;AAChE,QAAM,aAAa,gBAAgB,MAAM;AACzC,SAAO,aAAa,cAAc,SAAS,SAAS,MAAM,UAAU;AACtE;AAEO,SAAS,gBACd,SACA,gBACA,gBACK;AACL,MAAI,CAAC,gBAAgB,UAAU,CAAC,gBAAgB,OAAQ,QAAO;AAE/D,SAAO,QAAQ,OAAO,CAAC,MAAM;AAC3B,UAAM,WAAW,UAAU,EAAE,GAAG;AAChC,QAAI,CAAC,UAAU;AACb,aAAO,CAAC,gBAAgB;AAAA,IAC1B;AACA,QAAI,gBAAgB,QAAQ;AAC1B,UAAI,CAAC,eAAe,KAAK,CAAC,MAAM,cAAc,UAAU,CAAC,CAAC,EAAG,QAAO;AAAA,IACtE;AACA,QAAI,gBAAgB,QAAQ;AAC1B,UAAI,eAAe,KAAK,CAAC,MAAM,cAAc,UAAU,CAAC,CAAC,EAAG,QAAO;AAAA,IACrE;AACA,WAAO;AAAA,EACT,CAAC;AACH;AAEA,SAAS,eAAe,SAA0B;AAChD,QAAM,SAAS,IAAI,KAAK,OAAO;AAC/B,SAAO,CAAC,MAAM,OAAO,QAAQ,CAAC,KAAK,sBAAsB,KAAK,OAAO;AACvE;AAEO,SAAS,kBACd,SACA,UACA,QACK;AACL,MAAI,CAAC,YAAY,CAAC,OAAQ,QAAO;AAEjC,MAAI,YAAY,CAAC,eAAe,QAAQ,EAAG,QAAO;AAClD,MAAI,UAAU,CAAC,eAAe,MAAM,EAAG,QAAO;AAE9C,MAAI,YAAY,UAAU,IAAI,KAAK,QAAQ,IAAI,IAAI,KAAK,MAAM,EAAG,QAAO;AAKxE,SAAO;AACT;AAEO,SAAS,iBACd,SACA,WACK;AAEL,SAAO;AACT;AAUO,SAAS,gBACd,SACA,SACK;AACL,MAAI,WAAW,gBAAgB,SAAS,QAAQ,gBAAgB,QAAQ,cAAc;AACtF,aAAW,kB
AAkB,UAAU,QAAQ,UAAU,QAAQ,MAAM;AACvE,aAAW,iBAAiB,UAAU,QAAQ,QAAQ;AACtD,SAAO;AACT;","names":[]}
@@ -0,0 +1,9 @@
1
+ import type { FindSimilarInput, FindSimilarOutput } from '../../types.js';
2
+ import type { SmartRouter } from '../../fetch/router.js';
3
+ export interface CrawlRankOptions {
4
+ maxPages?: number;
5
+ concurrency?: number;
6
+ fetchTimeoutMs?: number;
7
+ }
8
+ export declare function crawlRank(seedUrl: string, input: FindSimilarInput, router: SmartRouter, options?: CrawlRankOptions): Promise<FindSimilarOutput>;
9
+ //# sourceMappingURL=crawl-rank.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"crawl-rank.d.ts","sourceRoot":"","sources":["../../../src/search/find-similar/crawl-rank.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EACV,gBAAgB,EAChB,iBAAiB,EAElB,MAAM,gBAAgB,CAAC;AACxB,OAAO,KAAK,EAAE,WAAW,EAAE,MAAM,uBAAuB,CAAC;AAazD,MAAM,WAAW,gBAAgB;IAC/B,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,WAAW,CAAC,EAAE,MAAM,CAAC;IACrB,cAAc,CAAC,EAAE,MAAM,CAAC;CACzB;AASD,wBAAsB,SAAS,CAC7B,OAAO,EAAE,MAAM,EACf,KAAK,EAAE,gBAAgB,EACvB,MAAM,EAAE,WAAW,EACnB,OAAO,GAAE,gBAAqB,GAC7B,OAAO,CAAC,iBAAiB,CAAC,CA+J5B"}