@staticn0va/wigolo 0.1.0 → 0.1.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (982)
  1. package/LICENSE +1 -1
  2. package/README.md +195 -73
  3. package/SKILL.md +382 -0
  4. package/assets/blocks/claude-code/CLAUDE.md.block +20 -0
  5. package/assets/blocks/claude-code/wigolo-command.md +40 -0
  6. package/assets/blocks/cursor/wigolo.mdc +46 -0
  7. package/assets/blocks/gemini-cli/GEMINI.md.block +18 -0
  8. package/assets/blocks/vscode/copilot-instructions.md.block +18 -0
  9. package/assets/skills/wigolo/SKILL.md +50 -0
  10. package/assets/skills/wigolo/rules/cache-first.md +30 -0
  11. package/assets/skills/wigolo/rules/synthesis.md +43 -0
  12. package/assets/skills/wigolo-agent/SKILL.md +73 -0
  13. package/assets/skills/wigolo-crawl/SKILL.md +60 -0
  14. package/assets/skills/wigolo-extract/SKILL.md +59 -0
  15. package/assets/skills/wigolo-fetch/SKILL.md +65 -0
  16. package/assets/skills/wigolo-find-similar/SKILL.md +72 -0
  17. package/assets/skills/wigolo-research/SKILL.md +77 -0
  18. package/assets/skills/wigolo-search/SKILL.md +78 -0
  19. package/dist/agent/executor.d.ts +33 -0
  20. package/dist/agent/executor.d.ts.map +1 -0
  21. package/dist/agent/executor.js +233 -0
  22. package/dist/agent/executor.js.map +1 -0
  23. package/dist/agent/pipeline.d.ts +5 -0
  24. package/dist/agent/pipeline.d.ts.map +1 -0
  25. package/dist/agent/pipeline.js +208 -0
  26. package/dist/agent/pipeline.js.map +1 -0
  27. package/dist/agent/planner.d.ts +13 -0
  28. package/dist/agent/planner.d.ts.map +1 -0
  29. package/dist/agent/planner.js +271 -0
  30. package/dist/agent/planner.js.map +1 -0
  31. package/dist/agent/relevance.d.ts +15 -0
  32. package/dist/agent/relevance.d.ts.map +1 -0
  33. package/dist/agent/relevance.js +60 -0
  34. package/dist/agent/relevance.js.map +1 -0
  35. package/dist/cache/backfill-embeddings.d.ts +23 -0
  36. package/dist/cache/backfill-embeddings.d.ts.map +1 -0
  37. package/dist/cache/backfill-embeddings.js +105 -0
  38. package/dist/cache/backfill-embeddings.js.map +1 -0
  39. package/dist/cache/change-detector.d.ts +7 -0
  40. package/dist/cache/change-detector.d.ts.map +1 -0
  41. package/dist/cache/change-detector.js +43 -0
  42. package/dist/cache/change-detector.js.map +1 -0
  43. package/dist/cache/db.d.ts +1 -0
  44. package/dist/cache/db.d.ts.map +1 -1
  45. package/dist/cache/db.js +94 -22
  46. package/dist/cache/db.js.map +1 -1
  47. package/dist/cache/diff-summary.d.ts +2 -0
  48. package/dist/cache/diff-summary.d.ts.map +1 -0
  49. package/dist/cache/diff-summary.js +82 -0
  50. package/dist/cache/diff-summary.js.map +1 -0
  51. package/dist/cache/migrations/runner.d.ts +29 -0
  52. package/dist/cache/migrations/runner.d.ts.map +1 -0
  53. package/dist/cache/migrations/runner.js +147 -0
  54. package/dist/cache/migrations/runner.js.map +1 -0
  55. package/dist/cache/sqlite-vec-store.d.ts +42 -0
  56. package/dist/cache/sqlite-vec-store.d.ts.map +1 -0
  57. package/dist/cache/sqlite-vec-store.js +176 -0
  58. package/dist/cache/sqlite-vec-store.js.map +1 -0
  59. package/dist/cache/store.d.ts +46 -1
  60. package/dist/cache/store.d.ts.map +1 -1
  61. package/dist/cache/store.js +362 -168
  62. package/dist/cache/store.js.map +1 -1
  63. package/dist/cli/agents/antigravity.d.ts +20 -0
  64. package/dist/cli/agents/antigravity.d.ts.map +1 -0
  65. package/dist/cli/agents/antigravity.js +49 -0
  66. package/dist/cli/agents/antigravity.js.map +1 -0
  67. package/dist/cli/agents/claude-code.d.ts +25 -0
  68. package/dist/cli/agents/claude-code.d.ts.map +1 -0
  69. package/dist/cli/agents/claude-code.js +111 -0
  70. package/dist/cli/agents/claude-code.js.map +1 -0
  71. package/dist/cli/agents/cursor.d.ts +21 -0
  72. package/dist/cli/agents/cursor.d.ts.map +1 -0
  73. package/dist/cli/agents/cursor.js +58 -0
  74. package/dist/cli/agents/cursor.js.map +1 -0
  75. package/dist/cli/agents/gemini-cli.d.ts +21 -0
  76. package/dist/cli/agents/gemini-cli.d.ts.map +1 -0
  77. package/dist/cli/agents/gemini-cli.js +55 -0
  78. package/dist/cli/agents/gemini-cli.js.map +1 -0
  79. package/dist/cli/agents/registry.d.ts +21 -0
  80. package/dist/cli/agents/registry.d.ts.map +1 -0
  81. package/dist/cli/agents/registry.js +27 -0
  82. package/dist/cli/agents/registry.js.map +1 -0
  83. package/dist/cli/agents/utils.d.ts +26 -0
  84. package/dist/cli/agents/utils.d.ts.map +1 -0
  85. package/dist/cli/agents/utils.js +136 -0
  86. package/dist/cli/agents/utils.js.map +1 -0
  87. package/dist/cli/agents/vscode.d.ts +21 -0
  88. package/dist/cli/agents/vscode.d.ts.map +1 -0
  89. package/dist/cli/agents/vscode.js +62 -0
  90. package/dist/cli/agents/vscode.js.map +1 -0
  91. package/dist/cli/auth.d.ts +2 -0
  92. package/dist/cli/auth.d.ts.map +1 -0
  93. package/dist/cli/auth.js +94 -0
  94. package/dist/cli/auth.js.map +1 -0
  95. package/dist/cli/backfill.d.ts +2 -0
  96. package/dist/cli/backfill.d.ts.map +1 -0
  97. package/dist/cli/backfill.js +58 -0
  98. package/dist/cli/backfill.js.map +1 -0
  99. package/dist/cli/daemon.d.ts +6 -1
  100. package/dist/cli/daemon.d.ts.map +1 -1
  101. package/dist/cli/daemon.js +61 -3
  102. package/dist/cli/daemon.js.map +1 -1
  103. package/dist/cli/doctor.d.ts +8 -0
  104. package/dist/cli/doctor.d.ts.map +1 -0
  105. package/dist/cli/doctor.js +318 -0
  106. package/dist/cli/doctor.js.map +1 -0
  107. package/dist/cli/health.d.ts +1 -1
  108. package/dist/cli/health.d.ts.map +1 -1
  109. package/dist/cli/health.js +42 -3
  110. package/dist/cli/health.js.map +1 -1
  111. package/dist/cli/help.d.ts +6 -0
  112. package/dist/cli/help.d.ts.map +1 -0
  113. package/dist/cli/help.js +63 -0
  114. package/dist/cli/help.js.map +1 -0
  115. package/dist/cli/index.d.ts +1 -1
  116. package/dist/cli/index.d.ts.map +1 -1
  117. package/dist/cli/index.js +35 -7
  118. package/dist/cli/index.js.map +1 -1
  119. package/dist/cli/init.d.ts +2 -0
  120. package/dist/cli/init.d.ts.map +1 -0
  121. package/dist/cli/init.js +201 -0
  122. package/dist/cli/init.js.map +1 -0
  123. package/dist/cli/plugin.d.ts +5 -0
  124. package/dist/cli/plugin.d.ts.map +1 -0
  125. package/dist/cli/plugin.js +185 -0
  126. package/dist/cli/plugin.js.map +1 -0
  127. package/dist/cli/setup-mcp.d.ts +2 -0
  128. package/dist/cli/setup-mcp.d.ts.map +1 -0
  129. package/dist/cli/setup-mcp.js +114 -0
  130. package/dist/cli/setup-mcp.js.map +1 -0
  131. package/dist/cli/shell.d.ts +2 -0
  132. package/dist/cli/shell.d.ts.map +1 -0
  133. package/dist/cli/shell.js +86 -0
  134. package/dist/cli/shell.js.map +1 -0
  135. package/dist/cli/status.d.ts +2 -0
  136. package/dist/cli/status.d.ts.map +1 -0
  137. package/dist/cli/status.js +31 -0
  138. package/dist/cli/status.js.map +1 -0
  139. package/dist/cli/telemetry.d.ts +10 -0
  140. package/dist/cli/telemetry.d.ts.map +1 -0
  141. package/dist/cli/telemetry.js +56 -0
  142. package/dist/cli/telemetry.js.map +1 -0
  143. package/dist/cli/tui/agents-types.d.ts +28 -0
  144. package/dist/cli/tui/agents-types.d.ts.map +1 -0
  145. package/dist/cli/tui/agents-types.js +1 -0
  146. package/dist/cli/tui/agents-types.js.map +1 -0
  147. package/dist/cli/tui/agents.d.ts +11 -0
  148. package/dist/cli/tui/agents.d.ts.map +1 -0
  149. package/dist/cli/tui/agents.js +93 -0
  150. package/dist/cli/tui/agents.js.map +1 -0
  151. package/dist/cli/tui/banner.d.ts +3 -0
  152. package/dist/cli/tui/banner.d.ts.map +1 -0
  153. package/dist/cli/tui/banner.js +30 -0
  154. package/dist/cli/tui/banner.js.map +1 -0
  155. package/dist/cli/tui/components/AgentSelect.d.ts +13 -0
  156. package/dist/cli/tui/components/AgentSelect.d.ts.map +1 -0
  157. package/dist/cli/tui/components/AgentSelect.js +116 -0
  158. package/dist/cli/tui/components/AgentSelect.js.map +1 -0
  159. package/dist/cli/tui/components/Banner.d.ts +6 -0
  160. package/dist/cli/tui/components/Banner.d.ts.map +1 -0
  161. package/dist/cli/tui/components/Banner.js +25 -0
  162. package/dist/cli/tui/components/Banner.js.map +1 -0
  163. package/dist/cli/tui/components/BrowserSelect.d.ts +7 -0
  164. package/dist/cli/tui/components/BrowserSelect.d.ts.map +1 -0
  165. package/dist/cli/tui/components/BrowserSelect.js +19 -0
  166. package/dist/cli/tui/components/BrowserSelect.js.map +1 -0
  167. package/dist/cli/tui/components/InstallProgress.d.ts +9 -0
  168. package/dist/cli/tui/components/InstallProgress.d.ts.map +1 -0
  169. package/dist/cli/tui/components/InstallProgress.js +67 -0
  170. package/dist/cli/tui/components/InstallProgress.js.map +1 -0
  171. package/dist/cli/tui/components/SkillInstall.d.ts +14 -0
  172. package/dist/cli/tui/components/SkillInstall.d.ts.map +1 -0
  173. package/dist/cli/tui/components/SkillInstall.js +94 -0
  174. package/dist/cli/tui/components/SkillInstall.js.map +1 -0
  175. package/dist/cli/tui/components/Summary.d.ts +22 -0
  176. package/dist/cli/tui/components/Summary.d.ts.map +1 -0
  177. package/dist/cli/tui/components/Summary.js +135 -0
  178. package/dist/cli/tui/components/Summary.js.map +1 -0
  179. package/dist/cli/tui/components/SystemCheck.d.ts +8 -0
  180. package/dist/cli/tui/components/SystemCheck.d.ts.map +1 -0
  181. package/dist/cli/tui/components/SystemCheck.js +71 -0
  182. package/dist/cli/tui/components/SystemCheck.js.map +1 -0
  183. package/dist/cli/tui/components/Verification.d.ts +8 -0
  184. package/dist/cli/tui/components/Verification.d.ts.map +1 -0
  185. package/dist/cli/tui/components/Verification.js +63 -0
  186. package/dist/cli/tui/components/Verification.js.map +1 -0
  187. package/dist/cli/tui/config-writer-cli.d.ts +12 -0
  188. package/dist/cli/tui/config-writer-cli.d.ts.map +1 -0
  189. package/dist/cli/tui/config-writer-cli.js +39 -0
  190. package/dist/cli/tui/config-writer-cli.js.map +1 -0
  191. package/dist/cli/tui/config-writer-json.d.ts +16 -0
  192. package/dist/cli/tui/config-writer-json.d.ts.map +1 -0
  193. package/dist/cli/tui/config-writer-json.js +86 -0
  194. package/dist/cli/tui/config-writer-json.js.map +1 -0
  195. package/dist/cli/tui/config-writer-toml.d.ts +16 -0
  196. package/dist/cli/tui/config-writer-toml.d.ts.map +1 -0
  197. package/dist/cli/tui/config-writer-toml.js +83 -0
  198. package/dist/cli/tui/config-writer-toml.js.map +1 -0
  199. package/dist/cli/tui/config-writer.d.ts +25 -0
  200. package/dist/cli/tui/config-writer.d.ts.map +1 -0
  201. package/dist/cli/tui/config-writer.js +101 -0
  202. package/dist/cli/tui/config-writer.js.map +1 -0
  203. package/dist/cli/tui/detect-helpers.d.ts +6 -0
  204. package/dist/cli/tui/detect-helpers.d.ts.map +1 -0
  205. package/dist/cli/tui/detect-helpers.js +45 -0
  206. package/dist/cli/tui/detect-helpers.js.map +1 -0
  207. package/dist/cli/tui/extras-prompt.d.ts +7 -0
  208. package/dist/cli/tui/extras-prompt.d.ts.map +1 -0
  209. package/dist/cli/tui/extras-prompt.js +42 -0
  210. package/dist/cli/tui/extras-prompt.js.map +1 -0
  211. package/dist/cli/tui/flags-types.d.ts +19 -0
  212. package/dist/cli/tui/flags-types.d.ts.map +1 -0
  213. package/dist/cli/tui/flags-types.js +23 -0
  214. package/dist/cli/tui/flags-types.js.map +1 -0
  215. package/dist/cli/tui/flags.d.ts +5 -0
  216. package/dist/cli/tui/flags.d.ts.map +1 -0
  217. package/dist/cli/tui/flags.js +132 -0
  218. package/dist/cli/tui/flags.js.map +1 -0
  219. package/dist/cli/tui/format.d.ts +14 -0
  220. package/dist/cli/tui/format.d.ts.map +1 -0
  221. package/dist/cli/tui/format.js +37 -0
  222. package/dist/cli/tui/format.js.map +1 -0
  223. package/dist/cli/tui/hooks/useAgentDetect.d.ts +6 -0
  224. package/dist/cli/tui/hooks/useAgentDetect.d.ts.map +1 -0
  225. package/dist/cli/tui/hooks/useAgentDetect.js +19 -0
  226. package/dist/cli/tui/hooks/useAgentDetect.js.map +1 -0
  227. package/dist/cli/tui/hooks/useInstall.d.ts +14 -0
  228. package/dist/cli/tui/hooks/useInstall.d.ts.map +1 -0
  229. package/dist/cli/tui/hooks/useInstall.js +90 -0
  230. package/dist/cli/tui/hooks/useInstall.js.map +1 -0
  231. package/dist/cli/tui/hooks/useSystemCheck.d.ts +13 -0
  232. package/dist/cli/tui/hooks/useSystemCheck.d.ts.map +1 -0
  233. package/dist/cli/tui/hooks/useSystemCheck.js +95 -0
  234. package/dist/cli/tui/hooks/useSystemCheck.js.map +1 -0
  235. package/dist/cli/tui/hooks/useVerify.d.ts +14 -0
  236. package/dist/cli/tui/hooks/useVerify.d.ts.map +1 -0
  237. package/dist/cli/tui/hooks/useVerify.js +71 -0
  238. package/dist/cli/tui/hooks/useVerify.js.map +1 -0
  239. package/dist/cli/tui/ink-init.d.ts +2 -0
  240. package/dist/cli/tui/ink-init.d.ts.map +1 -0
  241. package/dist/cli/tui/ink-init.js +198 -0
  242. package/dist/cli/tui/ink-init.js.map +1 -0
  243. package/dist/cli/tui/reporter-auto.d.ts +7 -0
  244. package/dist/cli/tui/reporter-auto.d.ts.map +1 -0
  245. package/dist/cli/tui/reporter-auto.js +15 -0
  246. package/dist/cli/tui/reporter-auto.js.map +1 -0
  247. package/dist/cli/tui/reporter.d.ts +26 -0
  248. package/dist/cli/tui/reporter.d.ts.map +1 -0
  249. package/dist/cli/tui/reporter.js +32 -0
  250. package/dist/cli/tui/reporter.js.map +1 -0
  251. package/dist/cli/tui/run-command.d.ts +14 -0
  252. package/dist/cli/tui/run-command.d.ts.map +1 -0
  253. package/dist/cli/tui/run-command.js +72 -0
  254. package/dist/cli/tui/run-command.js.map +1 -0
  255. package/dist/cli/tui/select-agents.d.ts +6 -0
  256. package/dist/cli/tui/select-agents.d.ts.map +1 -0
  257. package/dist/cli/tui/select-agents.js +32 -0
  258. package/dist/cli/tui/select-agents.js.map +1 -0
  259. package/dist/cli/tui/status-agents.d.ts +11 -0
  260. package/dist/cli/tui/status-agents.d.ts.map +1 -0
  261. package/dist/cli/tui/status-agents.js +53 -0
  262. package/dist/cli/tui/status-agents.js.map +1 -0
  263. package/dist/cli/tui/status-cache.d.ts +6 -0
  264. package/dist/cli/tui/status-cache.d.ts.map +1 -0
  265. package/dist/cli/tui/status-cache.js +39 -0
  266. package/dist/cli/tui/status-cache.js.map +1 -0
  267. package/dist/cli/tui/status-format.d.ts +14 -0
  268. package/dist/cli/tui/status-format.d.ts.map +1 -0
  269. package/dist/cli/tui/status-format.js +41 -0
  270. package/dist/cli/tui/status-format.js.map +1 -0
  271. package/dist/cli/tui/status-python.d.ts +6 -0
  272. package/dist/cli/tui/status-python.d.ts.map +1 -0
  273. package/dist/cli/tui/status-python.js +30 -0
  274. package/dist/cli/tui/status-python.js.map +1 -0
  275. package/dist/cli/tui/system-check.d.ts +24 -0
  276. package/dist/cli/tui/system-check.d.ts.map +1 -0
  277. package/dist/cli/tui/system-check.js +103 -0
  278. package/dist/cli/tui/system-check.js.map +1 -0
  279. package/dist/cli/tui/tui-reporter.d.ts +19 -0
  280. package/dist/cli/tui/tui-reporter.d.ts.map +1 -0
  281. package/dist/cli/tui/tui-reporter.js +95 -0
  282. package/dist/cli/tui/tui-reporter.js.map +1 -0
  283. package/dist/cli/tui/utils/config-writer.d.ts +3 -0
  284. package/dist/cli/tui/utils/config-writer.d.ts.map +1 -0
  285. package/dist/cli/tui/utils/config-writer.js +22 -0
  286. package/dist/cli/tui/utils/config-writer.js.map +1 -0
  287. package/dist/cli/tui/utils/suppress-logs.d.ts +3 -0
  288. package/dist/cli/tui/utils/suppress-logs.d.ts.map +1 -0
  289. package/dist/cli/tui/utils/suppress-logs.js +11 -0
  290. package/dist/cli/tui/utils/suppress-logs.js.map +1 -0
  291. package/dist/cli/tui/verify-suggestions.d.ts +5 -0
  292. package/dist/cli/tui/verify-suggestions.d.ts.map +1 -0
  293. package/dist/cli/tui/verify-suggestions.js +20 -0
  294. package/dist/cli/tui/verify-suggestions.js.map +1 -0
  295. package/dist/cli/tui/verify.d.ts +14 -0
  296. package/dist/cli/tui/verify.d.ts.map +1 -0
  297. package/dist/cli/tui/verify.js +101 -0
  298. package/dist/cli/tui/verify.js.map +1 -0
  299. package/dist/cli/tui/version.d.ts +2 -0
  300. package/dist/cli/tui/version.d.ts.map +1 -0
  301. package/dist/cli/tui/version.js +14 -0
  302. package/dist/cli/tui/version.js.map +1 -0
  303. package/dist/cli/uninstall.d.ts +2 -0
  304. package/dist/cli/uninstall.d.ts.map +1 -0
  305. package/dist/cli/uninstall.js +57 -0
  306. package/dist/cli/uninstall.js.map +1 -0
  307. package/dist/cli/warmup.d.ts +10 -2
  308. package/dist/cli/warmup.d.ts.map +1 -1
  309. package/dist/cli/warmup.js +226 -93
  310. package/dist/cli/warmup.js.map +1 -1
  311. package/dist/config.d.ts +28 -2
  312. package/dist/config.d.ts.map +1 -1
  313. package/dist/config.js +106 -56
  314. package/dist/config.js.map +1 -1
  315. package/dist/crawl/crawler.d.ts +6 -0
  316. package/dist/crawl/crawler.d.ts.map +1 -1
  317. package/dist/crawl/crawler.js +210 -209
  318. package/dist/crawl/crawler.js.map +1 -1
  319. package/dist/crawl/dedup.d.ts +1 -0
  320. package/dist/crawl/dedup.d.ts.map +1 -1
  321. package/dist/crawl/dedup.js +124 -81
  322. package/dist/crawl/dedup.js.map +1 -1
  323. package/dist/crawl/etag-incremental.d.ts +43 -0
  324. package/dist/crawl/etag-incremental.d.ts.map +1 -0
  325. package/dist/crawl/etag-incremental.js +94 -0
  326. package/dist/crawl/etag-incremental.js.map +1 -0
  327. package/dist/crawl/index-to-vec.d.ts +10 -0
  328. package/dist/crawl/index-to-vec.d.ts.map +1 -0
  329. package/dist/crawl/index-to-vec.js +44 -0
  330. package/dist/crawl/index-to-vec.js.map +1 -0
  331. package/dist/crawl/mapper.js +136 -164
  332. package/dist/crawl/mapper.js.map +1 -1
  333. package/dist/crawl/rate-limiter.js +63 -66
  334. package/dist/crawl/rate-limiter.js.map +1 -1
  335. package/dist/crawl/robots.js +58 -57
  336. package/dist/crawl/robots.js.map +1 -1
  337. package/dist/crawl/sitemap-first.d.ts +12 -0
  338. package/dist/crawl/sitemap-first.d.ts.map +1 -0
  339. package/dist/crawl/sitemap-first.js +47 -0
  340. package/dist/crawl/sitemap-first.js.map +1 -0
  341. package/dist/crawl/sitemap.js +33 -32
  342. package/dist/crawl/sitemap.js.map +1 -1
  343. package/dist/crawl/url-utils.d.ts +1 -0
  344. package/dist/crawl/url-utils.d.ts.map +1 -1
  345. package/dist/crawl/url-utils.js +49 -37
  346. package/dist/crawl/url-utils.js.map +1 -1
  347. package/dist/daemon/health-check.d.ts +16 -0
  348. package/dist/daemon/health-check.d.ts.map +1 -0
  349. package/dist/daemon/health-check.js +33 -0
  350. package/dist/daemon/health-check.js.map +1 -0
  351. package/dist/daemon/http-server.d.ts +26 -0
  352. package/dist/daemon/http-server.d.ts.map +1 -0
  353. package/dist/daemon/http-server.js +275 -0
  354. package/dist/daemon/http-server.js.map +1 -0
  355. package/dist/daemon/proxy.d.ts +10 -0
  356. package/dist/daemon/proxy.d.ts.map +1 -0
  357. package/dist/daemon/proxy.js +93 -0
  358. package/dist/daemon/proxy.js.map +1 -0
  359. package/dist/embedding/embed.d.ts +59 -0
  360. package/dist/embedding/embed.d.ts.map +1 -0
  361. package/dist/embedding/embed.js +233 -0
  362. package/dist/embedding/embed.js.map +1 -0
  363. package/dist/embedding/fastembed-provider.d.ts +19 -0
  364. package/dist/embedding/fastembed-provider.d.ts.map +1 -0
  365. package/dist/embedding/fastembed-provider.js +51 -0
  366. package/dist/embedding/fastembed-provider.js.map +1 -0
  367. package/dist/embedding/key-terms.d.ts +12 -0
  368. package/dist/embedding/key-terms.d.ts.map +1 -0
  369. package/dist/embedding/key-terms.js +234 -0
  370. package/dist/embedding/key-terms.js.map +1 -0
  371. package/dist/extraction/boilerplate.d.ts +15 -0
  372. package/dist/extraction/boilerplate.d.ts.map +1 -0
  373. package/dist/extraction/boilerplate.js +52 -0
  374. package/dist/extraction/boilerplate.js.map +1 -0
  375. package/dist/extraction/defuddle.d.ts.map +1 -1
  376. package/dist/extraction/defuddle.js +27 -23
  377. package/dist/extraction/defuddle.js.map +1 -1
  378. package/dist/extraction/extract.d.ts.map +1 -1
  379. package/dist/extraction/extract.js +76 -76
  380. package/dist/extraction/extract.js.map +1 -1
  381. package/dist/extraction/jsonld.js +50 -54
  382. package/dist/extraction/jsonld.js.map +1 -1
  383. package/dist/extraction/lang-hints.d.ts +2 -0
  384. package/dist/extraction/lang-hints.d.ts.map +1 -0
  385. package/dist/extraction/lang-hints.js +30 -0
  386. package/dist/extraction/lang-hints.js.map +1 -0
  387. package/dist/extraction/llm-fallback.d.ts +17 -0
  388. package/dist/extraction/llm-fallback.d.ts.map +1 -0
  389. package/dist/extraction/llm-fallback.js +130 -0
  390. package/dist/extraction/llm-fallback.js.map +1 -0
  391. package/dist/extraction/markdown-sanitize.d.ts +2 -0
  392. package/dist/extraction/markdown-sanitize.d.ts.map +1 -0
  393. package/dist/extraction/markdown-sanitize.js +151 -0
  394. package/dist/extraction/markdown-sanitize.js.map +1 -0
  395. package/dist/extraction/markdown.d.ts +11 -0
  396. package/dist/extraction/markdown.d.ts.map +1 -1
  397. package/dist/extraction/markdown.js +195 -91
  398. package/dist/extraction/markdown.js.map +1 -1
  399. package/dist/extraction/pipeline.d.ts +8 -0
  400. package/dist/extraction/pipeline.d.ts.map +1 -1
  401. package/dist/extraction/pipeline.js +57 -91
  402. package/dist/extraction/pipeline.js.map +1 -1
  403. package/dist/extraction/readability.d.ts +1 -1
  404. package/dist/extraction/readability.d.ts.map +1 -1
  405. package/dist/extraction/readability.js +28 -29
  406. package/dist/extraction/readability.js.map +1 -1
  407. package/dist/extraction/schema.d.ts +12 -0
  408. package/dist/extraction/schema.d.ts.map +1 -1
  409. package/dist/extraction/schema.js +135 -72
  410. package/dist/extraction/schema.js.map +1 -1
  411. package/dist/extraction/site-extractors/docs-generic.d.ts.map +1 -1
  412. package/dist/extraction/site-extractors/docs-generic.js +81 -91
  413. package/dist/extraction/site-extractors/docs-generic.js.map +1 -1
  414. package/dist/extraction/site-extractors/github.d.ts.map +1 -1
  415. package/dist/extraction/site-extractors/github.js +87 -95
  416. package/dist/extraction/site-extractors/github.js.map +1 -1
  417. package/dist/extraction/site-extractors/mdn.d.ts.map +1 -1
  418. package/dist/extraction/site-extractors/mdn.js +46 -54
  419. package/dist/extraction/site-extractors/mdn.js.map +1 -1
  420. package/dist/extraction/site-extractors/stackoverflow.d.ts.map +1 -1
  421. package/dist/extraction/site-extractors/stackoverflow.js +71 -80
  422. package/dist/extraction/site-extractors/stackoverflow.js.map +1 -1
  423. package/dist/extraction/structured-data.d.ts +4 -0
  424. package/dist/extraction/structured-data.d.ts.map +1 -0
  425. package/dist/extraction/structured-data.js +173 -0
  426. package/dist/extraction/structured-data.js.map +1 -0
  427. package/dist/extraction/structured.d.ts +4 -0
  428. package/dist/extraction/structured.d.ts.map +1 -0
  429. package/dist/extraction/structured.js +163 -0
  430. package/dist/extraction/structured.js.map +1 -0
  431. package/dist/extraction/v1/classifier.d.ts +3 -0
  432. package/dist/extraction/v1/classifier.d.ts.map +1 -0
  433. package/dist/extraction/v1/classifier.js +110 -0
  434. package/dist/extraction/v1/classifier.js.map +1 -0
  435. package/dist/extraction/v1/extract-provider.d.ts +16 -0
  436. package/dist/extraction/v1/extract-provider.d.ts.map +1 -0
  437. package/dist/extraction/v1/extract-provider.js +43 -0
  438. package/dist/extraction/v1/extract-provider.js.map +1 -0
  439. package/dist/extraction/v1/local-llm.d.ts +8 -0
  440. package/dist/extraction/v1/local-llm.d.ts.map +1 -0
  441. package/dist/extraction/v1/local-llm.js +58 -0
  442. package/dist/extraction/v1/local-llm.js.map +1 -0
  443. package/dist/extraction/v1/news.d.ts +3 -0
  444. package/dist/extraction/v1/news.d.ts.map +1 -0
  445. package/dist/extraction/v1/news.js +61 -0
  446. package/dist/extraction/v1/news.js.map +1 -0
  447. package/dist/extraction/v1/product.d.ts +3 -0
  448. package/dist/extraction/v1/product.d.ts.map +1 -0
  449. package/dist/extraction/v1/product.js +166 -0
  450. package/dist/extraction/v1/product.js.map +1 -0
  451. package/dist/extraction/v1/recipe.d.ts +3 -0
  452. package/dist/extraction/v1/recipe.d.ts.map +1 -0
  453. package/dist/extraction/v1/recipe.js +136 -0
  454. package/dist/extraction/v1/recipe.js.map +1 -0
  455. package/dist/extraction/v1/routed.d.ts +17 -0
  456. package/dist/extraction/v1/routed.d.ts.map +1 -0
  457. package/dist/extraction/v1/routed.js +68 -0
  458. package/dist/extraction/v1/routed.js.map +1 -0
  459. package/dist/extraction/v1/schemas/Article.d.ts +11 -0
  460. package/dist/extraction/v1/schemas/Article.d.ts.map +1 -0
  461. package/dist/extraction/v1/schemas/Article.js +23 -0
  462. package/dist/extraction/v1/schemas/Article.js.map +1 -0
  463. package/dist/extraction/v1/schemas/CodeSnippet.d.ts +9 -0
  464. package/dist/extraction/v1/schemas/CodeSnippet.d.ts.map +1 -0
  465. package/dist/extraction/v1/schemas/CodeSnippet.js +90 -0
  466. package/dist/extraction/v1/schemas/CodeSnippet.js.map +1 -0
  467. package/dist/extraction/v1/schemas/EventListing.d.ts +10 -0
  468. package/dist/extraction/v1/schemas/EventListing.d.ts.map +1 -0
  469. package/dist/extraction/v1/schemas/EventListing.js +122 -0
  470. package/dist/extraction/v1/schemas/EventListing.js.map +1 -0
  471. package/dist/extraction/v1/schemas/Paper.d.ts +10 -0
  472. package/dist/extraction/v1/schemas/Paper.d.ts.map +1 -0
  473. package/dist/extraction/v1/schemas/Paper.js +156 -0
  474. package/dist/extraction/v1/schemas/Paper.js.map +1 -0
  475. package/dist/extraction/v1/schemas/Product.d.ts +17 -0
  476. package/dist/extraction/v1/schemas/Product.d.ts.map +1 -0
  477. package/dist/extraction/v1/schemas/Product.js +149 -0
  478. package/dist/extraction/v1/schemas/Product.js.map +1 -0
  479. package/dist/extraction/v1/schemas/Recipe.d.ts +14 -0
  480. package/dist/extraction/v1/schemas/Recipe.d.ts.map +1 -0
  481. package/dist/extraction/v1/schemas/Recipe.js +160 -0
  482. package/dist/extraction/v1/schemas/Recipe.js.map +1 -0
  483. package/dist/extraction/v1/schemas/index.d.ts +13 -0
  484. package/dist/extraction/v1/schemas/index.d.ts.map +1 -0
  485. package/dist/extraction/v1/schemas/index.js +44 -0
  486. package/dist/extraction/v1/schemas/index.js.map +1 -0
  487. package/dist/extraction/v1/site-extractors.d.ts +5 -0
  488. package/dist/extraction/v1/site-extractors.d.ts.map +1 -0
  489. package/dist/extraction/v1/site-extractors.js +31 -0
  490. package/dist/extraction/v1/site-extractors.js.map +1 -0
  491. package/dist/fetch/action-executor.d.ts +28 -0
  492. package/dist/fetch/action-executor.d.ts.map +1 -0
  493. package/dist/fetch/action-executor.js +88 -0
  494. package/dist/fetch/action-executor.js.map +1 -0
  495. package/dist/fetch/auth.d.ts +2 -1
  496. package/dist/fetch/auth.d.ts.map +1 -1
  497. package/dist/fetch/auth.js +56 -26
  498. package/dist/fetch/auth.js.map +1 -1
  499. package/dist/fetch/browser-pool.d.ts +30 -11
  500. package/dist/fetch/browser-pool.d.ts.map +1 -1
  501. package/dist/fetch/browser-pool.js +303 -127
  502. package/dist/fetch/browser-pool.js.map +1 -1
  503. package/dist/fetch/browser-selector.d.ts +17 -0
  504. package/dist/fetch/browser-selector.d.ts.map +1 -0
  505. package/dist/fetch/browser-selector.js +72 -0
  506. package/dist/fetch/browser-selector.js.map +1 -0
  507. package/dist/fetch/browser-types.d.ts +3 -0
  508. package/dist/fetch/browser-types.d.ts.map +1 -0
  509. package/dist/fetch/browser-types.js +45 -0
  510. package/dist/fetch/browser-types.js.map +1 -0
  511. package/dist/fetch/cdp-client.d.ts +9 -0
  512. package/dist/fetch/cdp-client.d.ts.map +1 -0
  513. package/dist/fetch/cdp-client.js +89 -0
  514. package/dist/fetch/cdp-client.js.map +1 -0
  515. package/dist/fetch/content-check.js +39 -46
  516. package/dist/fetch/content-check.js.map +1 -1
  517. package/dist/fetch/http-client.d.ts +4 -0
  518. package/dist/fetch/http-client.d.ts.map +1 -1
  519. package/dist/fetch/http-client.js +147 -128
  520. package/dist/fetch/http-client.js.map +1 -1
  521. package/dist/fetch/lightpanda.d.ts +28 -0
  522. package/dist/fetch/lightpanda.d.ts.map +1 -0
  523. package/dist/fetch/lightpanda.js +174 -0
  524. package/dist/fetch/lightpanda.js.map +1 -0
  525. package/dist/fetch/playwright-tier.d.ts +19 -0
  526. package/dist/fetch/playwright-tier.d.ts.map +1 -0
  527. package/dist/fetch/playwright-tier.js +76 -0
  528. package/dist/fetch/playwright-tier.js.map +1 -0
  529. package/dist/fetch/router.d.ts +49 -3
  530. package/dist/fetch/router.d.ts.map +1 -1
  531. package/dist/fetch/router.js +185 -81
  532. package/dist/fetch/router.js.map +1 -1
  533. package/dist/index.js +97 -17
  534. package/dist/index.js.map +1 -1
  535. package/dist/instructions.d.ts +31 -0
  536. package/dist/instructions.d.ts.map +1 -0
  537. package/dist/instructions.js +245 -0
  538. package/dist/instructions.js.map +1 -0
  539. package/dist/integrations/cloud/llm/anthropic.d.ts +3 -0
  540. package/dist/integrations/cloud/llm/anthropic.d.ts.map +1 -0
  541. package/dist/integrations/cloud/llm/anthropic.js +41 -0
  542. package/dist/integrations/cloud/llm/anthropic.js.map +1 -0
  543. package/dist/integrations/cloud/llm/cache.d.ts +5 -0
  544. package/dist/integrations/cloud/llm/cache.d.ts.map +1 -0
  545. package/dist/integrations/cloud/llm/cache.js +49 -0
  546. package/dist/integrations/cloud/llm/cache.js.map +1 -0
  547. package/dist/integrations/cloud/llm/gemini.d.ts +3 -0
  548. package/dist/integrations/cloud/llm/gemini.d.ts.map +1 -0
  549. package/dist/integrations/cloud/llm/gemini.js +37 -0
  550. package/dist/integrations/cloud/llm/gemini.js.map +1 -0
  551. package/dist/integrations/cloud/llm/groq.d.ts +3 -0
  552. package/dist/integrations/cloud/llm/groq.d.ts.map +1 -0
  553. package/dist/integrations/cloud/llm/groq.js +74 -0
  554. package/dist/integrations/cloud/llm/groq.js.map +1 -0
  555. package/dist/integrations/cloud/llm/hash.d.ts +3 -0
  556. package/dist/integrations/cloud/llm/hash.d.ts.map +1 -0
  557. package/dist/integrations/cloud/llm/hash.js +26 -0
  558. package/dist/integrations/cloud/llm/hash.js.map +1 -0
  559. package/dist/integrations/cloud/llm/openai.d.ts +3 -0
  560. package/dist/integrations/cloud/llm/openai.d.ts.map +1 -0
  561. package/dist/integrations/cloud/llm/openai.js +43 -0
  562. package/dist/integrations/cloud/llm/openai.js.map +1 -0
  563. package/dist/integrations/cloud/llm/select.d.ts +5 -0
  564. package/dist/integrations/cloud/llm/select.d.ts.map +1 -0
  565. package/dist/integrations/cloud/llm/select.js +30 -0
  566. package/dist/integrations/cloud/llm/select.js.map +1 -0
  567. package/dist/integrations/cloud/llm/types.d.ts +24 -0
  568. package/dist/integrations/cloud/llm/types.d.ts.map +1 -0
  569. package/dist/integrations/cloud/llm/types.js +1 -0
  570. package/dist/integrations/cloud/llm/types.js.map +1 -0
  571. package/dist/integrations/cloud/llm/validate.d.ts +6 -0
  572. package/dist/integrations/cloud/llm/validate.d.ts.map +1 -0
  573. package/dist/integrations/cloud/llm/validate.js +63 -0
  574. package/dist/integrations/cloud/llm/validate.js.map +1 -0
  575. package/dist/logger.d.ts +4 -1
  576. package/dist/logger.d.ts.map +1 -1
  577. package/dist/logger.js +71 -30
  578. package/dist/logger.js.map +1 -1
  579. package/dist/pdf-parse.d.js +1 -0
  580. package/dist/pdf-parse.d.js.map +1 -0
  581. package/dist/plugins/loader.d.ts +20 -0
  582. package/dist/plugins/loader.d.ts.map +1 -0
  583. package/dist/plugins/loader.js +157 -0
  584. package/dist/plugins/loader.js.map +1 -0
  585. package/dist/plugins/registry.d.ts +26 -0
  586. package/dist/plugins/registry.d.ts.map +1 -0
  587. package/dist/plugins/registry.js +71 -0
  588. package/dist/plugins/registry.js.map +1 -0
  589. package/dist/plugins/validate.d.ts +9 -0
  590. package/dist/plugins/validate.d.ts.map +1 -0
  591. package/dist/plugins/validate.js +79 -0
  592. package/dist/plugins/validate.js.map +1 -0
  593. package/dist/providers/embed-provider.d.ts +11 -0
  594. package/dist/providers/embed-provider.d.ts.map +1 -0
  595. package/dist/providers/embed-provider.js +24 -0
  596. package/dist/providers/embed-provider.js.map +1 -0
  597. package/dist/providers/extract-provider.d.ts +23 -0
  598. package/dist/providers/extract-provider.d.ts.map +1 -0
  599. package/dist/providers/extract-provider.js +25 -0
  600. package/dist/providers/extract-provider.js.map +1 -0
  601. package/dist/providers/rerank-provider.d.ts +16 -0
  602. package/dist/providers/rerank-provider.d.ts.map +1 -0
  603. package/dist/providers/rerank-provider.js +28 -0
  604. package/dist/providers/rerank-provider.js.map +1 -0
  605. package/dist/providers/search-provider.d.ts +25 -0
  606. package/dist/providers/search-provider.d.ts.map +1 -0
  607. package/dist/providers/search-provider.js +44 -0
  608. package/dist/providers/search-provider.js.map +1 -0
  609. package/dist/providers/vector-store.d.ts +27 -0
  610. package/dist/providers/vector-store.d.ts.map +1 -0
  611. package/dist/providers/vector-store.js +27 -0
  612. package/dist/providers/vector-store.js.map +1 -0
  613. package/dist/python-env.d.ts +9 -0
  614. package/dist/python-env.d.ts.map +1 -0
  615. package/dist/python-env.js +13 -0
  616. package/dist/python-env.js.map +1 -0
  617. package/dist/repl/commands/agent.d.ts +5 -0
  618. package/dist/repl/commands/agent.d.ts.map +1 -0
  619. package/dist/repl/commands/agent.js +62 -0
  620. package/dist/repl/commands/agent.js.map +1 -0
  621. package/dist/repl/commands/cache.d.ts +4 -0
  622. package/dist/repl/commands/cache.d.ts.map +1 -0
  623. package/dist/repl/commands/cache.js +43 -0
  624. package/dist/repl/commands/cache.js.map +1 -0
  625. package/dist/repl/commands/crawl.d.ts +7 -0
  626. package/dist/repl/commands/crawl.d.ts.map +1 -0
  627. package/dist/repl/commands/crawl.js +44 -0
  628. package/dist/repl/commands/crawl.js.map +1 -0
  629. package/dist/repl/commands/extract.d.ts +5 -0
  630. package/dist/repl/commands/extract.d.ts.map +1 -0
  631. package/dist/repl/commands/extract.js +47 -0
  632. package/dist/repl/commands/extract.js.map +1 -0
  633. package/dist/repl/commands/fetch.d.ts +5 -0
  634. package/dist/repl/commands/fetch.d.ts.map +1 -0
  635. package/dist/repl/commands/fetch.js +67 -0
  636. package/dist/repl/commands/fetch.js.map +1 -0
  637. package/dist/repl/commands/find-similar.d.ts +5 -0
  638. package/dist/repl/commands/find-similar.d.ts.map +1 -0
  639. package/dist/repl/commands/find-similar.js +74 -0
  640. package/dist/repl/commands/find-similar.js.map +1 -0
  641. package/dist/repl/commands/research.d.ts +5 -0
  642. package/dist/repl/commands/research.d.ts.map +1 -0
  643. package/dist/repl/commands/research.js +65 -0
  644. package/dist/repl/commands/research.js.map +1 -0
  645. package/dist/repl/commands/search.d.ts +5 -0
  646. package/dist/repl/commands/search.d.ts.map +1 -0
  647. package/dist/repl/commands/search.js +74 -0
  648. package/dist/repl/commands/search.js.map +1 -0
  649. package/dist/repl/commands/types.d.ts +9 -0
  650. package/dist/repl/commands/types.d.ts.map +1 -0
  651. package/dist/repl/commands/types.js +1 -0
  652. package/dist/repl/commands/types.js.map +1 -0
  653. package/dist/repl/formatters.d.ts +13 -0
  654. package/dist/repl/formatters.d.ts.map +1 -0
  655. package/dist/repl/formatters.js +283 -0
  656. package/dist/repl/formatters.js.map +1 -0
  657. package/dist/repl/parser.d.ts +9 -0
  658. package/dist/repl/parser.d.ts.map +1 -0
  659. package/dist/repl/parser.js +86 -0
  660. package/dist/repl/parser.js.map +1 -0
  661. package/dist/repl/shell.d.ts +8 -0
  662. package/dist/repl/shell.d.ts.map +1 -0
  663. package/dist/repl/shell.js +184 -0
  664. package/dist/repl/shell.js.map +1 -0
  665. package/dist/research/branch-exploration.d.ts +14 -0
  666. package/dist/research/branch-exploration.d.ts.map +1 -0
  667. package/dist/research/branch-exploration.js +100 -0
  668. package/dist/research/branch-exploration.js.map +1 -0
  669. package/dist/research/brief.d.ts +5 -0
  670. package/dist/research/brief.d.ts.map +1 -0
  671. package/dist/research/brief.js +242 -0
  672. package/dist/research/brief.js.map +1 -0
  673. package/dist/research/citation-graph.d.ts +9 -0
  674. package/dist/research/citation-graph.d.ts.map +1 -0
  675. package/dist/research/citation-graph.js +114 -0
  676. package/dist/research/citation-graph.js.map +1 -0
  677. package/dist/research/decompose.d.ts +14 -0
  678. package/dist/research/decompose.d.ts.map +1 -0
  679. package/dist/research/decompose.js +439 -0
  680. package/dist/research/decompose.js.map +1 -0
  681. package/dist/research/pipeline.d.ts +5 -0
  682. package/dist/research/pipeline.d.ts.map +1 -0
  683. package/dist/research/pipeline.js +269 -0
  684. package/dist/research/pipeline.js.map +1 -0
  685. package/dist/research/synthesis-local.d.ts +16 -0
  686. package/dist/research/synthesis-local.d.ts.map +1 -0
  687. package/dist/research/synthesis-local.js +73 -0
  688. package/dist/research/synthesis-local.js.map +1 -0
  689. package/dist/research/synthesize.d.ts +10 -0
  690. package/dist/research/synthesize.d.ts.map +1 -0
  691. package/dist/research/synthesize.js +137 -0
  692. package/dist/research/synthesize.js.map +1 -0
  693. package/dist/search/answer-synthesis.d.ts +33 -0
  694. package/dist/search/answer-synthesis.d.ts.map +1 -0
  695. package/dist/search/answer-synthesis.js +244 -0
  696. package/dist/search/answer-synthesis.js.map +1 -0
  697. package/dist/search/context-formatter.d.ts +3 -0
  698. package/dist/search/context-formatter.d.ts.map +1 -0
  699. package/dist/search/context-formatter.js +56 -0
  700. package/dist/search/context-formatter.js.map +1 -0
  701. package/dist/search/dedup.d.ts +1 -0
  702. package/dist/search/dedup.d.ts.map +1 -1
  703. package/dist/search/dedup.js +40 -32
  704. package/dist/search/dedup.js.map +1 -1
  705. package/dist/search/engines/arxiv.d.ts +7 -0
  706. package/dist/search/engines/arxiv.d.ts.map +1 -0
  707. package/dist/search/engines/arxiv.js +70 -0
  708. package/dist/search/engines/arxiv.js.map +1 -0
  709. package/dist/search/engines/bing-news.d.ts +7 -0
  710. package/dist/search/engines/bing-news.d.ts.map +1 -0
  711. package/dist/search/engines/bing-news.js +97 -0
  712. package/dist/search/engines/bing-news.js.map +1 -0
  713. package/dist/search/engines/bing.d.ts +1 -0
  714. package/dist/search/engines/bing.d.ts.map +1 -1
  715. package/dist/search/engines/bing.js +100 -44
  716. package/dist/search/engines/bing.js.map +1 -1
  717. package/dist/search/engines/devdocs.d.ts +6 -0
  718. package/dist/search/engines/devdocs.d.ts.map +1 -0
  719. package/dist/search/engines/devdocs.js +56 -0
  720. package/dist/search/engines/devdocs.js.map +1 -0
  721. package/dist/search/engines/duckduckgo.d.ts.map +1 -1
  722. package/dist/search/engines/duckduckgo.js +56 -44
  723. package/dist/search/engines/duckduckgo.js.map +1 -1
  724. package/dist/search/engines/github-code.d.ts +7 -0
  725. package/dist/search/engines/github-code.d.ts.map +1 -0
  726. package/dist/search/engines/github-code.js +55 -0
  727. package/dist/search/engines/github-code.js.map +1 -0
  728. package/dist/search/engines/hn-algolia.d.ts +7 -0
  729. package/dist/search/engines/hn-algolia.d.ts.map +1 -0
  730. package/dist/search/engines/hn-algolia.js +76 -0
  731. package/dist/search/engines/hn-algolia.js.map +1 -0
  732. package/dist/search/engines/lobsters.d.ts +7 -0
  733. package/dist/search/engines/lobsters.d.ts.map +1 -0
  734. package/dist/search/engines/lobsters.js +83 -0
  735. package/dist/search/engines/lobsters.js.map +1 -0
  736. package/dist/search/engines/mdn.d.ts +7 -0
  737. package/dist/search/engines/mdn.d.ts.map +1 -0
  738. package/dist/search/engines/mdn.js +48 -0
  739. package/dist/search/engines/mdn.js.map +1 -0
  740. package/dist/search/engines/semantic-scholar.d.ts +7 -0
  741. package/dist/search/engines/semantic-scholar.d.ts.map +1 -0
  742. package/dist/search/engines/semantic-scholar.js +69 -0
  743. package/dist/search/engines/semantic-scholar.js.map +1 -0
  744. package/dist/search/engines/stackoverflow.d.ts +7 -0
  745. package/dist/search/engines/stackoverflow.d.ts.map +1 -0
  746. package/dist/search/engines/stackoverflow.js +73 -0
  747. package/dist/search/engines/stackoverflow.js.map +1 -0
  748. package/dist/search/engines/startpage.d.ts.map +1 -1
  749. package/dist/search/engines/startpage.js +65 -46
  750. package/dist/search/engines/startpage.js.map +1 -1
  751. package/dist/search/evidence.d.ts +25 -0
  752. package/dist/search/evidence.d.ts.map +1 -0
  753. package/dist/search/evidence.js +220 -0
  754. package/dist/search/evidence.js.map +1 -0
  755. package/dist/search/filters.js +49 -55
  756. package/dist/search/filters.js.map +1 -1
  757. package/dist/search/find-similar/crawl-rank.d.ts +9 -0
  758. package/dist/search/find-similar/crawl-rank.d.ts.map +1 -0
  759. package/dist/search/find-similar/crawl-rank.js +272 -0
  760. package/dist/search/find-similar/crawl-rank.js.map +1 -0
  761. package/dist/search/find-similar/mode.d.ts +4 -0
  762. package/dist/search/find-similar/mode.d.ts.map +1 -0
  763. package/dist/search/find-similar/mode.js +12 -0
  764. package/dist/search/find-similar/mode.js.map +1 -0
  765. package/dist/search/find-similar.d.ts +5 -0
  766. package/dist/search/find-similar.d.ts.map +1 -0
  767. package/dist/search/find-similar.js +509 -0
  768. package/dist/search/find-similar.js.map +1 -0
  769. package/dist/search/highlights.d.ts +19 -0
  770. package/dist/search/highlights.d.ts.map +1 -0
  771. package/dist/search/highlights.js +167 -0
  772. package/dist/search/highlights.js.map +1 -0
  773. package/dist/search/language-filter.d.ts +29 -0
  774. package/dist/search/language-filter.d.ts.map +1 -0
  775. package/dist/search/language-filter.js +126 -0
  776. package/dist/search/language-filter.js.map +1 -0
  777. package/dist/search/legacy/searxng-orchestrator.d.ts +4 -0
  778. package/dist/search/legacy/searxng-orchestrator.d.ts.map +1 -0
  779. package/dist/search/legacy/searxng-orchestrator.js +501 -0
  780. package/dist/search/legacy/searxng-orchestrator.js.map +1 -0
  781. package/dist/search/legacy/searxng-provider.d.ts +7 -0
  782. package/dist/search/legacy/searxng-provider.d.ts.map +1 -0
  783. package/dist/search/legacy/searxng-provider.js +11 -0
  784. package/dist/search/legacy/searxng-provider.js.map +1 -0
  785. package/dist/search/multi-query.d.ts +25 -0
  786. package/dist/search/multi-query.d.ts.map +1 -0
  787. package/dist/search/multi-query.js +228 -0
  788. package/dist/search/multi-query.js.map +1 -0
  789. package/dist/search/query.js +32 -34
  790. package/dist/search/query.js.map +1 -1
  791. package/dist/search/rerank.d.ts +3 -1
  792. package/dist/search/rerank.d.ts.map +1 -1
  793. package/dist/search/rerank.js +44 -35
  794. package/dist/search/rerank.js.map +1 -1
  795. package/dist/search/reranker/authority-boost.d.ts +3 -0
  796. package/dist/search/reranker/authority-boost.d.ts.map +1 -0
  797. package/dist/search/reranker/authority-boost.js +179 -0
  798. package/dist/search/reranker/authority-boost.js.map +1 -0
  799. package/dist/search/reranker/consensus-boost.d.ts +3 -0
  800. package/dist/search/reranker/consensus-boost.d.ts.map +1 -0
  801. package/dist/search/reranker/consensus-boost.js +27 -0
  802. package/dist/search/reranker/consensus-boost.js.map +1 -0
  803. package/dist/search/reranker/recency-boost.d.ts +3 -0
  804. package/dist/search/reranker/recency-boost.d.ts.map +1 -0
  805. package/dist/search/reranker/recency-boost.js +13 -0
  806. package/dist/search/reranker/recency-boost.js.map +1 -0
  807. package/dist/search/reranker/recency.d.ts +3 -0
  808. package/dist/search/reranker/recency.d.ts.map +1 -0
  809. package/dist/search/reranker/recency.js +23 -0
  810. package/dist/search/reranker/recency.js.map +1 -0
  811. package/dist/search/reranker/transformers-rerank-provider.d.ts +12 -0
  812. package/dist/search/reranker/transformers-rerank-provider.d.ts.map +1 -0
  813. package/dist/search/reranker/transformers-rerank-provider.js +78 -0
  814. package/dist/search/reranker/transformers-rerank-provider.js.map +1 -0
  815. package/dist/search/rrf.d.ts +17 -0
  816. package/dist/search/rrf.d.ts.map +1 -0
  817. package/dist/search/rrf.js +39 -0
  818. package/dist/search/rrf.js.map +1 -0
  819. package/dist/search/sampling.d.ts +25 -0
  820. package/dist/search/sampling.d.ts.map +1 -0
  821. package/dist/search/sampling.js +52 -0
  822. package/dist/search/sampling.js.map +1 -0
  823. package/dist/search/searxng.d.ts.map +1 -1
  824. package/dist/search/searxng.js +69 -79
  825. package/dist/search/searxng.js.map +1 -1
  826. package/dist/search/tokens.d.ts +3 -0
  827. package/dist/search/tokens.d.ts.map +1 -0
  828. package/dist/search/tokens.js +39 -0
  829. package/dist/search/tokens.js.map +1 -0
  830. package/dist/search/truncate.d.ts +6 -0
  831. package/dist/search/truncate.d.ts.map +1 -0
  832. package/dist/search/truncate.js +26 -0
  833. package/dist/search/truncate.js.map +1 -0
  834. package/dist/search/url-unwrap.d.ts +3 -0
  835. package/dist/search/url-unwrap.d.ts.map +1 -0
  836. package/dist/search/url-unwrap.js +43 -0
  837. package/dist/search/url-unwrap.js.map +1 -0
  838. package/dist/search/v1/context-rank.d.ts +13 -0
  839. package/dist/search/v1/context-rank.d.ts.map +1 -0
  840. package/dist/search/v1/context-rank.js +74 -0
  841. package/dist/search/v1/context-rank.js.map +1 -0
  842. package/dist/search/v1/engine-base.d.ts +27 -0
  843. package/dist/search/v1/engine-base.d.ts.map +1 -0
  844. package/dist/search/v1/engine-base.js +110 -0
  845. package/dist/search/v1/engine-base.js.map +1 -0
  846. package/dist/search/v1/intent-router.d.ts +22 -0
  847. package/dist/search/v1/intent-router.d.ts.map +1 -0
  848. package/dist/search/v1/intent-router.js +138 -0
  849. package/dist/search/v1/intent-router.js.map +1 -0
  850. package/dist/search/v1/orchestrator.d.ts +24 -0
  851. package/dist/search/v1/orchestrator.d.ts.map +1 -0
  852. package/dist/search/v1/orchestrator.js +163 -0
  853. package/dist/search/v1/orchestrator.js.map +1 -0
  854. package/dist/search/v1/recency-boost.d.ts +9 -0
  855. package/dist/search/v1/recency-boost.d.ts.map +1 -0
  856. package/dist/search/v1/recency-boost.js +37 -0
  857. package/dist/search/v1/recency-boost.js.map +1 -0
  858. package/dist/search/v1/recent-cache-dedup.d.ts +6 -0
  859. package/dist/search/v1/recent-cache-dedup.d.ts.map +1 -0
  860. package/dist/search/v1/recent-cache-dedup.js +85 -0
  861. package/dist/search/v1/recent-cache-dedup.js.map +1 -0
  862. package/dist/search/v1/rss/feed-config.d.ts +21 -0
  863. package/dist/search/v1/rss/feed-config.d.ts.map +1 -0
  864. package/dist/search/v1/rss/feed-config.js +90 -0
  865. package/dist/search/v1/rss/feed-config.js.map +1 -0
  866. package/dist/search/v1/rss/feed-parser.d.ts +14 -0
  867. package/dist/search/v1/rss/feed-parser.d.ts.map +1 -0
  868. package/dist/search/v1/rss/feed-parser.js +104 -0
  869. package/dist/search/v1/rss/feed-parser.js.map +1 -0
  870. package/dist/search/v1/rss/feed-poller.d.ts +22 -0
  871. package/dist/search/v1/rss/feed-poller.d.ts.map +1 -0
  872. package/dist/search/v1/rss/feed-poller.js +102 -0
  873. package/dist/search/v1/rss/feed-poller.js.map +1 -0
  874. package/dist/search/v1/rss/feed-store.d.ts +30 -0
  875. package/dist/search/v1/rss/feed-store.d.ts.map +1 -0
  876. package/dist/search/v1/rss/feed-store.js +134 -0
  877. package/dist/search/v1/rss/feed-store.js.map +1 -0
  878. package/dist/search/v1/rss/rss-engine.d.ts +6 -0
  879. package/dist/search/v1/rss/rss-engine.d.ts.map +1 -0
  880. package/dist/search/v1/rss/rss-engine.js +28 -0
  881. package/dist/search/v1/rss/rss-engine.js.map +1 -0
  882. package/dist/search/v1/v1-provider.d.ts +7 -0
  883. package/dist/search/v1/v1-provider.d.ts.map +1 -0
  884. package/dist/search/v1/v1-provider.js +68 -0
  885. package/dist/search/v1/v1-provider.js.map +1 -0
  886. package/dist/search/v1/verticals/code.d.ts +4 -0
  887. package/dist/search/v1/verticals/code.d.ts.map +1 -0
  888. package/dist/search/v1/verticals/code.js +20 -0
  889. package/dist/search/v1/verticals/code.js.map +1 -0
  890. package/dist/search/v1/verticals/docs.d.ts +4 -0
  891. package/dist/search/v1/verticals/docs.d.ts.map +1 -0
  892. package/dist/search/v1/verticals/docs.js +20 -0
  893. package/dist/search/v1/verticals/docs.js.map +1 -0
  894. package/dist/search/v1/verticals/general.d.ts +4 -0
  895. package/dist/search/v1/verticals/general.d.ts.map +1 -0
  896. package/dist/search/v1/verticals/general.js +22 -0
  897. package/dist/search/v1/verticals/general.js.map +1 -0
  898. package/dist/search/v1/verticals/news.d.ts +10 -0
  899. package/dist/search/v1/verticals/news.d.ts.map +1 -0
  900. package/dist/search/v1/verticals/news.js +52 -0
  901. package/dist/search/v1/verticals/news.js.map +1 -0
  902. package/dist/search/v1/verticals/papers.d.ts +4 -0
  903. package/dist/search/v1/verticals/papers.d.ts.map +1 -0
  904. package/dist/search/v1/verticals/papers.js +23 -0
  905. package/dist/search/v1/verticals/papers.js.map +1 -0
  906. package/dist/search/validator.js +31 -31
  907. package/dist/search/validator.js.map +1 -1
  908. package/dist/searxng/bootstrap.d.ts +30 -0
  909. package/dist/searxng/bootstrap.d.ts.map +1 -1
  910. package/dist/searxng/bootstrap.js +223 -85
  911. package/dist/searxng/bootstrap.js.map +1 -1
  912. package/dist/searxng/docker.d.ts.map +1 -1
  913. package/dist/searxng/docker.js +69 -60
  914. package/dist/searxng/docker.js.map +1 -1
  915. package/dist/searxng/process.d.ts +13 -1
  916. package/dist/searxng/process.d.ts.map +1 -1
  917. package/dist/searxng/process.js +231 -164
  918. package/dist/searxng/process.js.map +1 -1
  919. package/dist/server/backend-status.d.ts +13 -0
  920. package/dist/server/backend-status.d.ts.map +1 -0
  921. package/dist/server/backend-status.js +40 -0
  922. package/dist/server/backend-status.js.map +1 -0
  923. package/dist/server/tool-schemas.d.ts +549 -0
  924. package/dist/server/tool-schemas.d.ts.map +1 -0
  925. package/dist/server/tool-schemas.js +464 -0
  926. package/dist/server/tool-schemas.js.map +1 -0
  927. package/dist/server/warmup-on-start.d.ts +9 -0
  928. package/dist/server/warmup-on-start.d.ts.map +1 -0
  929. package/dist/server/warmup-on-start.js +55 -0
  930. package/dist/server/warmup-on-start.js.map +1 -0
  931. package/dist/server.d.ts +17 -0
  932. package/dist/server.d.ts.map +1 -1
  933. package/dist/server.js +454 -297
  934. package/dist/server.js.map +1 -1
  935. package/dist/tools/agent.d.ts +5 -0
  936. package/dist/tools/agent.d.ts.map +1 -0
  937. package/dist/tools/agent.js +128 -0
  938. package/dist/tools/agent.js.map +1 -0
  939. package/dist/tools/cache.d.ts +2 -1
  940. package/dist/tools/cache.d.ts.map +1 -1
  941. package/dist/tools/cache.js +175 -44
  942. package/dist/tools/cache.js.map +1 -1
  943. package/dist/tools/crawl.d.ts.map +1 -1
  944. package/dist/tools/crawl.js +171 -88
  945. package/dist/tools/crawl.js.map +1 -1
  946. package/dist/tools/extract.d.ts +2 -2
  947. package/dist/tools/extract.d.ts.map +1 -1
  948. package/dist/tools/extract.js +175 -59
  949. package/dist/tools/extract.js.map +1 -1
  950. package/dist/tools/fetch.d.ts +2 -2
  951. package/dist/tools/fetch.d.ts.map +1 -1
  952. package/dist/tools/fetch.js +161 -68
  953. package/dist/tools/fetch.js.map +1 -1
  954. package/dist/tools/find-similar.d.ts +5 -0
  955. package/dist/tools/find-similar.d.ts.map +1 -0
  956. package/dist/tools/find-similar.js +127 -0
  957. package/dist/tools/find-similar.js.map +1 -0
  958. package/dist/tools/research.d.ts +5 -0
  959. package/dist/tools/research.d.ts.map +1 -0
  960. package/dist/tools/research.js +107 -0
  961. package/dist/tools/research.js.map +1 -0
  962. package/dist/tools/search.d.ts +10 -2
  963. package/dist/tools/search.d.ts.map +1 -1
  964. package/dist/tools/search.js +13 -158
  965. package/dist/tools/search.js.map +1 -1
  966. package/dist/types.d.ts +350 -7
  967. package/dist/types.d.ts.map +1 -1
  968. package/dist/types.js +6 -1
  969. package/dist/types.js.map +1 -1
  970. package/dist/util/mode.d.ts +4 -0
  971. package/dist/util/mode.d.ts.map +1 -0
  972. package/dist/util/mode.js +34 -0
  973. package/dist/util/mode.js.map +1 -0
  974. package/package.json +78 -8
  975. package/dist/extraction/trafilatura.d.ts +0 -6
  976. package/dist/extraction/trafilatura.d.ts.map +0 -1
  977. package/dist/extraction/trafilatura.js +0 -105
  978. package/dist/extraction/trafilatura.js.map +0 -1
  979. package/dist/search/flashrank.d.ts +0 -12
  980. package/dist/search/flashrank.d.ts.map +0 -1
  981. package/dist/search/flashrank.js +0 -63
  982. package/dist/search/flashrank.js.map +0 -1
@@ -0,0 +1,509 @@
1
+ import { extractKeyTerms, buildFTS5Query } from "../embedding/key-terms.js";
2
+ import { reciprocalRankFusion, sortByRRFScore } from "./rrf.js";
3
+ import { searchCache, getCachedContent, normalizeUrl, getCacheStats } from "../cache/store.js";
4
+ import { filterByDomains } from "./filters.js";
5
+ import { handleSearch } from "../tools/search.js";
6
+ import { getExtractProvider } from "../providers/extract-provider.js";
7
+ import { getEmbeddingService } from "../embedding/embed.js";
8
+ import { createLogger } from "../logger.js";
9
+ import { selectMode } from "./find-similar/mode.js";
10
+ import { crawlRank } from "./find-similar/crawl-rank.js";
11
/** Module-level logger created for the "search" scope. */
const log = createLogger("search");

/** Result cap applied when the caller does not supply `max_results`. */
const DEFAULT_MAX_RESULTS = 10;

/** Upper bound on cached candidates kept from the FTS5 keyword search. */
const MAX_FTS5_CANDIDATES = 20;

/** `topK` requested from the embedding index on each similarity lookup. */
const MAX_EMBEDDING_CANDIDATES = 20;

/** Presumably the number of queries issued by the web-search fallback (its use is outside this excerpt). */
const WEB_SEARCH_QUERY_COUNT = 3;
16
/**
 * Find pages similar to a seed URL or a free-text concept.
 *
 * Flow:
 *  1. If `selectMode(input)` yields "crawl-rank", delegate to `crawlRank`.
 *  2. Otherwise derive a signal (key terms + query text) from the URL or concept.
 *  3. Query the local cache via FTS5 and, when available, the embedding index.
 *  4. If local hits are fewer than `max_results` and web search is allowed,
 *     run the web-search fallback and re-query the embedding index.
 *  5. Fuse the per-source rank maps and build the response.
 *
 * Never throws: any failure is reported through the `error` field of the
 * returned object.
 *
 * @param input Request options. Fields read here: `url`, `concept`,
 *   `max_results`, `include_cache`, `include_web`, `include_domains`,
 *   `exclude_domains`.
 * @param engines Passed through to the web-search fallback.
 * @param router Fetch router used for signal extraction, crawl-rank and web fallback.
 * @param backendStatus Passed through to the web-search fallback.
 * @returns Object with `results`, `method`, `cache_hits`, `search_hits`,
 *   `embedding_available`, `total_time_ms`, and optionally `cold_start` or `error`.
 */
async function findSimilar(input, engines, router, backendStatus) {
  const start = Date.now();
  const embeddingAvailable = checkEmbeddingAvailable();
  const initialCacheSize = safeCacheCount();
  const initialEmbedIndexSize = safeEmbedIndexSize();

  // Single source of truth for every early-exit / failure payload.
  const failure = (error) => ({
    results: [],
    method: "fts5",
    cache_hits: 0,
    search_hits: 0,
    embedding_available: embeddingAvailable,
    error,
    total_time_ms: Date.now() - start
  });

  try {
    const mode = selectMode(input);
    if (mode === "crawl-rank") {
      const seed = input.url?.trim();
      if (!seed) {
        return failure("crawl-rank mode requires a url");
      }
      const cr = await crawlRank(seed, input, router);
      return { ...cr, total_time_ms: Date.now() - start };
    }

    const url = input.url?.trim();
    const concept = input.concept?.trim();
    if (!url && !concept) {
      return failure("Either url or concept must be provided");
    }

    const maxResults = input.max_results ?? DEFAULT_MAX_RESULTS;
    const includeCache = input.include_cache ?? true;
    const includeWeb = input.include_web ?? true;

    const signal = await prepareSignal(url, concept, router);
    if (signal.terms.length === 0 && !signal.queryText) {
      log.warn("no key terms or query text extracted, falling back to web search");
      if (!includeWeb) {
        return failure("Could not extract key terms from input and web search is disabled");
      }
    }

    // Local lookups: keyword (FTS5) and semantic (embeddings) run side by side.
    let cacheResults = [];
    const fts5RankMap = new Map();
    let embeddingResults = [];
    const embeddingRankMap = new Map();
    await Promise.all([
      (async () => {
        if (includeCache && signal.terms.length > 0) {
          cacheResults = runFTS5Search(
            signal.terms,
            signal.inputNormalizedUrl,
            input.include_domains,
            input.exclude_domains,
            MAX_FTS5_CANDIDATES,
            fts5RankMap
          );
          log.debug("FTS5 search complete", { hits: cacheResults.length });
        }
      })(),
      (async () => {
        if (includeCache && embeddingAvailable && signal.queryText) {
          embeddingResults = await runEmbeddingSearch(
            signal.queryText,
            signal.inputNormalizedUrl,
            input.include_domains,
            input.exclude_domains,
            MAX_EMBEDDING_CANDIDATES,
            embeddingRankMap
          );
          log.debug("embedding search complete", { hits: embeddingResults.length });
        }
      })()
    ]);

    let searchResults = [];
    const searchRankMap = new Map();

    // Count distinct local hits (by normalized URL) to decide whether the web is needed.
    const combinedLocalHits = new Set();
    for (const r of cacheResults) combinedLocalHits.add(safeNormalize(r.url));
    for (const r of embeddingResults) combinedLocalHits.add(safeNormalize(r.url));

    if (combinedLocalHits.size < maxResults && includeWeb) {
      searchResults = await runWebSearchFallback(
        signal,
        engines,
        router,
        backendStatus,
        maxResults,
        signal.inputNormalizedUrl,
        input.include_domains,
        input.exclude_domains,
        searchRankMap
      );
      log.debug("web search fallback complete", { hits: searchResults.length });

      if (embeddingAvailable && signal.queryText && searchResults.length > 0) {
        // Rank the second pass into a scratch map. Writing straight into
        // embeddingRankMap would leave stale ranks for URLs that dropped out
        // of the fresh top-K, and a re-run that fails midway would corrupt
        // the ranks of the first-pass results that are still in use.
        const freshRankMap = new Map();
        const freshEmbeddingResults = await runEmbeddingSearch(
          signal.queryText,
          signal.inputNormalizedUrl,
          input.include_domains,
          input.exclude_domains,
          MAX_EMBEDDING_CANDIDATES,
          freshRankMap
        );
        if (freshEmbeddingResults.length > 0) {
          embeddingResults = freshEmbeddingResults;
          embeddingRankMap.clear();
          for (const [key, rank] of freshRankMap) embeddingRankMap.set(key, rank);
          log.debug("re-ran embedding search after web fallback", { hits: embeddingResults.length });
        }
      }
    }

    // Only sources that produced ranks take part in the fusion.
    const rankedLists = [];
    if (fts5RankMap.size > 0) rankedLists.push(fts5RankMap);
    if (embeddingRankMap.size > 0) rankedLists.push(embeddingRankMap);
    if (searchRankMap.size > 0) rankedLists.push(searchRankMap);

    const allResults = mergeResults(cacheResults, embeddingResults, searchResults);
    let finalResults;
    if (rankedLists.length >= 1) {
      finalResults = fuseResults(rankedLists, allResults, maxResults);
    } else {
      finalResults = allResults.sort((a, b) => b.relevance_score - a.relevance_score).slice(0, maxResults);
    }

    const method = determineMethod(
      cacheResults.length > 0,
      embeddingResults.length > 0,
      searchResults.length > 0
    );
    const cacheHits = finalResults.filter((r) => r.source === "cache").length;
    const searchHits = finalResults.filter((r) => r.source === "search").length;
    const coldStart = buildColdStartNote(
      cacheHits,
      embeddingAvailable,
      initialCacheSize,
      initialEmbedIndexSize
    );

    return {
      results: finalResults,
      method,
      cache_hits: cacheHits,
      search_hits: searchHits,
      embedding_available: embeddingAvailable,
      ...(coldStart ? { cold_start: coldStart } : {}),
      total_time_ms: Date.now() - start
    };
  } catch (err) {
    log.error("findSimilar failed", { error: String(err) });
    return failure(`find_similar failed: ${err instanceof Error ? err.message : String(err)}`);
  }
}
181
/**
 * Report whether the embedding service can be used right now.
 *
 * Requires both `isAvailable()` and `isSubprocessReady()` on the service;
 * any exception while obtaining or querying the service counts as "no".
 */
function checkEmbeddingAvailable() {
  try {
    const embedder = getEmbeddingService();
    const available = embedder.isAvailable();
    if (!available) {
      return available;
    }
    return embedder.isSubprocessReady();
  } catch {
    return false;
  }
}
189
/**
 * Read `total_urls` from the cache statistics.
 *
 * @returns The reported count, or 0 when reading the stats throws.
 */
function safeCacheCount() {
  let total = 0;
  try {
    total = getCacheStats().total_urls;
  } catch {
    // Best effort: a stats failure is treated as an empty cache.
  }
  return total;
}
196
/**
 * Read the size of the embedding index.
 *
 * @returns The value of `getIndex().size()`, or 0 when the service or index
 *   cannot be reached.
 */
function safeEmbedIndexSize() {
  try {
    const index = getEmbeddingService().getIndex();
    return index.size();
  } catch {
    return 0;
  }
}
203
/**
 * Build an optional advisory explaining why results may be weak on a cold
 * or partially warmed installation.
 *
 * Checks run in priority order and the first match wins:
 *  1. cache empty;
 *  2. cache populated but embeddings unavailable;
 *  3. no cache hits in the final results and fewer than 20 cached pages;
 *  4. embedding index empty.
 *
 * @param cacheHits Number of final results whose source is the cache.
 * @param embeddingAvailable Whether the embedding service was usable.
 * @param initialCacheSize Cached page count sampled at the start of the call.
 * @param initialEmbedIndexSize Embedding index size sampled at the start of the call.
 * @returns The advisory text, or `undefined` when no note applies.
 */
function buildColdStartNote(cacheHits, embeddingAvailable, initialCacheSize, initialEmbedIndexSize) {
  if (initialCacheSize === 0) {
    return "Cache is empty. Results come from live web search only. Use wigolo_fetch / wigolo_crawl to warm the cache, then re-run find_similar for hybrid local+web ranking.";
  }
  if (!embeddingAvailable && initialCacheSize > 0) {
    return "Embeddings unavailable or index empty (cached pages have not been embedded yet). Falling back to FTS5 keyword ranking. Set up sentence-transformers to enable semantic matching.";
  }
  if (cacheHits === 0 && initialCacheSize < 20) {
    return `Cache has only ${initialCacheSize} pages. Add more context by fetching or crawling relevant sites before relying on find_similar for cross-source similarity.`;
  }
  // Previously this also required `!embeddingAvailable`, which the second
  // check already consumes for any populated cache, so the note never fired
  // in the state it describes: embeddings usable but nothing indexed yet.
  if (initialEmbedIndexSize === 0) {
    return "Embedding index is empty. Semantic matching disabled until background embedding jobs catch up.";
  }
  return void 0;
}
218
/**
 * Normalize a URL without ever throwing.
 *
 * @param url URL to normalize.
 * @returns The result of `normalizeUrl(url)`, or `url` unchanged when
 *   normalization throws.
 */
function safeNormalize(url) {
  let normalized = url;
  try {
    normalized = normalizeUrl(url);
  } catch {
    // Keep the raw URL as the fallback key.
  }
  return normalized;
}
225
/**
 * Combine several result lists into one, de-duplicated by normalized URL.
 *
 * The first occurrence of a URL is kept as the result object. Later
 * duplicates only contribute their `match_signals`, which are merged onto
 * the kept object while its own `fused_score` is preserved. The kept
 * object is updated in place.
 *
 * @param lists Result lists, in priority order.
 * @returns One array with a single entry per normalized URL, in
 *   first-seen order.
 */
function mergeResults(...lists) {
  const byUrl = new Map();
  for (const list of lists) {
    for (const candidate of list) {
      const key = safeNormalize(candidate.url);
      const kept = byUrl.get(key);
      if (!kept) {
        byUrl.set(key, candidate);
        continue;
      }
      // The duplicate's signals win on overlap, except for the fused score.
      const keptFusedScore = kept.match_signals.fused_score;
      kept.match_signals = Object.assign({}, kept.match_signals, candidate.match_signals, {
        fused_score: keptFusedScore
      });
    }
  }
  return Array.from(byUrl.values());
}
244
/**
 * Derive the similarity signal for a request.
 *
 * A URL takes precedence over a concept. With neither, an empty signal is
 * returned.
 *
 * @param url Trimmed seed URL, if any.
 * @param concept Trimmed free-text concept, if any.
 * @param router Fetch router forwarded to URL-based signal extraction.
 * @returns Signal object with at least `terms` and `title`.
 */
async function prepareSignal(url, concept, router) {
  if (url) {
    const fromUrl = await prepareSignalFromUrl(url, router);
    return fromUrl;
  }
  if (!concept) {
    return { terms: [], title: "" };
  }
  // The concept text serves as title and as embedding query text.
  return {
    terms: extractKeyTerms(concept, ""),
    title: concept,
    queryText: concept
  };
}
254
/**
 * Build the similarity signal for a seed URL.
 *
 * Uses the cached copy of the page when one exists. Otherwise it fetches
 * and extracts the page. If that fails, it falls back to key terms derived
 * from the URL string alone, and the signal has no `queryText`.
 *
 * @param url Seed URL.
 * @param router Fetch router used when the page is not cached.
 * @returns Signal with `terms`, `title`, `inputUrl`, `inputNormalizedUrl`
 *   and, when page content was obtained, `queryText`.
 */
async function prepareSignalFromUrl(url, router) {
  // Fall back to the raw URL when it cannot be normalized.
  let inputNormalizedUrl = url;
  try {
    inputNormalizedUrl = normalizeUrl(url);
  } catch {
    // Keep the raw URL.
  }

  // Shared shape for the two paths that have real page content.
  const signalFromContent = (markdown, title) => ({
    terms: extractKeyTerms(markdown, title),
    title,
    inputUrl: url,
    inputNormalizedUrl,
    queryText: markdown
  });

  const cachedPage = getCachedContent(url);
  if (cachedPage) {
    return signalFromContent(cachedPage.markdown, cachedPage.title);
  }

  try {
    log.info("fetching URL for signal extraction", { url });
    const page = await router.fetch(url, { renderJs: "auto" });
    const provider = await getExtractProvider();
    const extracted = await provider.extract(page.html, page.finalUrl, {
      contentType: page.contentType
    });
    return signalFromContent(extracted.markdown, extracted.title);
  } catch (err) {
    log.warn("failed to fetch URL for signal extraction", { url, error: String(err) });
    return {
      terms: extractKeyTerms("", url),
      title: url,
      inputUrl: url,
      inputNormalizedUrl
    };
  }
}
298
/**
 * Query the embedding index for pages similar to `queryText`.
 *
 * Each hit is hydrated from the cache, filtered by domain, then assigned a
 * 1-based rank in the order returned by the service. Ranks are written to
 * `rankMap` under the normalized URL. Any failure is logged and produces an
 * empty list.
 *
 * @param queryText Text to embed and compare against the index.
 * @param excludeNormalizedUrl Normalized URL to exclude from the lookup, if any.
 * @param includeDomains Domain allow-list forwarded to `filterByDomains`.
 * @param excludeDomains Domain deny-list forwarded to `filterByDomains`.
 * @param topK Number of neighbours requested from the service.
 * @param rankMap Output map of normalized URL to embedding rank (mutated).
 * @returns Results with `source: "cache"` and markdown capped at 5000 characters.
 */
async function runEmbeddingSearch(queryText, excludeNormalizedUrl, includeDomains, excludeDomains, topK, rankMap) {
  try {
    const service = getEmbeddingService();
    const ready = service.isAvailable() && service.isSubprocessReady();
    if (!ready) return [];
    if (service.getIndex().size() === 0) return [];

    const excludeUrls = excludeNormalizedUrl ? new Set([excludeNormalizedUrl]) : void 0;
    const neighbours = await service.findSimilar(queryText, topK, excludeUrls);
    if (neighbours.length === 0) return [];

    // Attach cached content; prefer the cached entry's URL for display.
    const candidates = neighbours.map(({ url: nUrl, score }) => {
      const entry = getCachedContent(nUrl);
      return { entry, score, displayUrl: entry?.url ?? nUrl };
    });

    const survivors = filterByDomains(
      candidates.map((c) => ({ url: c.displayUrl })),
      includeDomains,
      excludeDomains
    );
    const permitted = new Set(survivors.map((s) => s.url));

    const results = [];
    for (const { entry, score, displayUrl } of candidates) {
      if (!permitted.has(displayUrl)) continue;
      const rank = results.length + 1;
      rankMap.set(safeNormalize(displayUrl), rank);
      results.push({
        url: displayUrl,
        title: entry?.title ?? displayUrl,
        markdown: (entry?.markdown ?? "").slice(0, 5e3),
        relevance_score: score,
        source: "cache",
        match_signals: {
          embedding_rank: rank,
          fused_score: 0
        }
      });
    }
    return results;
  } catch (err) {
    log.warn("embedding search failed", { error: String(err) });
    return [];
  }
}
341
/**
 * Keyword search over the cache using a query built from `terms`.
 *
 * Hits whose normalised URL equals `excludeNormalizedUrl` are dropped, the
 * domain filters are applied, and the list is cut to `maxCandidates`. Each
 * surviving hit gets a 1-based `fts5_rank` (its position in the list), which
 * is also written to `rankMap` under the hit's normalised URL.
 *
 * @param terms                Key terms used to build the query.
 * @param excludeNormalizedUrl Normalised URL to leave out, if any.
 * @param includeDomains       Forwarded to `filterByDomains`.
 * @param excludeDomains       Forwarded to `filterByDomains`.
 * @param maxCandidates        Upper bound on returned hits.
 * @param rankMap              Map mutated in place: normalised URL -> rank.
 * @returns Result objects with `source: "cache"` and `relevance_score: 0`.
 *          Returns `[]` when no query can be built or any step throws (the
 *          error is logged at error level).
 */
function runFTS5Search(terms, excludeNormalizedUrl, includeDomains, excludeDomains, maxCandidates, rankMap) {
  // Best-effort normalisation: fall back to the raw URL when normalizeUrl throws.
  const normalizeOrRaw = (rawUrl) => {
    try {
      return normalizeUrl(rawUrl);
    } catch {
      return rawUrl;
    }
  };

  try {
    const matchExpression = buildFTS5Query(terms);
    if (!matchExpression) return [];

    const hits = searchCache(matchExpression);
    const withoutSeed = excludeNormalizedUrl
      ? hits.filter((hit) => normalizeOrRaw(hit.url) !== excludeNormalizedUrl)
      : hits;
    const candidates = filterByDomains(withoutSeed, includeDomains, excludeDomains).slice(0, maxCandidates);

    return candidates.map((entry, index) => {
      const rank = index + 1;
      rankMap.set(normalizeOrRaw(entry.url), rank);
      return {
        url: entry.url,
        title: entry.title,
        markdown: entry.markdown.slice(0, 5e3),
        relevance_score: 0,
        source: "cache",
        match_signals: {
          fts5_rank: rank,
          fused_score: 0
        }
      };
    });
  } catch (err) {
    log.error("FTS5 search failed", { error: String(err) });
    return [];
  }
}
385
/**
 * Live web-search fallback used when local (cache/embedding) hits are scarce.
 *
 * Runs each query produced by `generateSearchQueries(signal.terms, signal.title)`
 * through `handleSearch`, de-duplicates hits by normalised URL across queries,
 * and records a 1-based rank per accepted hit in `rankMap`. When the embedding
 * service is ready, up to ten results that have text are embedded and the
 * embeddings are awaited before returning, so a follow-up embedding query in
 * the same request can see them.
 *
 * @param signal               Object with `terms` and `title` for query generation.
 * @param engines              Forwarded to `handleSearch`.
 * @param router               Forwarded to `handleSearch`.
 * @param backendStatus        Forwarded to `handleSearch`.
 * @param maxResults           `max_results` passed to every individual query.
 * @param excludeNormalizedUrl Normalised URL treated as already seen, if any.
 * @param includeDomains       Forwarded as `include_domains`.
 * @param excludeDomains       Forwarded as `exclude_domains`.
 * @param rankMap              Map mutated in place: normalised URL -> rank.
 * @returns Result objects with `source: "search"`. Returns `[]` when no query
 *          can be generated or an unexpected error escapes (logged at error
 *          level). A failure of a single query is logged at warn level and
 *          skipped.
 */
async function runWebSearchFallback(signal, engines, router, backendStatus, maxResults, excludeNormalizedUrl, includeDomains, excludeDomains, rankMap) {
  try {
    const queries = generateSearchQueries(signal.terms, signal.title);
    if (queries.length === 0) return [];

    const allResults = [];
    // Pre-seeding with the input URL keeps the seed page out of its own results.
    const seenUrls = /* @__PURE__ */ new Set();
    if (excludeNormalizedUrl) {
      seenUrls.add(excludeNormalizedUrl);
    }

    for (const query of queries) {
      try {
        const searchResult = await handleSearch(
          {
            query,
            max_results: maxResults,
            include_content: true,
            include_domains: includeDomains,
            exclude_domains: excludeDomains
          },
          engines,
          router,
          backendStatus
        );
        if (!searchResult.ok) {
          log.warn("web search query failed", { query, error: searchResult.error_reason });
          continue;
        }

        for (const item of searchResult.data.results) {
          let nUrl;
          try {
            nUrl = normalizeUrl(item.url);
          } catch {
            nUrl = item.url;
          }
          if (seenUrls.has(nUrl)) continue;
          seenUrls.add(nUrl);

          // A hit may carry neither fetched content nor a snippet. Default to
          // "" so such a hit cannot throw, which would drop the remaining hits
          // of this query. The text is also resolved BEFORE rankMap/allResults
          // are touched, so the two can never disagree about which URLs were
          // accepted.
          const markdown = (item.markdown_content ?? item.snippet ?? "").slice(0, 5e3);

          const rank = allResults.length + 1;
          rankMap.set(nUrl, rank);
          allResults.push({
            url: item.url,
            title: item.title,
            markdown,
            relevance_score: item.relevance_score,
            source: "search",
            match_signals: {
              fused_score: 0
            }
          });
        }
      } catch (err) {
        log.warn("web search query failed", { query, error: String(err) });
      }
    }

    // Embed results and wait for completion so the vectors are in the index
    // by the time this function returns. Capped at 10 items to bound the wait;
    // results with empty text are skipped. Failures here never fail the search.
    try {
      const embeddingService = getEmbeddingService();
      if (embeddingService.isAvailable() && embeddingService.isSubprocessReady()) {
        const embedPromises = allResults
          .filter((r) => r.markdown)
          .slice(0, 10)
          .map((r) => embeddingService.embedAndStore(r.url, r.markdown));
        await Promise.allSettled(embedPromises);
        log.debug("embedded web fallback results", { count: embedPromises.length });
      }
    } catch (err) {
      log.debug("embedding hook skipped for find_similar results", { error: String(err) });
    }

    return allResults;
  } catch (err) {
    log.error("web search fallback failed", { error: String(err) });
    return [];
  }
}
455
/**
 * Derive web-search query strings from extracted key terms and a title.
 *
 * Candidates, in priority order:
 *   1. the title, cut to 150 characters (only if longer than 3 characters);
 *   2. the first five terms joined by spaces (needs at least 3 terms);
 *   3. the first three terms followed by " tutorial guide" (needs at least 2).
 * Duplicates are removed keeping the first occurrence, and at most
 * `WEB_SEARCH_QUERY_COUNT` queries are returned.
 *
 * @param terms Key terms, most important first.
 * @param title Page title or concept text; may be empty.
 * @returns De-duplicated query strings, possibly empty.
 */
function generateSearchQueries(terms, title) {
  if (terms.length === 0 && !title) return [];

  // A Set keeps insertion order, so it de-duplicates while preserving priority.
  const candidates = /* @__PURE__ */ new Set();
  const termCount = terms.length;

  if (title && title.length > 3) {
    candidates.add(title.slice(0, 150));
  }
  if (termCount >= 3) {
    candidates.add(terms.slice(0, 5).join(" "));
  }
  if (termCount >= 2) {
    const leading = terms.slice(0, 3).join(" ");
    candidates.add(`${leading} tutorial guide`);
  }

  return Array.from(candidates).slice(0, WEB_SEARCH_QUERY_COUNT);
}
470
/**
 * Fuse several rank maps into one ordered, size-limited result list.
 *
 * The rank maps go through `reciprocalRankFusion` and `sortByRRFScore`; each
 * fused URL is then matched to the first entry of `allResults` that has the
 * same normalised URL. URLs with no matching result are skipped. The returned
 * objects are copies: `relevance_score` is the fused score divided by the top
 * fused score (so the first sorted entry scores 1), and the raw fused score is
 * kept in `match_signals.fused_score`.
 *
 * @param rankedLists Array of Maps: normalised URL -> rank.
 * @param allResults  Candidate result objects from every source.
 * @param maxResults  Maximum number of results to return.
 * @returns New result objects in fused order; the inputs are not mutated.
 */
function fuseResults(rankedLists, allResults, maxResults) {
  const ranked = sortByRRFScore(reciprocalRankFusion(rankedLists));

  // First result seen for a normalised URL wins.
  const byNormalizedUrl = /* @__PURE__ */ new Map();
  for (const candidate of allResults) {
    const key = safeNormalize(candidate.url);
    if (byNormalizedUrl.has(key)) continue;
    byNormalizedUrl.set(key, candidate);
  }

  const best = ranked.length > 0 ? ranked[0][1] : 0;
  // Scale against the best score; guard the division when there is no positive score.
  const scale = (raw) => (best > 0 ? raw / best : 0);

  const output = [];
  for (const [normalizedUrl, rawScore] of ranked) {
    if (output.length >= maxResults) break;
    const match = byNormalizedUrl.get(normalizedUrl);
    if (!match) continue;
    output.push({
      ...match,
      relevance_score: scale(rawScore),
      match_signals: {
        ...match.match_signals,
        fused_score: rawScore
      }
    });
  }
  return output;
}
498
/**
 * Name the retrieval method that produced the results.
 *
 * @param hasCache     Truthy when the keyword (FTS5) search returned hits.
 * @param hasEmbedding Truthy when the embedding search returned hits.
 * @param hasSearch    Truthy when the web search returned hits.
 * @returns "hybrid" when two or more sources contributed; otherwise
 *          "embedding", "fts5" or "search" for the single contributing
 *          source, and "fts5" when none contributed.
 */
function determineMethod(hasCache, hasEmbedding, hasSearch) {
  let contributing = 0;
  for (const flag of [hasCache, hasEmbedding, hasSearch]) {
    if (flag) contributing += 1;
  }
  if (contributing >= 2) return "hybrid";
  if (hasEmbedding) return "embedding";
  // At most one source is left here, so hasSearch implies hasCache is falsy.
  // Everything else (cache only, or nothing at all) reports "fts5".
  return hasSearch ? "search" : "fts5";
}
506
+ export {
507
+ findSimilar
508
+ };
509
+ //# sourceMappingURL=find-similar.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"sources":["../../src/search/find-similar.ts"],"sourcesContent":["import type {\n FindSimilarInput,\n FindSimilarOutput,\n FindSimilarResult,\n SearchEngine,\n CachedContent,\n} from '../types.js';\nimport type { SmartRouter } from '../fetch/router.js';\nimport type { BackendStatus } from '../server/backend-status.js';\nimport { extractKeyTerms, buildFTS5Query } from '../embedding/key-terms.js';\nimport { reciprocalRankFusion, sortByRRFScore } from './rrf.js';\nimport { searchCache, getCachedContent, normalizeUrl, getCacheStats } from '../cache/store.js';\nimport { filterByDomains } from './filters.js';\nimport { handleSearch } from '../tools/search.js';\nimport { getExtractProvider } from '../providers/extract-provider.js';\nimport { getEmbeddingService } from '../embedding/embed.js';\nimport { createLogger } from '../logger.js';\nimport { selectMode } from './find-similar/mode.js';\nimport { crawlRank } from './find-similar/crawl-rank.js';\n\nconst log = createLogger('search');\n\nconst DEFAULT_MAX_RESULTS = 10;\nconst MAX_FTS5_CANDIDATES = 20;\nconst MAX_EMBEDDING_CANDIDATES = 20;\nconst WEB_SEARCH_QUERY_COUNT = 3;\n\ninterface ResolvedSignal {\n terms: string[];\n title: string;\n inputUrl?: string;\n inputNormalizedUrl?: string;\n queryText?: string;\n}\n\nexport async function findSimilar(\n input: FindSimilarInput,\n engines: SearchEngine[],\n router: SmartRouter,\n backendStatus?: BackendStatus,\n): Promise<FindSimilarOutput> {\n const start = Date.now();\n\n // Probe embedding availability once up front for the whole request\n const embeddingAvailable = checkEmbeddingAvailable();\n\n // Snapshot cache/embedding posture BEFORE the web fallback writes new\n // entries into cache, otherwise the cold-start note would wrongly report a\n // populated cache simply because we just fetched during this call.\n const initialCacheSize = safeCacheCount();\n const initialEmbedIndexSize = safeEmbedIndexSize();\n\n try {\n // Mode dispatch: only 
'crawl-rank' diverts. All other modes (cache,\n // web-expansion, auto) fall through to the existing hybrid flow.\n const mode = selectMode(input);\n if (mode === 'crawl-rank') {\n const seed = input.url?.trim();\n if (!seed) {\n return {\n results: [],\n method: 'fts5',\n cache_hits: 0,\n search_hits: 0,\n embedding_available: embeddingAvailable,\n error: 'crawl-rank mode requires a url',\n total_time_ms: Date.now() - start,\n };\n }\n const cr = await crawlRank(seed, input, router);\n return { ...cr, total_time_ms: Date.now() - start };\n }\n\n const url = input.url?.trim();\n const concept = input.concept?.trim();\n\n if (!url && !concept) {\n return {\n results: [],\n method: 'fts5',\n cache_hits: 0,\n search_hits: 0,\n embedding_available: embeddingAvailable,\n error: 'Either url or concept must be provided',\n total_time_ms: Date.now() - start,\n };\n }\n\n const maxResults = input.max_results ?? DEFAULT_MAX_RESULTS;\n const includeCache = input.include_cache ?? true;\n const includeWeb = input.include_web ?? 
true;\n\n const signal = await prepareSignal(url, concept, router);\n\n if (signal.terms.length === 0 && !signal.queryText) {\n log.warn('no key terms or query text extracted, falling back to web search');\n\n if (!includeWeb) {\n return {\n results: [],\n method: 'fts5',\n cache_hits: 0,\n search_hits: 0,\n embedding_available: embeddingAvailable,\n error: 'Could not extract key terms from input and web search is disabled',\n total_time_ms: Date.now() - start,\n };\n }\n }\n\n // Phase 1: FTS5 + embedding in parallel (both hit local state, cheap)\n let cacheResults: FindSimilarResult[] = [];\n const fts5RankMap = new Map<string, number>();\n let embeddingResults: FindSimilarResult[] = [];\n const embeddingRankMap = new Map<string, number>();\n\n await Promise.all([\n (async () => {\n if (includeCache && signal.terms.length > 0) {\n cacheResults = runFTS5Search(\n signal.terms,\n signal.inputNormalizedUrl,\n input.include_domains,\n input.exclude_domains,\n MAX_FTS5_CANDIDATES,\n fts5RankMap,\n );\n log.debug('FTS5 search complete', { hits: cacheResults.length });\n }\n })(),\n (async () => {\n if (includeCache && embeddingAvailable && signal.queryText) {\n embeddingResults = await runEmbeddingSearch(\n signal.queryText,\n signal.inputNormalizedUrl,\n input.include_domains,\n input.exclude_domains,\n MAX_EMBEDDING_CANDIDATES,\n embeddingRankMap,\n );\n log.debug('embedding search complete', { hits: embeddingResults.length });\n }\n })(),\n ]);\n\n // Phase 2: Web search fallback (only if combined unique local hits < maxResults)\n let searchResults: FindSimilarResult[] = [];\n const searchRankMap = new Map<string, number>();\n\n const combinedLocalHits = new Set<string>();\n for (const r of cacheResults) combinedLocalHits.add(safeNormalize(r.url));\n for (const r of embeddingResults) combinedLocalHits.add(safeNormalize(r.url));\n\n if (combinedLocalHits.size < maxResults && includeWeb) {\n searchResults = await runWebSearchFallback(\n signal,\n engines,\n router,\n 
backendStatus,\n maxResults,\n signal.inputNormalizedUrl,\n input.include_domains,\n input.exclude_domains,\n searchRankMap,\n );\n log.debug('web search fallback complete', { hits: searchResults.length });\n\n // After web fallback, re-run embedding search against newly-populated index.\n // The web fallback used embedAndStore() (awaited) so vectors are already in\n // the index — no sleep needed, just re-query.\n if (embeddingAvailable && signal.queryText && searchResults.length > 0) {\n const freshEmbeddingResults = await runEmbeddingSearch(\n signal.queryText,\n signal.inputNormalizedUrl,\n input.include_domains,\n input.exclude_domains,\n MAX_EMBEDDING_CANDIDATES,\n embeddingRankMap,\n );\n\n if (freshEmbeddingResults.length > 0) {\n embeddingResults = freshEmbeddingResults;\n log.debug('re-ran embedding search after web fallback', { hits: embeddingResults.length });\n }\n }\n }\n\n // Phase 3: 3-way RRF fusion\n const rankedLists: Map<string, number>[] = [];\n if (fts5RankMap.size > 0) rankedLists.push(fts5RankMap);\n if (embeddingRankMap.size > 0) rankedLists.push(embeddingRankMap);\n if (searchRankMap.size > 0) rankedLists.push(searchRankMap);\n\n const allResults = mergeResults(cacheResults, embeddingResults, searchResults);\n\n let finalResults: FindSimilarResult[];\n\n if (rankedLists.length >= 1) {\n finalResults = fuseResults(rankedLists, allResults, maxResults);\n } else {\n finalResults = allResults\n .sort((a, b) => b.relevance_score - a.relevance_score)\n .slice(0, maxResults);\n }\n\n const method = determineMethod(\n cacheResults.length > 0,\n embeddingResults.length > 0,\n searchResults.length > 0,\n );\n\n const cacheHits = finalResults.filter(r => r.source === 'cache').length;\n const searchHits = finalResults.filter(r => r.source === 'search').length;\n\n const coldStart = buildColdStartNote(\n cacheHits,\n embeddingAvailable,\n initialCacheSize,\n initialEmbedIndexSize,\n );\n\n return {\n results: finalResults,\n method,\n cache_hits: 
cacheHits,\n search_hits: searchHits,\n embedding_available: embeddingAvailable,\n ...(coldStart ? { cold_start: coldStart } : {}),\n total_time_ms: Date.now() - start,\n };\n } catch (err) {\n log.error('findSimilar failed', { error: String(err) });\n return {\n results: [],\n method: 'fts5',\n cache_hits: 0,\n search_hits: 0,\n embedding_available: embeddingAvailable,\n error: `find_similar failed: ${err instanceof Error ? err.message : String(err)}`,\n total_time_ms: Date.now() - start,\n };\n }\n}\n\nfunction checkEmbeddingAvailable(): boolean {\n try {\n const svc = getEmbeddingService();\n // Available = service initialized + subprocess verified (Python + model work).\n // We no longer require index.size() > 0 because the embedding path can\n // generate query embeddings on-the-fly and compare against freshly-embedded\n // web fallback results within the same request.\n return svc.isAvailable() && svc.isSubprocessReady();\n } catch {\n return false;\n }\n}\n\nfunction safeCacheCount(): number {\n try {\n return getCacheStats().total_urls;\n } catch {\n return 0;\n }\n}\n\nfunction safeEmbedIndexSize(): number {\n try {\n return getEmbeddingService().getIndex().size();\n } catch {\n return 0;\n }\n}\n\n// Surface a note when local hybrid signals are weak so host LLMs can\n// explain to users why results are search-heavy. Avoids silent fallbacks.\nfunction buildColdStartNote(\n cacheHits: number,\n embeddingAvailable: boolean,\n initialCacheSize: number,\n initialEmbedIndexSize: number,\n): string | undefined {\n if (initialCacheSize === 0) {\n return 'Cache is empty. Results come from live web search only. Use wigolo_fetch / wigolo_crawl to warm the cache, then re-run find_similar for hybrid local+web ranking.';\n }\n if (!embeddingAvailable && initialCacheSize > 0) {\n return 'Embeddings unavailable or index empty (cached pages have not been embedded yet). Falling back to FTS5 keyword ranking. 
Set up sentence-transformers to enable semantic matching.';\n }\n if (cacheHits === 0 && initialCacheSize < 20) {\n return `Cache has only ${initialCacheSize} pages. Add more context by fetching or crawling relevant sites before relying on find_similar for cross-source similarity.`;\n }\n if (!embeddingAvailable && initialEmbedIndexSize === 0) {\n return 'Embedding index is empty. Semantic matching disabled until background embedding jobs catch up.';\n }\n return undefined;\n}\n\nfunction safeNormalize(url: string): string {\n try {\n return normalizeUrl(url);\n } catch {\n return url;\n }\n}\n\nfunction mergeResults(...lists: FindSimilarResult[][]): FindSimilarResult[] {\n const seen = new Map<string, FindSimilarResult>();\n for (const list of lists) {\n for (const r of list) {\n const key = safeNormalize(r.url);\n const existing = seen.get(key);\n if (!existing) {\n seen.set(key, r);\n } else {\n // Merge match_signals so fused result records the most-specific source info\n existing.match_signals = {\n ...existing.match_signals,\n ...r.match_signals,\n fused_score: existing.match_signals.fused_score,\n };\n }\n }\n }\n return [...seen.values()];\n}\n\nasync function prepareSignal(\n url: string | undefined,\n concept: string | undefined,\n router: SmartRouter,\n): Promise<ResolvedSignal> {\n if (url) {\n return await prepareSignalFromUrl(url, router);\n }\n\n if (concept) {\n const terms = extractKeyTerms(concept, '');\n return { terms, title: concept, queryText: concept };\n }\n\n return { terms: [], title: '' };\n}\n\nasync function prepareSignalFromUrl(\n url: string,\n router: SmartRouter,\n): Promise<ResolvedSignal> {\n let normalizedInputUrl: string;\n try {\n normalizedInputUrl = normalizeUrl(url);\n } catch {\n normalizedInputUrl = url;\n }\n\n const cached = getCachedContent(url);\n if (cached) {\n const terms = extractKeyTerms(cached.markdown, cached.title);\n return {\n terms,\n title: cached.title,\n inputUrl: url,\n inputNormalizedUrl: 
normalizedInputUrl,\n queryText: cached.markdown,\n };\n }\n\n try {\n log.info('fetching URL for signal extraction', { url });\n const raw = await router.fetch(url, { renderJs: 'auto' });\n const extractor = await getExtractProvider();\n const extraction = await extractor.extract(raw.html, raw.finalUrl, {\n contentType: raw.contentType,\n });\n const terms = extractKeyTerms(extraction.markdown, extraction.title);\n return {\n terms,\n title: extraction.title,\n inputUrl: url,\n inputNormalizedUrl: normalizedInputUrl,\n queryText: extraction.markdown,\n };\n } catch (err) {\n log.warn('failed to fetch URL for signal extraction', { url, error: String(err) });\n const urlTerms = extractKeyTerms('', url);\n return {\n terms: urlTerms,\n title: url,\n inputUrl: url,\n inputNormalizedUrl: normalizedInputUrl,\n };\n }\n}\n\nasync function runEmbeddingSearch(\n queryText: string,\n excludeNormalizedUrl: string | undefined,\n includeDomains: string[] | undefined,\n excludeDomains: string[] | undefined,\n topK: number,\n rankMap: Map<string, number>,\n): Promise<FindSimilarResult[]> {\n try {\n const service = getEmbeddingService();\n if (!service.isAvailable() || !service.isSubprocessReady()) return [];\n if (service.getIndex().size() === 0) return [];\n\n const excludeUrls = excludeNormalizedUrl ? new Set([excludeNormalizedUrl]) : undefined;\n const similar = await service.findSimilar(queryText, topK, excludeUrls);\n if (similar.length === 0) return [];\n\n // Hydrate with cached content and apply domain filters on the hydrated pool\n const hydrated: Array<{ entry: CachedContent | null; url: string; score: number }> = [];\n for (const { url: nUrl, score } of similar) {\n const cached = getCachedContent(nUrl);\n hydrated.push({ entry: cached, url: nUrl, score });\n }\n\n const filterableInputs = hydrated.map(h => ({\n url: h.entry?.url ?? 
h.url,\n })) as unknown as CachedContent[];\n const filtered = filterByDomains(filterableInputs, includeDomains, excludeDomains) as unknown as Array<{\n url: string;\n }>;\n const allowedUrls = new Set(filtered.map(f => f.url));\n\n const results: FindSimilarResult[] = [];\n let rank = 0;\n for (const h of hydrated) {\n const displayUrl = h.entry?.url ?? h.url;\n if (!allowedUrls.has(displayUrl)) continue;\n\n rank++;\n rankMap.set(safeNormalize(displayUrl), rank);\n\n results.push({\n url: displayUrl,\n title: h.entry?.title ?? displayUrl,\n markdown: (h.entry?.markdown ?? '').slice(0, 5000),\n relevance_score: h.score,\n source: 'cache',\n match_signals: {\n embedding_rank: rank,\n fused_score: 0,\n },\n });\n }\n\n return results;\n } catch (err) {\n log.warn('embedding search failed', { error: String(err) });\n return [];\n }\n}\n\nfunction runFTS5Search(\n terms: string[],\n excludeNormalizedUrl: string | undefined,\n includeDomains: string[] | undefined,\n excludeDomains: string[] | undefined,\n maxCandidates: number,\n rankMap: Map<string, number>,\n): FindSimilarResult[] {\n try {\n const fts5Query = buildFTS5Query(terms);\n if (!fts5Query) return [];\n\n let cached = searchCache(fts5Query);\n\n if (excludeNormalizedUrl) {\n cached = cached.filter(c => {\n try {\n return normalizeUrl(c.url) !== excludeNormalizedUrl;\n } catch {\n return c.url !== excludeNormalizedUrl;\n }\n });\n }\n\n cached = filterByDomains(cached, includeDomains, excludeDomains) as CachedContent[];\n cached = cached.slice(0, maxCandidates);\n\n const results: FindSimilarResult[] = [];\n for (let i = 0; i < cached.length; i++) {\n const entry = cached[i];\n let nUrl: string;\n try {\n nUrl = normalizeUrl(entry.url);\n } catch {\n nUrl = entry.url;\n }\n\n rankMap.set(nUrl, i + 1);\n\n results.push({\n url: entry.url,\n title: entry.title,\n markdown: entry.markdown.slice(0, 5000),\n relevance_score: 0,\n source: 'cache',\n match_signals: {\n fts5_rank: i + 1,\n fused_score: 0,\n },\n 
});\n }\n\n return results;\n } catch (err) {\n log.error('FTS5 search failed', { error: String(err) });\n return [];\n }\n}\n\nasync function runWebSearchFallback(\n signal: ResolvedSignal,\n engines: SearchEngine[],\n router: SmartRouter,\n backendStatus: BackendStatus | undefined,\n maxResults: number,\n excludeNormalizedUrl: string | undefined,\n includeDomains: string[] | undefined,\n excludeDomains: string[] | undefined,\n rankMap: Map<string, number>,\n): Promise<FindSimilarResult[]> {\n try {\n const queries = generateSearchQueries(signal.terms, signal.title);\n if (queries.length === 0) return [];\n\n const allResults: FindSimilarResult[] = [];\n const seenUrls = new Set<string>();\n\n if (excludeNormalizedUrl) {\n seenUrls.add(excludeNormalizedUrl);\n }\n\n for (const query of queries) {\n try {\n const searchResult = await handleSearch(\n {\n query,\n max_results: maxResults,\n include_content: true,\n include_domains: includeDomains,\n exclude_domains: excludeDomains,\n },\n engines,\n router,\n backendStatus,\n );\n\n if (!searchResult.ok) {\n log.warn('web search query failed', { query, error: searchResult.error_reason });\n continue;\n }\n const searchOutput = searchResult.data;\n\n for (const item of searchOutput.results) {\n let nUrl: string;\n try {\n nUrl = normalizeUrl(item.url);\n } catch {\n nUrl = item.url;\n }\n\n if (seenUrls.has(nUrl)) continue;\n seenUrls.add(nUrl);\n\n const rank = allResults.length + 1;\n rankMap.set(nUrl, rank);\n\n allResults.push({\n url: item.url,\n title: item.title,\n markdown: (item.markdown_content ?? item.snippet).slice(0, 5000),\n relevance_score: item.relevance_score,\n source: 'search',\n match_signals: {\n fused_score: 0,\n },\n });\n }\n } catch (err) {\n log.warn('web search query failed', { query, error: String(err) });\n }\n }\n\n // Embed web results synchronously so they're in the index for the\n // re-query pass that runs after this fallback. 
Other tools use embedAsync\n // (fire-and-forget), but find_similar needs embeddings in THIS request.\n try {\n const embeddingService = getEmbeddingService();\n if (embeddingService.isAvailable() && embeddingService.isSubprocessReady()) {\n const embedPromises = allResults\n .filter(r => r.markdown)\n .slice(0, 10) // cap to avoid blocking too long\n .map(r => embeddingService.embedAndStore(r.url, r.markdown));\n await Promise.allSettled(embedPromises);\n log.debug('embedded web fallback results', { count: embedPromises.length });\n }\n } catch (err) {\n log.debug('embedding hook skipped for find_similar results', { error: String(err) });\n }\n\n return allResults;\n } catch (err) {\n log.error('web search fallback failed', { error: String(err) });\n return [];\n }\n}\n\nfunction generateSearchQueries(terms: string[], title: string): string[] {\n if (terms.length === 0 && !title) return [];\n\n const queries: string[] = [];\n\n if (title && title.length > 3) {\n queries.push(title.slice(0, 150));\n }\n\n if (terms.length >= 3) {\n queries.push(terms.slice(0, 5).join(' '));\n }\n\n if (terms.length >= 2) {\n queries.push(`${terms.slice(0, 3).join(' ')} tutorial guide`);\n }\n\n const unique = [...new Set(queries)];\n return unique.slice(0, WEB_SEARCH_QUERY_COUNT);\n}\n\nfunction fuseResults(\n rankedLists: Map<string, number>[],\n allResults: FindSimilarResult[],\n maxResults: number,\n): FindSimilarResult[] {\n const scores = reciprocalRankFusion(rankedLists);\n const sorted = sortByRRFScore(scores);\n\n const resultsByNormalizedUrl = new Map<string, FindSimilarResult>();\n for (const r of allResults) {\n const key = safeNormalize(r.url);\n if (!resultsByNormalizedUrl.has(key)) {\n resultsByNormalizedUrl.set(key, r);\n }\n }\n\n // Raw RRF scores cap at ~2/60 ≈ 0.033 which reads as \"low relevance\" to\n // users. 
Normalize against the top score so the best match is 1.0 and the\n // rest are proportional; the absolute RRF value is preserved in\n // match_signals.fused_score for clients that depend on it.\n const topScore = sorted.length > 0 ? sorted[0][1] : 0;\n const fused: FindSimilarResult[] = [];\n for (const [nUrl, score] of sorted) {\n if (fused.length >= maxResults) break;\n\n const result = resultsByNormalizedUrl.get(nUrl);\n if (!result) continue;\n\n const normalized = topScore > 0 ? score / topScore : 0;\n fused.push({\n ...result,\n relevance_score: normalized,\n match_signals: {\n ...result.match_signals,\n fused_score: score,\n },\n });\n }\n\n return fused;\n}\n\nfunction determineMethod(\n hasCache: boolean,\n hasEmbedding: boolean,\n hasSearch: boolean,\n): FindSimilarOutput['method'] {\n const sources = [hasCache, hasEmbedding, hasSearch].filter(Boolean).length;\n if (sources >= 2) return 'hybrid';\n if (hasEmbedding) return 'embedding';\n if (hasCache) return 'fts5';\n if (hasSearch) return 'search';\n return 
'fts5';\n}\n"],"mappings":"AASA,SAAS,iBAAiB,sBAAsB;AAChD,SAAS,sBAAsB,sBAAsB;AACrD,SAAS,aAAa,kBAAkB,cAAc,qBAAqB;AAC3E,SAAS,uBAAuB;AAChC,SAAS,oBAAoB;AAC7B,SAAS,0BAA0B;AACnC,SAAS,2BAA2B;AACpC,SAAS,oBAAoB;AAC7B,SAAS,kBAAkB;AAC3B,SAAS,iBAAiB;AAE1B,MAAM,MAAM,aAAa,QAAQ;AAEjC,MAAM,sBAAsB;AAC5B,MAAM,sBAAsB;AAC5B,MAAM,2BAA2B;AACjC,MAAM,yBAAyB;AAU/B,eAAsB,YACpB,OACA,SACA,QACA,eAC4B;AAC5B,QAAM,QAAQ,KAAK,IAAI;AAGvB,QAAM,qBAAqB,wBAAwB;AAKnD,QAAM,mBAAmB,eAAe;AACxC,QAAM,wBAAwB,mBAAmB;AAEjD,MAAI;AAGF,UAAM,OAAO,WAAW,KAAK;AAC7B,QAAI,SAAS,cAAc;AACzB,YAAM,OAAO,MAAM,KAAK,KAAK;AAC7B,UAAI,CAAC,MAAM;AACT,eAAO;AAAA,UACL,SAAS,CAAC;AAAA,UACV,QAAQ;AAAA,UACR,YAAY;AAAA,UACZ,aAAa;AAAA,UACb,qBAAqB;AAAA,UACrB,OAAO;AAAA,UACP,eAAe,KAAK,IAAI,IAAI;AAAA,QAC9B;AAAA,MACF;AACA,YAAM,KAAK,MAAM,UAAU,MAAM,OAAO,MAAM;AAC9C,aAAO,EAAE,GAAG,IAAI,eAAe,KAAK,IAAI,IAAI,MAAM;AAAA,IACpD;AAEA,UAAM,MAAM,MAAM,KAAK,KAAK;AAC5B,UAAM,UAAU,MAAM,SAAS,KAAK;AAEpC,QAAI,CAAC,OAAO,CAAC,SAAS;AACpB,aAAO;AAAA,QACL,SAAS,CAAC;AAAA,QACV,QAAQ;AAAA,QACR,YAAY;AAAA,QACZ,aAAa;AAAA,QACb,qBAAqB;AAAA,QACrB,OAAO;AAAA,QACP,eAAe,KAAK,IAAI,IAAI;AAAA,MAC9B;AAAA,IACF;AAEA,UAAM,aAAa,MAAM,eAAe;AACxC,UAAM,eAAe,MAAM,iBAAiB;AAC5C,UAAM,aAAa,MAAM,eAAe;AAExC,UAAM,SAAS,MAAM,cAAc,KAAK,SAAS,MAAM;AAEvD,QAAI,OAAO,MAAM,WAAW,KAAK,CAAC,OAAO,WAAW;AAClD,UAAI,KAAK,kEAAkE;AAE3E,UAAI,CAAC,YAAY;AACf,eAAO;AAAA,UACL,SAAS,CAAC;AAAA,UACV,QAAQ;AAAA,UACR,YAAY;AAAA,UACZ,aAAa;AAAA,UACb,qBAAqB;AAAA,UACrB,OAAO;AAAA,UACP,eAAe,KAAK,IAAI,IAAI;AAAA,QAC9B;AAAA,MACF;AAAA,IACF;AAGA,QAAI,eAAoC,CAAC;AACzC,UAAM,cAAc,oBAAI,IAAoB;AAC5C,QAAI,mBAAwC,CAAC;AAC7C,UAAM,mBAAmB,oBAAI,IAAoB;AAEjD,UAAM,QAAQ,IAAI;AAAA,OACf,YAAY;AACX,YAAI,gBAAgB,OAAO,MAAM,SAAS,GAAG;AAC3C,yBAAe;AAAA,YACb,OAAO;AAAA,YACP,OAAO;AAAA,YACP,MAAM;AAAA,YACN,MAAM;AAAA,YACN;AAAA,YACA;AAAA,UACF;AACA,cAAI,MAAM,wBAAwB,EAAE,MAAM,aAAa,OAAO,CAAC;AAAA,QACjE;AAAA,MACF,GAAG;AAAA,OACF,YAAY;AACX,YAAI,gBAAgB,sBAAsB,OAAO,WAAW;AAC1D,6BAAmB,MAAM;AAAA,YACvB,OAAO;AAAA,YACP,OAAO;AAAA,YACP,MAAM;AAAA,YACN,MAAM;AAAA,YACN;AAAA,YACA;AAAA,UACF;AACA,cAAI,MAAM,6BA
A6B,EAAE,MAAM,iBAAiB,OAAO,CAAC;AAAA,QAC1E;AAAA,MACF,GAAG;AAAA,IACL,CAAC;AAGD,QAAI,gBAAqC,CAAC;AAC1C,UAAM,gBAAgB,oBAAI,IAAoB;AAE9C,UAAM,oBAAoB,oBAAI,IAAY;AAC1C,eAAW,KAAK,aAAc,mBAAkB,IAAI,cAAc,EAAE,GAAG,CAAC;AACxE,eAAW,KAAK,iBAAkB,mBAAkB,IAAI,cAAc,EAAE,GAAG,CAAC;AAE5E,QAAI,kBAAkB,OAAO,cAAc,YAAY;AACrD,sBAAgB,MAAM;AAAA,QACpB;AAAA,QACA;AAAA,QACA;AAAA,QACA;AAAA,QACA;AAAA,QACA,OAAO;AAAA,QACP,MAAM;AAAA,QACN,MAAM;AAAA,QACN;AAAA,MACF;AACA,UAAI,MAAM,gCAAgC,EAAE,MAAM,cAAc,OAAO,CAAC;AAKxE,UAAI,sBAAsB,OAAO,aAAa,cAAc,SAAS,GAAG;AACtE,cAAM,wBAAwB,MAAM;AAAA,UAClC,OAAO;AAAA,UACP,OAAO;AAAA,UACP,MAAM;AAAA,UACN,MAAM;AAAA,UACN;AAAA,UACA;AAAA,QACF;AAEA,YAAI,sBAAsB,SAAS,GAAG;AACpC,6BAAmB;AACnB,cAAI,MAAM,8CAA8C,EAAE,MAAM,iBAAiB,OAAO,CAAC;AAAA,QAC3F;AAAA,MACF;AAAA,IACF;AAGA,UAAM,cAAqC,CAAC;AAC5C,QAAI,YAAY,OAAO,EAAG,aAAY,KAAK,WAAW;AACtD,QAAI,iBAAiB,OAAO,EAAG,aAAY,KAAK,gBAAgB;AAChE,QAAI,cAAc,OAAO,EAAG,aAAY,KAAK,aAAa;AAE1D,UAAM,aAAa,aAAa,cAAc,kBAAkB,aAAa;AAE7E,QAAI;AAEJ,QAAI,YAAY,UAAU,GAAG;AAC3B,qBAAe,YAAY,aAAa,YAAY,UAAU;AAAA,IAChE,OAAO;AACL,qBAAe,WACZ,KAAK,CAAC,GAAG,MAAM,EAAE,kBAAkB,EAAE,eAAe,EACpD,MAAM,GAAG,UAAU;AAAA,IACxB;AAEA,UAAM,SAAS;AAAA,MACb,aAAa,SAAS;AAAA,MACtB,iBAAiB,SAAS;AAAA,MAC1B,cAAc,SAAS;AAAA,IACzB;AAEA,UAAM,YAAY,aAAa,OAAO,OAAK,EAAE,WAAW,OAAO,EAAE;AACjE,UAAM,aAAa,aAAa,OAAO,OAAK,EAAE,WAAW,QAAQ,EAAE;AAEnE,UAAM,YAAY;AAAA,MAChB;AAAA,MACA;AAAA,MACA;AAAA,MACA;AAAA,IACF;AAEA,WAAO;AAAA,MACL,SAAS;AAAA,MACT;AAAA,MACA,YAAY;AAAA,MACZ,aAAa;AAAA,MACb,qBAAqB;AAAA,MACrB,GAAI,YAAY,EAAE,YAAY,UAAU,IAAI,CAAC;AAAA,MAC7C,eAAe,KAAK,IAAI,IAAI;AAAA,IAC9B;AAAA,EACF,SAAS,KAAK;AACZ,QAAI,MAAM,sBAAsB,EAAE,OAAO,OAAO,GAAG,EAAE,CAAC;AACtD,WAAO;AAAA,MACL,SAAS,CAAC;AAAA,MACV,QAAQ;AAAA,MACR,YAAY;AAAA,MACZ,aAAa;AAAA,MACb,qBAAqB;AAAA,MACrB,OAAO,wBAAwB,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG,CAAC;AAAA,MAC/E,eAAe,KAAK,IAAI,IAAI;AAAA,IAC9B;AAAA,EACF;AACF;AAEA,SAAS,0BAAmC;AAC1C,MAAI;AACF,UAAM,MAAM,oBAAoB;AAKhC,WAAO,IAAI,YAAY,KAAK,IAAI,kBAAkB;AAAA,EACpD,QAAQ;AACN,WAAO;AAAA,EACT;AACF;AAEA,SAAS,iBAAyB;AAChC,MAAI;AACF,WAAO,cAAc,EAAE;AA
AA,EACzB,QAAQ;AACN,WAAO;AAAA,EACT;AACF;AAEA,SAAS,qBAA6B;AACpC,MAAI;AACF,WAAO,oBAAoB,EAAE,SAAS,EAAE,KAAK;AAAA,EAC/C,QAAQ;AACN,WAAO;AAAA,EACT;AACF;AAIA,SAAS,mBACP,WACA,oBACA,kBACA,uBACoB;AACpB,MAAI,qBAAqB,GAAG;AAC1B,WAAO;AAAA,EACT;AACA,MAAI,CAAC,sBAAsB,mBAAmB,GAAG;AAC/C,WAAO;AAAA,EACT;AACA,MAAI,cAAc,KAAK,mBAAmB,IAAI;AAC5C,WAAO,kBAAkB,gBAAgB;AAAA,EAC3C;AACA,MAAI,CAAC,sBAAsB,0BAA0B,GAAG;AACtD,WAAO;AAAA,EACT;AACA,SAAO;AACT;AAEA,SAAS,cAAc,KAAqB;AAC1C,MAAI;AACF,WAAO,aAAa,GAAG;AAAA,EACzB,QAAQ;AACN,WAAO;AAAA,EACT;AACF;AAEA,SAAS,gBAAgB,OAAmD;AAC1E,QAAM,OAAO,oBAAI,IAA+B;AAChD,aAAW,QAAQ,OAAO;AACxB,eAAW,KAAK,MAAM;AACpB,YAAM,MAAM,cAAc,EAAE,GAAG;AAC/B,YAAM,WAAW,KAAK,IAAI,GAAG;AAC7B,UAAI,CAAC,UAAU;AACb,aAAK,IAAI,KAAK,CAAC;AAAA,MACjB,OAAO;AAEL,iBAAS,gBAAgB;AAAA,UACvB,GAAG,SAAS;AAAA,UACZ,GAAG,EAAE;AAAA,UACL,aAAa,SAAS,cAAc;AAAA,QACtC;AAAA,MACF;AAAA,IACF;AAAA,EACF;AACA,SAAO,CAAC,GAAG,KAAK,OAAO,CAAC;AAC1B;AAEA,eAAe,cACb,KACA,SACA,QACyB;AACzB,MAAI,KAAK;AACP,WAAO,MAAM,qBAAqB,KAAK,MAAM;AAAA,EAC/C;AAEA,MAAI,SAAS;AACX,UAAM,QAAQ,gBAAgB,SAAS,EAAE;AACzC,WAAO,EAAE,OAAO,OAAO,SAAS,WAAW,QAAQ;AAAA,EACrD;AAEA,SAAO,EAAE,OAAO,CAAC,GAAG,OAAO,GAAG;AAChC;AAEA,eAAe,qBACb,KACA,QACyB;AACzB,MAAI;AACJ,MAAI;AACF,yBAAqB,aAAa,GAAG;AAAA,EACvC,QAAQ;AACN,yBAAqB;AAAA,EACvB;AAEA,QAAM,SAAS,iBAAiB,GAAG;AACnC,MAAI,QAAQ;AACV,UAAM,QAAQ,gBAAgB,OAAO,UAAU,OAAO,KAAK;AAC3D,WAAO;AAAA,MACL;AAAA,MACA,OAAO,OAAO;AAAA,MACd,UAAU;AAAA,MACV,oBAAoB;AAAA,MACpB,WAAW,OAAO;AAAA,IACpB;AAAA,EACF;AAEA,MAAI;AACF,QAAI,KAAK,sCAAsC,EAAE,IAAI,CAAC;AACtD,UAAM,MAAM,MAAM,OAAO,MAAM,KAAK,EAAE,UAAU,OAAO,CAAC;AACxD,UAAM,YAAY,MAAM,mBAAmB;AAC3C,UAAM,aAAa,MAAM,UAAU,QAAQ,IAAI,MAAM,IAAI,UAAU;AAAA,MACjE,aAAa,IAAI;AAAA,IACnB,CAAC;AACD,UAAM,QAAQ,gBAAgB,WAAW,UAAU,WAAW,KAAK;AACnE,WAAO;AAAA,MACL;AAAA,MACA,OAAO,WAAW;AAAA,MAClB,UAAU;AAAA,MACV,oBAAoB;AAAA,MACpB,WAAW,WAAW;AAAA,IACxB;AAAA,EACF,SAAS,KAAK;AACZ,QAAI,KAAK,6CAA6C,EAAE,KAAK,OAAO,OAAO,GAAG,EAAE,CAAC;AACjF,UAAM,WAAW,gBAAgB,IAAI,GAAG;AACxC,WAAO;AAAA,MACL,OAAO;AAAA,MACP,OAAO;AAAA,MACP,UAAU;AAAA,MACV,oBAAoB;AAAA,IAC
tB;AAAA,EACF;AACF;AAEA,eAAe,mBACb,WACA,sBACA,gBACA,gBACA,MACA,SAC8B;AAC9B,MAAI;AACF,UAAM,UAAU,oBAAoB;AACpC,QAAI,CAAC,QAAQ,YAAY,KAAK,CAAC,QAAQ,kBAAkB,EAAG,QAAO,CAAC;AACpE,QAAI,QAAQ,SAAS,EAAE,KAAK,MAAM,EAAG,QAAO,CAAC;AAE7C,UAAM,cAAc,uBAAuB,oBAAI,IAAI,CAAC,oBAAoB,CAAC,IAAI;AAC7E,UAAM,UAAU,MAAM,QAAQ,YAAY,WAAW,MAAM,WAAW;AACtE,QAAI,QAAQ,WAAW,EAAG,QAAO,CAAC;AAGlC,UAAM,WAA+E,CAAC;AACtF,eAAW,EAAE,KAAK,MAAM,MAAM,KAAK,SAAS;AAC1C,YAAM,SAAS,iBAAiB,IAAI;AACpC,eAAS,KAAK,EAAE,OAAO,QAAQ,KAAK,MAAM,MAAM,CAAC;AAAA,IACnD;AAEA,UAAM,mBAAmB,SAAS,IAAI,QAAM;AAAA,MAC1C,KAAK,EAAE,OAAO,OAAO,EAAE;AAAA,IACzB,EAAE;AACF,UAAM,WAAW,gBAAgB,kBAAkB,gBAAgB,cAAc;AAGjF,UAAM,cAAc,IAAI,IAAI,SAAS,IAAI,OAAK,EAAE,GAAG,CAAC;AAEpD,UAAM,UAA+B,CAAC;AACtC,QAAI,OAAO;AACX,eAAW,KAAK,UAAU;AACxB,YAAM,aAAa,EAAE,OAAO,OAAO,EAAE;AACrC,UAAI,CAAC,YAAY,IAAI,UAAU,EAAG;AAElC;AACA,cAAQ,IAAI,cAAc,UAAU,GAAG,IAAI;AAE3C,cAAQ,KAAK;AAAA,QACX,KAAK;AAAA,QACL,OAAO,EAAE,OAAO,SAAS;AAAA,QACzB,WAAW,EAAE,OAAO,YAAY,IAAI,MAAM,GAAG,GAAI;AAAA,QACjD,iBAAiB,EAAE;AAAA,QACnB,QAAQ;AAAA,QACR,eAAe;AAAA,UACb,gBAAgB;AAAA,UAChB,aAAa;AAAA,QACf;AAAA,MACF,CAAC;AAAA,IACH;AAEA,WAAO;AAAA,EACT,SAAS,KAAK;AACZ,QAAI,KAAK,2BAA2B,EAAE,OAAO,OAAO,GAAG,EAAE,CAAC;AAC1D,WAAO,CAAC;AAAA,EACV;AACF;AAEA,SAAS,cACP,OACA,sBACA,gBACA,gBACA,eACA,SACqB;AACrB,MAAI;AACF,UAAM,YAAY,eAAe,KAAK;AACtC,QAAI,CAAC,UAAW,QAAO,CAAC;AAExB,QAAI,SAAS,YAAY,SAAS;AAElC,QAAI,sBAAsB;AACxB,eAAS,OAAO,OAAO,OAAK;AAC1B,YAAI;AACF,iBAAO,aAAa,EAAE,GAAG,MAAM;AAAA,QACjC,QAAQ;AACN,iBAAO,EAAE,QAAQ;AAAA,QACnB;AAAA,MACF,CAAC;AAAA,IACH;AAEA,aAAS,gBAAgB,QAAQ,gBAAgB,cAAc;AAC/D,aAAS,OAAO,MAAM,GAAG,aAAa;AAEtC,UAAM,UAA+B,CAAC;AACtC,aAAS,IAAI,GAAG,IAAI,OAAO,QAAQ,KAAK;AACtC,YAAM,QAAQ,OAAO,CAAC;AACtB,UAAI;AACJ,UAAI;AACF,eAAO,aAAa,MAAM,GAAG;AAAA,MAC/B,QAAQ;AACN,eAAO,MAAM;AAAA,MACf;AAEA,cAAQ,IAAI,MAAM,IAAI,CAAC;AAEvB,cAAQ,KAAK;AAAA,QACX,KAAK,MAAM;AAAA,QACX,OAAO,MAAM;AAAA,QACb,UAAU,MAAM,SAAS,MAAM,GAAG,GAAI;AAAA,QACtC,iBAAiB;AAAA,QACjB,QAAQ;AAAA,QACR,eAAe;AAAA,UACb,WAAW,IAAI;AAAA,UACf,aAAa;AAAA,QACf;AAAA,MACF,CAAC;AAAA,IACH;AAEA,WAA
O;AAAA,EACT,SAAS,KAAK;AACZ,QAAI,MAAM,sBAAsB,EAAE,OAAO,OAAO,GAAG,EAAE,CAAC;AACtD,WAAO,CAAC;AAAA,EACV;AACF;AAEA,eAAe,qBACb,QACA,SACA,QACA,eACA,YACA,sBACA,gBACA,gBACA,SAC8B;AAC9B,MAAI;AACF,UAAM,UAAU,sBAAsB,OAAO,OAAO,OAAO,KAAK;AAChE,QAAI,QAAQ,WAAW,EAAG,QAAO,CAAC;AAElC,UAAM,aAAkC,CAAC;AACzC,UAAM,WAAW,oBAAI,IAAY;AAEjC,QAAI,sBAAsB;AACxB,eAAS,IAAI,oBAAoB;AAAA,IACnC;AAEA,eAAW,SAAS,SAAS;AAC3B,UAAI;AACF,cAAM,eAAe,MAAM;AAAA,UACzB;AAAA,YACE;AAAA,YACA,aAAa;AAAA,YACb,iBAAiB;AAAA,YACjB,iBAAiB;AAAA,YACjB,iBAAiB;AAAA,UACnB;AAAA,UACA;AAAA,UACA;AAAA,UACA;AAAA,QACF;AAEA,YAAI,CAAC,aAAa,IAAI;AACpB,cAAI,KAAK,2BAA2B,EAAE,OAAO,OAAO,aAAa,aAAa,CAAC;AAC/E;AAAA,QACF;AACA,cAAM,eAAe,aAAa;AAElC,mBAAW,QAAQ,aAAa,SAAS;AACvC,cAAI;AACJ,cAAI;AACF,mBAAO,aAAa,KAAK,GAAG;AAAA,UAC9B,QAAQ;AACN,mBAAO,KAAK;AAAA,UACd;AAEA,cAAI,SAAS,IAAI,IAAI,EAAG;AACxB,mBAAS,IAAI,IAAI;AAEjB,gBAAM,OAAO,WAAW,SAAS;AACjC,kBAAQ,IAAI,MAAM,IAAI;AAEtB,qBAAW,KAAK;AAAA,YACd,KAAK,KAAK;AAAA,YACV,OAAO,KAAK;AAAA,YACZ,WAAW,KAAK,oBAAoB,KAAK,SAAS,MAAM,GAAG,GAAI;AAAA,YAC/D,iBAAiB,KAAK;AAAA,YACtB,QAAQ;AAAA,YACR,eAAe;AAAA,cACb,aAAa;AAAA,YACf;AAAA,UACF,CAAC;AAAA,QACH;AAAA,MACF,SAAS,KAAK;AACZ,YAAI,KAAK,2BAA2B,EAAE,OAAO,OAAO,OAAO,GAAG,EAAE,CAAC;AAAA,MACnE;AAAA,IACF;AAKA,QAAI;AACF,YAAM,mBAAmB,oBAAoB;AAC7C,UAAI,iBAAiB,YAAY,KAAK,iBAAiB,kBAAkB,GAAG;AAC1E,cAAM,gBAAgB,WACnB,OAAO,OAAK,EAAE,QAAQ,EACtB,MAAM,GAAG,EAAE,EACX,IAAI,OAAK,iBAAiB,cAAc,EAAE,KAAK,EAAE,QAAQ,CAAC;AAC7D,cAAM,QAAQ,WAAW,aAAa;AACtC,YAAI,MAAM,iCAAiC,EAAE,OAAO,cAAc,OAAO,CAAC;AAAA,MAC5E;AAAA,IACF,SAAS,KAAK;AACZ,UAAI,MAAM,mDAAmD,EAAE,OAAO,OAAO,GAAG,EAAE,CAAC;AAAA,IACrF;AAEA,WAAO;AAAA,EACT,SAAS,KAAK;AACZ,QAAI,MAAM,8BAA8B,EAAE,OAAO,OAAO,GAAG,EAAE,CAAC;AAC9D,WAAO,CAAC;AAAA,EACV;AACF;AAEA,SAAS,sBAAsB,OAAiB,OAAyB;AACvE,MAAI,MAAM,WAAW,KAAK,CAAC,MAAO,QAAO,CAAC;AAE1C,QAAM,UAAoB,CAAC;AAE3B,MAAI,SAAS,MAAM,SAAS,GAAG;AAC7B,YAAQ,KAAK,MAAM,MAAM,GAAG,GAAG,CAAC;AAAA,EAClC;AAEA,MAAI,MAAM,UAAU,GAAG;AACrB,YAAQ,KAAK,MAAM,MAAM,GAAG,CAAC,EAAE,KAAK,GAAG,CAAC;AAAA,EAC1C;AAEA,MAAI,MAAM,UAAU,GAAG;AACrB,YAAQ,KAAK,GAAG,MAAM,
MAAM,GAAG,CAAC,EAAE,KAAK,GAAG,CAAC,iBAAiB;AAAA,EAC9D;AAEA,QAAM,SAAS,CAAC,GAAG,IAAI,IAAI,OAAO,CAAC;AACnC,SAAO,OAAO,MAAM,GAAG,sBAAsB;AAC/C;AAEA,SAAS,YACP,aACA,YACA,YACqB;AACrB,QAAM,SAAS,qBAAqB,WAAW;AAC/C,QAAM,SAAS,eAAe,MAAM;AAEpC,QAAM,yBAAyB,oBAAI,IAA+B;AAClE,aAAW,KAAK,YAAY;AAC1B,UAAM,MAAM,cAAc,EAAE,GAAG;AAC/B,QAAI,CAAC,uBAAuB,IAAI,GAAG,GAAG;AACpC,6BAAuB,IAAI,KAAK,CAAC;AAAA,IACnC;AAAA,EACF;AAMA,QAAM,WAAW,OAAO,SAAS,IAAI,OAAO,CAAC,EAAE,CAAC,IAAI;AACpD,QAAM,QAA6B,CAAC;AACpC,aAAW,CAAC,MAAM,KAAK,KAAK,QAAQ;AAClC,QAAI,MAAM,UAAU,WAAY;AAEhC,UAAM,SAAS,uBAAuB,IAAI,IAAI;AAC9C,QAAI,CAAC,OAAQ;AAEb,UAAM,aAAa,WAAW,IAAI,QAAQ,WAAW;AACrD,UAAM,KAAK;AAAA,MACT,GAAG;AAAA,MACH,iBAAiB;AAAA,MACjB,eAAe;AAAA,QACb,GAAG,OAAO;AAAA,QACV,aAAa;AAAA,MACf;AAAA,IACF,CAAC;AAAA,EACH;AAEA,SAAO;AACT;AAEA,SAAS,gBACP,UACA,cACA,WAC6B;AAC7B,QAAM,UAAU,CAAC,UAAU,cAAc,SAAS,EAAE,OAAO,OAAO,EAAE;AACpE,MAAI,WAAW,EAAG,QAAO;AACzB,MAAI,aAAc,QAAO;AACzB,MAAI,SAAU,QAAO;AACrB,MAAI,UAAW,QAAO;AACtB,SAAO;AACT;","names":[]}
@@ -0,0 +1,19 @@
1
+ import type { SearchResultItem, Citation, Highlight } from '../types.js';
2
+ export interface HighlightSynthesisResult {
3
+ highlights: Highlight[];
4
+ citations: Citation[];
5
+ reranker_used: boolean;
6
+ }
7
+ export interface Passage {
8
+ text: string;
9
+ charStart: number;
10
+ charEnd: number;
11
+ }
12
+ export declare function splitIntoPassages(markdown: string): Passage[];
13
+ export interface AnnotatedPassage extends Passage {
14
+ sectionHeading: string | null;
15
+ }
16
+ export declare function mapPassageHeadings(markdown: string, passages: Passage[]): AnnotatedPassage[];
17
+ export declare function extractHighlights(query: string, results: SearchResultItem[], maxHighlights?: number): Promise<HighlightSynthesisResult>;
18
+ export declare function fallbackHighlights(results: SearchResultItem[], maxHighlights: number): Highlight[];
19
+ //# sourceMappingURL=highlights.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"highlights.d.ts","sourceRoot":"","sources":["../../src/search/highlights.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,gBAAgB,EAAE,QAAQ,EAAE,SAAS,EAAE,MAAM,aAAa,CAAC;AAYzE,MAAM,WAAW,wBAAwB;IACvC,UAAU,EAAE,SAAS,EAAE,CAAC;IACxB,SAAS,EAAE,QAAQ,EAAE,CAAC;IACtB,aAAa,EAAE,OAAO,CAAC;CACxB;AAED,MAAM,WAAW,OAAO;IACtB,IAAI,EAAE,MAAM,CAAC;IACb,SAAS,EAAE,MAAM,CAAC;IAClB,OAAO,EAAE,MAAM,CAAC;CACjB;AAwBD,wBAAgB,iBAAiB,CAAC,QAAQ,EAAE,MAAM,GAAG,OAAO,EAAE,CA6B7D;AAOD,MAAM,WAAW,gBAAiB,SAAQ,OAAO;IAC/C,cAAc,EAAE,MAAM,GAAG,IAAI,CAAC;CAC/B;AAKD,wBAAgB,kBAAkB,CAChC,QAAQ,EAAE,MAAM,EAChB,QAAQ,EAAE,OAAO,EAAE,GAClB,gBAAgB,EAAE,CAapB;AAMD,wBAAsB,iBAAiB,CACrC,KAAK,EAAE,MAAM,EACb,OAAO,EAAE,gBAAgB,EAAE,EAC3B,aAAa,GAAE,MAA+B,GAC7C,OAAO,CAAC,wBAAwB,CAAC,CAmEnC;AAKD,wBAAgB,kBAAkB,CAChC,OAAO,EAAE,gBAAgB,EAAE,EAC3B,aAAa,EAAE,MAAM,GACpB,SAAS,EAAE,CAkCb"}