@staticn0va/wigolo 0.1.0 → 0.1.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +1 -1
- package/README.md +146 -227
- package/SKILL.md +382 -0
- package/assets/blocks/claude-code/CLAUDE.md.block +20 -0
- package/assets/blocks/claude-code/wigolo-command.md +40 -0
- package/assets/blocks/cursor/wigolo.mdc +46 -0
- package/assets/blocks/gemini-cli/GEMINI.md.block +18 -0
- package/assets/blocks/vscode/copilot-instructions.md.block +18 -0
- package/assets/skills/wigolo/SKILL.md +50 -0
- package/assets/skills/wigolo/rules/cache-first.md +30 -0
- package/assets/skills/wigolo/rules/synthesis.md +43 -0
- package/assets/skills/wigolo-agent/SKILL.md +73 -0
- package/assets/skills/wigolo-crawl/SKILL.md +60 -0
- package/assets/skills/wigolo-extract/SKILL.md +59 -0
- package/assets/skills/wigolo-fetch/SKILL.md +65 -0
- package/assets/skills/wigolo-find-similar/SKILL.md +72 -0
- package/assets/skills/wigolo-research/SKILL.md +77 -0
- package/assets/skills/wigolo-search/SKILL.md +78 -0
- package/dist/agent/executor.d.ts +33 -0
- package/dist/agent/executor.d.ts.map +1 -0
- package/dist/agent/executor.js +233 -0
- package/dist/agent/executor.js.map +1 -0
- package/dist/agent/pipeline.d.ts +5 -0
- package/dist/agent/pipeline.d.ts.map +1 -0
- package/dist/agent/pipeline.js +238 -0
- package/dist/agent/pipeline.js.map +1 -0
- package/dist/agent/planner.d.ts +13 -0
- package/dist/agent/planner.d.ts.map +1 -0
- package/dist/agent/planner.js +271 -0
- package/dist/agent/planner.js.map +1 -0
- package/dist/agent/relevance.d.ts +15 -0
- package/dist/agent/relevance.d.ts.map +1 -0
- package/dist/agent/relevance.js +60 -0
- package/dist/agent/relevance.js.map +1 -0
- package/dist/cache/backfill-embeddings.d.ts +23 -0
- package/dist/cache/backfill-embeddings.d.ts.map +1 -0
- package/dist/cache/backfill-embeddings.js +105 -0
- package/dist/cache/backfill-embeddings.js.map +1 -0
- package/dist/cache/change-detector.d.ts +7 -0
- package/dist/cache/change-detector.d.ts.map +1 -0
- package/dist/cache/change-detector.js +43 -0
- package/dist/cache/change-detector.js.map +1 -0
- package/dist/cache/db.d.ts +1 -0
- package/dist/cache/db.d.ts.map +1 -1
- package/dist/cache/db.js +94 -22
- package/dist/cache/db.js.map +1 -1
- package/dist/cache/diff-summary.d.ts +2 -0
- package/dist/cache/diff-summary.d.ts.map +1 -0
- package/dist/cache/diff-summary.js +82 -0
- package/dist/cache/diff-summary.js.map +1 -0
- package/dist/cache/migrations/runner.d.ts +29 -0
- package/dist/cache/migrations/runner.d.ts.map +1 -0
- package/dist/cache/migrations/runner.js +147 -0
- package/dist/cache/migrations/runner.js.map +1 -0
- package/dist/cache/sqlite-vec-store.d.ts +42 -0
- package/dist/cache/sqlite-vec-store.d.ts.map +1 -0
- package/dist/cache/sqlite-vec-store.js +176 -0
- package/dist/cache/sqlite-vec-store.js.map +1 -0
- package/dist/cache/store.d.ts +47 -1
- package/dist/cache/store.d.ts.map +1 -1
- package/dist/cache/store.js +364 -168
- package/dist/cache/store.js.map +1 -1
- package/dist/cli/agents/antigravity.d.ts +20 -0
- package/dist/cli/agents/antigravity.d.ts.map +1 -0
- package/dist/cli/agents/antigravity.js +49 -0
- package/dist/cli/agents/antigravity.js.map +1 -0
- package/dist/cli/agents/claude-code.d.ts +25 -0
- package/dist/cli/agents/claude-code.d.ts.map +1 -0
- package/dist/cli/agents/claude-code.js +111 -0
- package/dist/cli/agents/claude-code.js.map +1 -0
- package/dist/cli/agents/cursor.d.ts +21 -0
- package/dist/cli/agents/cursor.d.ts.map +1 -0
- package/dist/cli/agents/cursor.js +58 -0
- package/dist/cli/agents/cursor.js.map +1 -0
- package/dist/cli/agents/gemini-cli.d.ts +21 -0
- package/dist/cli/agents/gemini-cli.d.ts.map +1 -0
- package/dist/cli/agents/gemini-cli.js +55 -0
- package/dist/cli/agents/gemini-cli.js.map +1 -0
- package/dist/cli/agents/registry.d.ts +21 -0
- package/dist/cli/agents/registry.d.ts.map +1 -0
- package/dist/cli/agents/registry.js +27 -0
- package/dist/cli/agents/registry.js.map +1 -0
- package/dist/cli/agents/utils.d.ts +26 -0
- package/dist/cli/agents/utils.d.ts.map +1 -0
- package/dist/cli/agents/utils.js +136 -0
- package/dist/cli/agents/utils.js.map +1 -0
- package/dist/cli/agents/vscode.d.ts +21 -0
- package/dist/cli/agents/vscode.d.ts.map +1 -0
- package/dist/cli/agents/vscode.js +62 -0
- package/dist/cli/agents/vscode.js.map +1 -0
- package/dist/cli/auth.d.ts +2 -0
- package/dist/cli/auth.d.ts.map +1 -0
- package/dist/cli/auth.js +94 -0
- package/dist/cli/auth.js.map +1 -0
- package/dist/cli/backfill.d.ts +2 -0
- package/dist/cli/backfill.d.ts.map +1 -0
- package/dist/cli/backfill.js +58 -0
- package/dist/cli/backfill.js.map +1 -0
- package/dist/cli/daemon.d.ts +6 -1
- package/dist/cli/daemon.d.ts.map +1 -1
- package/dist/cli/daemon.js +61 -3
- package/dist/cli/daemon.js.map +1 -1
- package/dist/cli/doctor.d.ts +8 -0
- package/dist/cli/doctor.d.ts.map +1 -0
- package/dist/cli/doctor.js +344 -0
- package/dist/cli/doctor.js.map +1 -0
- package/dist/cli/health.d.ts +1 -1
- package/dist/cli/health.d.ts.map +1 -1
- package/dist/cli/health.js +42 -3
- package/dist/cli/health.js.map +1 -1
- package/dist/cli/help.d.ts +6 -0
- package/dist/cli/help.d.ts.map +1 -0
- package/dist/cli/help.js +63 -0
- package/dist/cli/help.js.map +1 -0
- package/dist/cli/index.d.ts +1 -1
- package/dist/cli/index.d.ts.map +1 -1
- package/dist/cli/index.js +35 -7
- package/dist/cli/index.js.map +1 -1
- package/dist/cli/init.d.ts +2 -0
- package/dist/cli/init.d.ts.map +1 -0
- package/dist/cli/init.js +201 -0
- package/dist/cli/init.js.map +1 -0
- package/dist/cli/plugin.d.ts +5 -0
- package/dist/cli/plugin.d.ts.map +1 -0
- package/dist/cli/plugin.js +185 -0
- package/dist/cli/plugin.js.map +1 -0
- package/dist/cli/setup-mcp.d.ts +2 -0
- package/dist/cli/setup-mcp.d.ts.map +1 -0
- package/dist/cli/setup-mcp.js +114 -0
- package/dist/cli/setup-mcp.js.map +1 -0
- package/dist/cli/shell.d.ts +2 -0
- package/dist/cli/shell.d.ts.map +1 -0
- package/dist/cli/shell.js +86 -0
- package/dist/cli/shell.js.map +1 -0
- package/dist/cli/shutdown.d.ts +2 -0
- package/dist/cli/shutdown.d.ts.map +1 -0
- package/dist/cli/shutdown.js +26 -0
- package/dist/cli/shutdown.js.map +1 -0
- package/dist/cli/status.d.ts +2 -0
- package/dist/cli/status.d.ts.map +1 -0
- package/dist/cli/status.js +31 -0
- package/dist/cli/status.js.map +1 -0
- package/dist/cli/telemetry.d.ts +10 -0
- package/dist/cli/telemetry.d.ts.map +1 -0
- package/dist/cli/telemetry.js +56 -0
- package/dist/cli/telemetry.js.map +1 -0
- package/dist/cli/tui/agents-types.d.ts +28 -0
- package/dist/cli/tui/agents-types.d.ts.map +1 -0
- package/dist/cli/tui/agents-types.js +1 -0
- package/dist/cli/tui/agents-types.js.map +1 -0
- package/dist/cli/tui/agents.d.ts +11 -0
- package/dist/cli/tui/agents.d.ts.map +1 -0
- package/dist/cli/tui/agents.js +93 -0
- package/dist/cli/tui/agents.js.map +1 -0
- package/dist/cli/tui/banner.d.ts +3 -0
- package/dist/cli/tui/banner.d.ts.map +1 -0
- package/dist/cli/tui/banner.js +30 -0
- package/dist/cli/tui/banner.js.map +1 -0
- package/dist/cli/tui/components/AgentSelect.d.ts +13 -0
- package/dist/cli/tui/components/AgentSelect.d.ts.map +1 -0
- package/dist/cli/tui/components/AgentSelect.js +116 -0
- package/dist/cli/tui/components/AgentSelect.js.map +1 -0
- package/dist/cli/tui/components/Banner.d.ts +6 -0
- package/dist/cli/tui/components/Banner.d.ts.map +1 -0
- package/dist/cli/tui/components/Banner.js +25 -0
- package/dist/cli/tui/components/Banner.js.map +1 -0
- package/dist/cli/tui/components/BrowserSelect.d.ts +7 -0
- package/dist/cli/tui/components/BrowserSelect.d.ts.map +1 -0
- package/dist/cli/tui/components/BrowserSelect.js +19 -0
- package/dist/cli/tui/components/BrowserSelect.js.map +1 -0
- package/dist/cli/tui/components/InstallProgress.d.ts +9 -0
- package/dist/cli/tui/components/InstallProgress.d.ts.map +1 -0
- package/dist/cli/tui/components/InstallProgress.js +67 -0
- package/dist/cli/tui/components/InstallProgress.js.map +1 -0
- package/dist/cli/tui/components/SkillInstall.d.ts +14 -0
- package/dist/cli/tui/components/SkillInstall.d.ts.map +1 -0
- package/dist/cli/tui/components/SkillInstall.js +94 -0
- package/dist/cli/tui/components/SkillInstall.js.map +1 -0
- package/dist/cli/tui/components/Summary.d.ts +22 -0
- package/dist/cli/tui/components/Summary.d.ts.map +1 -0
- package/dist/cli/tui/components/Summary.js +135 -0
- package/dist/cli/tui/components/Summary.js.map +1 -0
- package/dist/cli/tui/components/SystemCheck.d.ts +8 -0
- package/dist/cli/tui/components/SystemCheck.d.ts.map +1 -0
- package/dist/cli/tui/components/SystemCheck.js +71 -0
- package/dist/cli/tui/components/SystemCheck.js.map +1 -0
- package/dist/cli/tui/components/Verification.d.ts +8 -0
- package/dist/cli/tui/components/Verification.d.ts.map +1 -0
- package/dist/cli/tui/components/Verification.js +63 -0
- package/dist/cli/tui/components/Verification.js.map +1 -0
- package/dist/cli/tui/config-writer-cli.d.ts +12 -0
- package/dist/cli/tui/config-writer-cli.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-cli.js +39 -0
- package/dist/cli/tui/config-writer-cli.js.map +1 -0
- package/dist/cli/tui/config-writer-json.d.ts +16 -0
- package/dist/cli/tui/config-writer-json.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-json.js +86 -0
- package/dist/cli/tui/config-writer-json.js.map +1 -0
- package/dist/cli/tui/config-writer-toml.d.ts +16 -0
- package/dist/cli/tui/config-writer-toml.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-toml.js +83 -0
- package/dist/cli/tui/config-writer-toml.js.map +1 -0
- package/dist/cli/tui/config-writer.d.ts +25 -0
- package/dist/cli/tui/config-writer.d.ts.map +1 -0
- package/dist/cli/tui/config-writer.js +101 -0
- package/dist/cli/tui/config-writer.js.map +1 -0
- package/dist/cli/tui/detect-helpers.d.ts +6 -0
- package/dist/cli/tui/detect-helpers.d.ts.map +1 -0
- package/dist/cli/tui/detect-helpers.js +45 -0
- package/dist/cli/tui/detect-helpers.js.map +1 -0
- package/dist/cli/tui/extras-prompt.d.ts +7 -0
- package/dist/cli/tui/extras-prompt.d.ts.map +1 -0
- package/dist/cli/tui/extras-prompt.js +42 -0
- package/dist/cli/tui/extras-prompt.js.map +1 -0
- package/dist/cli/tui/flags-types.d.ts +19 -0
- package/dist/cli/tui/flags-types.d.ts.map +1 -0
- package/dist/cli/tui/flags-types.js +23 -0
- package/dist/cli/tui/flags-types.js.map +1 -0
- package/dist/cli/tui/flags.d.ts +5 -0
- package/dist/cli/tui/flags.d.ts.map +1 -0
- package/dist/cli/tui/flags.js +132 -0
- package/dist/cli/tui/flags.js.map +1 -0
- package/dist/cli/tui/format.d.ts +14 -0
- package/dist/cli/tui/format.d.ts.map +1 -0
- package/dist/cli/tui/format.js +37 -0
- package/dist/cli/tui/format.js.map +1 -0
- package/dist/cli/tui/hooks/useAgentDetect.d.ts +6 -0
- package/dist/cli/tui/hooks/useAgentDetect.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useAgentDetect.js +19 -0
- package/dist/cli/tui/hooks/useAgentDetect.js.map +1 -0
- package/dist/cli/tui/hooks/useInstall.d.ts +14 -0
- package/dist/cli/tui/hooks/useInstall.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useInstall.js +90 -0
- package/dist/cli/tui/hooks/useInstall.js.map +1 -0
- package/dist/cli/tui/hooks/useSystemCheck.d.ts +13 -0
- package/dist/cli/tui/hooks/useSystemCheck.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useSystemCheck.js +95 -0
- package/dist/cli/tui/hooks/useSystemCheck.js.map +1 -0
- package/dist/cli/tui/hooks/useVerify.d.ts +14 -0
- package/dist/cli/tui/hooks/useVerify.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useVerify.js +71 -0
- package/dist/cli/tui/hooks/useVerify.js.map +1 -0
- package/dist/cli/tui/ink-init.d.ts +2 -0
- package/dist/cli/tui/ink-init.d.ts.map +1 -0
- package/dist/cli/tui/ink-init.js +198 -0
- package/dist/cli/tui/ink-init.js.map +1 -0
- package/dist/cli/tui/reporter-auto.d.ts +7 -0
- package/dist/cli/tui/reporter-auto.d.ts.map +1 -0
- package/dist/cli/tui/reporter-auto.js +15 -0
- package/dist/cli/tui/reporter-auto.js.map +1 -0
- package/dist/cli/tui/reporter.d.ts +26 -0
- package/dist/cli/tui/reporter.d.ts.map +1 -0
- package/dist/cli/tui/reporter.js +32 -0
- package/dist/cli/tui/reporter.js.map +1 -0
- package/dist/cli/tui/run-command.d.ts +14 -0
- package/dist/cli/tui/run-command.d.ts.map +1 -0
- package/dist/cli/tui/run-command.js +72 -0
- package/dist/cli/tui/run-command.js.map +1 -0
- package/dist/cli/tui/select-agents.d.ts +6 -0
- package/dist/cli/tui/select-agents.d.ts.map +1 -0
- package/dist/cli/tui/select-agents.js +32 -0
- package/dist/cli/tui/select-agents.js.map +1 -0
- package/dist/cli/tui/status-agents.d.ts +11 -0
- package/dist/cli/tui/status-agents.d.ts.map +1 -0
- package/dist/cli/tui/status-agents.js +53 -0
- package/dist/cli/tui/status-agents.js.map +1 -0
- package/dist/cli/tui/status-cache.d.ts +6 -0
- package/dist/cli/tui/status-cache.d.ts.map +1 -0
- package/dist/cli/tui/status-cache.js +39 -0
- package/dist/cli/tui/status-cache.js.map +1 -0
- package/dist/cli/tui/status-format.d.ts +14 -0
- package/dist/cli/tui/status-format.d.ts.map +1 -0
- package/dist/cli/tui/status-format.js +41 -0
- package/dist/cli/tui/status-format.js.map +1 -0
- package/dist/cli/tui/status-python.d.ts +6 -0
- package/dist/cli/tui/status-python.d.ts.map +1 -0
- package/dist/cli/tui/status-python.js +30 -0
- package/dist/cli/tui/status-python.js.map +1 -0
- package/dist/cli/tui/system-check.d.ts +24 -0
- package/dist/cli/tui/system-check.d.ts.map +1 -0
- package/dist/cli/tui/system-check.js +103 -0
- package/dist/cli/tui/system-check.js.map +1 -0
- package/dist/cli/tui/tui-reporter.d.ts +19 -0
- package/dist/cli/tui/tui-reporter.d.ts.map +1 -0
- package/dist/cli/tui/tui-reporter.js +95 -0
- package/dist/cli/tui/tui-reporter.js.map +1 -0
- package/dist/cli/tui/utils/config-writer.d.ts +3 -0
- package/dist/cli/tui/utils/config-writer.d.ts.map +1 -0
- package/dist/cli/tui/utils/config-writer.js +22 -0
- package/dist/cli/tui/utils/config-writer.js.map +1 -0
- package/dist/cli/tui/utils/suppress-logs.d.ts +3 -0
- package/dist/cli/tui/utils/suppress-logs.d.ts.map +1 -0
- package/dist/cli/tui/utils/suppress-logs.js +11 -0
- package/dist/cli/tui/utils/suppress-logs.js.map +1 -0
- package/dist/cli/tui/verify-suggestions.d.ts +5 -0
- package/dist/cli/tui/verify-suggestions.d.ts.map +1 -0
- package/dist/cli/tui/verify-suggestions.js +20 -0
- package/dist/cli/tui/verify-suggestions.js.map +1 -0
- package/dist/cli/tui/verify.d.ts +14 -0
- package/dist/cli/tui/verify.d.ts.map +1 -0
- package/dist/cli/tui/verify.js +101 -0
- package/dist/cli/tui/verify.js.map +1 -0
- package/dist/cli/tui/version.d.ts +2 -0
- package/dist/cli/tui/version.d.ts.map +1 -0
- package/dist/cli/tui/version.js +14 -0
- package/dist/cli/tui/version.js.map +1 -0
- package/dist/cli/uninstall.d.ts +2 -0
- package/dist/cli/uninstall.d.ts.map +1 -0
- package/dist/cli/uninstall.js +57 -0
- package/dist/cli/uninstall.js.map +1 -0
- package/dist/cli/warmup.d.ts +10 -2
- package/dist/cli/warmup.d.ts.map +1 -1
- package/dist/cli/warmup.js +226 -93
- package/dist/cli/warmup.js.map +1 -1
- package/dist/config.d.ts +28 -2
- package/dist/config.d.ts.map +1 -1
- package/dist/config.js +106 -56
- package/dist/config.js.map +1 -1
- package/dist/crawl/crawler.d.ts +6 -0
- package/dist/crawl/crawler.d.ts.map +1 -1
- package/dist/crawl/crawler.js +210 -209
- package/dist/crawl/crawler.js.map +1 -1
- package/dist/crawl/dedup.d.ts +1 -0
- package/dist/crawl/dedup.d.ts.map +1 -1
- package/dist/crawl/dedup.js +124 -81
- package/dist/crawl/dedup.js.map +1 -1
- package/dist/crawl/etag-incremental.d.ts +43 -0
- package/dist/crawl/etag-incremental.d.ts.map +1 -0
- package/dist/crawl/etag-incremental.js +94 -0
- package/dist/crawl/etag-incremental.js.map +1 -0
- package/dist/crawl/index-to-vec.d.ts +10 -0
- package/dist/crawl/index-to-vec.d.ts.map +1 -0
- package/dist/crawl/index-to-vec.js +44 -0
- package/dist/crawl/index-to-vec.js.map +1 -0
- package/dist/crawl/mapper.js +136 -164
- package/dist/crawl/mapper.js.map +1 -1
- package/dist/crawl/rate-limiter.js +63 -66
- package/dist/crawl/rate-limiter.js.map +1 -1
- package/dist/crawl/robots.js +58 -57
- package/dist/crawl/robots.js.map +1 -1
- package/dist/crawl/sitemap-first.d.ts +12 -0
- package/dist/crawl/sitemap-first.d.ts.map +1 -0
- package/dist/crawl/sitemap-first.js +47 -0
- package/dist/crawl/sitemap-first.js.map +1 -0
- package/dist/crawl/sitemap.js +33 -32
- package/dist/crawl/sitemap.js.map +1 -1
- package/dist/crawl/url-utils.d.ts +1 -0
- package/dist/crawl/url-utils.d.ts.map +1 -1
- package/dist/crawl/url-utils.js +49 -37
- package/dist/crawl/url-utils.js.map +1 -1
- package/dist/daemon/health-check.d.ts +16 -0
- package/dist/daemon/health-check.d.ts.map +1 -0
- package/dist/daemon/health-check.js +33 -0
- package/dist/daemon/health-check.js.map +1 -0
- package/dist/daemon/http-server.d.ts +26 -0
- package/dist/daemon/http-server.d.ts.map +1 -0
- package/dist/daemon/http-server.js +275 -0
- package/dist/daemon/http-server.js.map +1 -0
- package/dist/daemon/proxy.d.ts +10 -0
- package/dist/daemon/proxy.d.ts.map +1 -0
- package/dist/daemon/proxy.js +93 -0
- package/dist/daemon/proxy.js.map +1 -0
- package/dist/embedding/embed.d.ts +59 -0
- package/dist/embedding/embed.d.ts.map +1 -0
- package/dist/embedding/embed.js +233 -0
- package/dist/embedding/embed.js.map +1 -0
- package/dist/embedding/fastembed-provider.d.ts +19 -0
- package/dist/embedding/fastembed-provider.d.ts.map +1 -0
- package/dist/embedding/fastembed-provider.js +51 -0
- package/dist/embedding/fastembed-provider.js.map +1 -0
- package/dist/embedding/key-terms.d.ts +12 -0
- package/dist/embedding/key-terms.d.ts.map +1 -0
- package/dist/embedding/key-terms.js +234 -0
- package/dist/embedding/key-terms.js.map +1 -0
- package/dist/extraction/boilerplate.d.ts +15 -0
- package/dist/extraction/boilerplate.d.ts.map +1 -0
- package/dist/extraction/boilerplate.js +52 -0
- package/dist/extraction/boilerplate.js.map +1 -0
- package/dist/extraction/defuddle.d.ts.map +1 -1
- package/dist/extraction/defuddle.js +27 -23
- package/dist/extraction/defuddle.js.map +1 -1
- package/dist/extraction/extract.d.ts.map +1 -1
- package/dist/extraction/extract.js +76 -76
- package/dist/extraction/extract.js.map +1 -1
- package/dist/extraction/jsonld.js +50 -54
- package/dist/extraction/jsonld.js.map +1 -1
- package/dist/extraction/lang-hints.d.ts +2 -0
- package/dist/extraction/lang-hints.d.ts.map +1 -0
- package/dist/extraction/lang-hints.js +30 -0
- package/dist/extraction/lang-hints.js.map +1 -0
- package/dist/extraction/llm-fallback.d.ts +17 -0
- package/dist/extraction/llm-fallback.d.ts.map +1 -0
- package/dist/extraction/llm-fallback.js +130 -0
- package/dist/extraction/llm-fallback.js.map +1 -0
- package/dist/extraction/markdown-sanitize.d.ts +2 -0
- package/dist/extraction/markdown-sanitize.d.ts.map +1 -0
- package/dist/extraction/markdown-sanitize.js +151 -0
- package/dist/extraction/markdown-sanitize.js.map +1 -0
- package/dist/extraction/markdown.d.ts +11 -0
- package/dist/extraction/markdown.d.ts.map +1 -1
- package/dist/extraction/markdown.js +195 -91
- package/dist/extraction/markdown.js.map +1 -1
- package/dist/extraction/pipeline.d.ts +8 -0
- package/dist/extraction/pipeline.d.ts.map +1 -1
- package/dist/extraction/pipeline.js +57 -91
- package/dist/extraction/pipeline.js.map +1 -1
- package/dist/extraction/readability.d.ts +1 -1
- package/dist/extraction/readability.d.ts.map +1 -1
- package/dist/extraction/readability.js +28 -29
- package/dist/extraction/readability.js.map +1 -1
- package/dist/extraction/schema.d.ts +12 -0
- package/dist/extraction/schema.d.ts.map +1 -1
- package/dist/extraction/schema.js +135 -72
- package/dist/extraction/schema.js.map +1 -1
- package/dist/extraction/site-extractors/docs-generic.d.ts.map +1 -1
- package/dist/extraction/site-extractors/docs-generic.js +81 -91
- package/dist/extraction/site-extractors/docs-generic.js.map +1 -1
- package/dist/extraction/site-extractors/github.d.ts.map +1 -1
- package/dist/extraction/site-extractors/github.js +87 -95
- package/dist/extraction/site-extractors/github.js.map +1 -1
- package/dist/extraction/site-extractors/mdn.d.ts.map +1 -1
- package/dist/extraction/site-extractors/mdn.js +46 -54
- package/dist/extraction/site-extractors/mdn.js.map +1 -1
- package/dist/extraction/site-extractors/stackoverflow.d.ts.map +1 -1
- package/dist/extraction/site-extractors/stackoverflow.js +71 -80
- package/dist/extraction/site-extractors/stackoverflow.js.map +1 -1
- package/dist/extraction/structured-data.d.ts +4 -0
- package/dist/extraction/structured-data.d.ts.map +1 -0
- package/dist/extraction/structured-data.js +173 -0
- package/dist/extraction/structured-data.js.map +1 -0
- package/dist/extraction/structured.d.ts +4 -0
- package/dist/extraction/structured.d.ts.map +1 -0
- package/dist/extraction/structured.js +163 -0
- package/dist/extraction/structured.js.map +1 -0
- package/dist/extraction/v1/classifier.d.ts +3 -0
- package/dist/extraction/v1/classifier.d.ts.map +1 -0
- package/dist/extraction/v1/classifier.js +110 -0
- package/dist/extraction/v1/classifier.js.map +1 -0
- package/dist/extraction/v1/extract-provider.d.ts +16 -0
- package/dist/extraction/v1/extract-provider.d.ts.map +1 -0
- package/dist/extraction/v1/extract-provider.js +43 -0
- package/dist/extraction/v1/extract-provider.js.map +1 -0
- package/dist/extraction/v1/local-llm.d.ts +8 -0
- package/dist/extraction/v1/local-llm.d.ts.map +1 -0
- package/dist/extraction/v1/local-llm.js +34 -0
- package/dist/extraction/v1/local-llm.js.map +1 -0
- package/dist/extraction/v1/news.d.ts +3 -0
- package/dist/extraction/v1/news.d.ts.map +1 -0
- package/dist/extraction/v1/news.js +61 -0
- package/dist/extraction/v1/news.js.map +1 -0
- package/dist/extraction/v1/product.d.ts +3 -0
- package/dist/extraction/v1/product.d.ts.map +1 -0
- package/dist/extraction/v1/product.js +166 -0
- package/dist/extraction/v1/product.js.map +1 -0
- package/dist/extraction/v1/recipe.d.ts +3 -0
- package/dist/extraction/v1/recipe.d.ts.map +1 -0
- package/dist/extraction/v1/recipe.js +136 -0
- package/dist/extraction/v1/recipe.js.map +1 -0
- package/dist/extraction/v1/routed.d.ts +17 -0
- package/dist/extraction/v1/routed.d.ts.map +1 -0
- package/dist/extraction/v1/routed.js +68 -0
- package/dist/extraction/v1/routed.js.map +1 -0
- package/dist/extraction/v1/schemas/Article.d.ts +11 -0
- package/dist/extraction/v1/schemas/Article.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Article.js +23 -0
- package/dist/extraction/v1/schemas/Article.js.map +1 -0
- package/dist/extraction/v1/schemas/CodeSnippet.d.ts +9 -0
- package/dist/extraction/v1/schemas/CodeSnippet.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/CodeSnippet.js +90 -0
- package/dist/extraction/v1/schemas/CodeSnippet.js.map +1 -0
- package/dist/extraction/v1/schemas/EventListing.d.ts +10 -0
- package/dist/extraction/v1/schemas/EventListing.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/EventListing.js +122 -0
- package/dist/extraction/v1/schemas/EventListing.js.map +1 -0
- package/dist/extraction/v1/schemas/Paper.d.ts +10 -0
- package/dist/extraction/v1/schemas/Paper.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Paper.js +156 -0
- package/dist/extraction/v1/schemas/Paper.js.map +1 -0
- package/dist/extraction/v1/schemas/Product.d.ts +17 -0
- package/dist/extraction/v1/schemas/Product.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Product.js +149 -0
- package/dist/extraction/v1/schemas/Product.js.map +1 -0
- package/dist/extraction/v1/schemas/Recipe.d.ts +14 -0
- package/dist/extraction/v1/schemas/Recipe.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Recipe.js +160 -0
- package/dist/extraction/v1/schemas/Recipe.js.map +1 -0
- package/dist/extraction/v1/schemas/index.d.ts +13 -0
- package/dist/extraction/v1/schemas/index.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/index.js +44 -0
- package/dist/extraction/v1/schemas/index.js.map +1 -0
- package/dist/extraction/v1/site-extractors.d.ts +5 -0
- package/dist/extraction/v1/site-extractors.d.ts.map +1 -0
- package/dist/extraction/v1/site-extractors.js +31 -0
- package/dist/extraction/v1/site-extractors.js.map +1 -0
- package/dist/fetch/action-executor.d.ts +28 -0
- package/dist/fetch/action-executor.d.ts.map +1 -0
- package/dist/fetch/action-executor.js +88 -0
- package/dist/fetch/action-executor.js.map +1 -0
- package/dist/fetch/auth.d.ts +2 -1
- package/dist/fetch/auth.d.ts.map +1 -1
- package/dist/fetch/auth.js +56 -26
- package/dist/fetch/auth.js.map +1 -1
- package/dist/fetch/browser-pool.d.ts +30 -11
- package/dist/fetch/browser-pool.d.ts.map +1 -1
- package/dist/fetch/browser-pool.js +303 -127
- package/dist/fetch/browser-pool.js.map +1 -1
- package/dist/fetch/browser-selector.d.ts +17 -0
- package/dist/fetch/browser-selector.d.ts.map +1 -0
- package/dist/fetch/browser-selector.js +72 -0
- package/dist/fetch/browser-selector.js.map +1 -0
- package/dist/fetch/browser-types.d.ts +3 -0
- package/dist/fetch/browser-types.d.ts.map +1 -0
- package/dist/fetch/browser-types.js +45 -0
- package/dist/fetch/browser-types.js.map +1 -0
- package/dist/fetch/cdp-client.d.ts +9 -0
- package/dist/fetch/cdp-client.d.ts.map +1 -0
- package/dist/fetch/cdp-client.js +89 -0
- package/dist/fetch/cdp-client.js.map +1 -0
- package/dist/fetch/content-check.js +39 -46
- package/dist/fetch/content-check.js.map +1 -1
- package/dist/fetch/error-describe.d.ts +7 -0
- package/dist/fetch/error-describe.d.ts.map +1 -0
- package/dist/fetch/error-describe.js +37 -0
- package/dist/fetch/error-describe.js.map +1 -0
- package/dist/fetch/http-client.d.ts +4 -0
- package/dist/fetch/http-client.d.ts.map +1 -1
- package/dist/fetch/http-client.js +147 -128
- package/dist/fetch/http-client.js.map +1 -1
- package/dist/fetch/lightpanda.d.ts +28 -0
- package/dist/fetch/lightpanda.d.ts.map +1 -0
- package/dist/fetch/lightpanda.js +174 -0
- package/dist/fetch/lightpanda.js.map +1 -0
- package/dist/fetch/playwright-tier.d.ts +19 -0
- package/dist/fetch/playwright-tier.d.ts.map +1 -0
- package/dist/fetch/playwright-tier.js +76 -0
- package/dist/fetch/playwright-tier.js.map +1 -0
- package/dist/fetch/router.d.ts +49 -3
- package/dist/fetch/router.d.ts.map +1 -1
- package/dist/fetch/router.js +187 -81
- package/dist/fetch/router.js.map +1 -1
- package/dist/index.js +102 -17
- package/dist/index.js.map +1 -1
- package/dist/instructions.d.ts +31 -0
- package/dist/instructions.d.ts.map +1 -0
- package/dist/instructions.js +245 -0
- package/dist/instructions.js.map +1 -0
- package/dist/integrations/cloud/llm/anthropic.d.ts +3 -0
- package/dist/integrations/cloud/llm/anthropic.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/anthropic.js +41 -0
- package/dist/integrations/cloud/llm/anthropic.js.map +1 -0
- package/dist/integrations/cloud/llm/cache.d.ts +5 -0
- package/dist/integrations/cloud/llm/cache.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/cache.js +49 -0
- package/dist/integrations/cloud/llm/cache.js.map +1 -0
- package/dist/integrations/cloud/llm/gemini.d.ts +3 -0
- package/dist/integrations/cloud/llm/gemini.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/gemini.js +37 -0
- package/dist/integrations/cloud/llm/gemini.js.map +1 -0
- package/dist/integrations/cloud/llm/groq.d.ts +3 -0
- package/dist/integrations/cloud/llm/groq.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/groq.js +74 -0
- package/dist/integrations/cloud/llm/groq.js.map +1 -0
- package/dist/integrations/cloud/llm/hash.d.ts +3 -0
- package/dist/integrations/cloud/llm/hash.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/hash.js +26 -0
- package/dist/integrations/cloud/llm/hash.js.map +1 -0
- package/dist/integrations/cloud/llm/model-select.d.ts +5 -0
- package/dist/integrations/cloud/llm/model-select.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/model-select.js +32 -0
- package/dist/integrations/cloud/llm/model-select.js.map +1 -0
- package/dist/integrations/cloud/llm/openai.d.ts +3 -0
- package/dist/integrations/cloud/llm/openai.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/openai.js +43 -0
- package/dist/integrations/cloud/llm/openai.js.map +1 -0
- package/dist/integrations/cloud/llm/run.d.ts +27 -0
- package/dist/integrations/cloud/llm/run.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/run.js +99 -0
- package/dist/integrations/cloud/llm/run.js.map +1 -0
- package/dist/integrations/cloud/llm/select.d.ts +5 -0
- package/dist/integrations/cloud/llm/select.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/select.js +30 -0
- package/dist/integrations/cloud/llm/select.js.map +1 -0
- package/dist/integrations/cloud/llm/text-adapters.d.ts +19 -0
- package/dist/integrations/cloud/llm/text-adapters.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/text-adapters.js +103 -0
- package/dist/integrations/cloud/llm/text-adapters.js.map +1 -0
- package/dist/integrations/cloud/llm/types.d.ts +24 -0
- package/dist/integrations/cloud/llm/types.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/types.js +1 -0
- package/dist/integrations/cloud/llm/types.js.map +1 -0
- package/dist/integrations/cloud/llm/validate.d.ts +6 -0
- package/dist/integrations/cloud/llm/validate.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/validate.js +63 -0
- package/dist/integrations/cloud/llm/validate.js.map +1 -0
- package/dist/logger.d.ts +4 -1
- package/dist/logger.d.ts.map +1 -1
- package/dist/logger.js +71 -30
- package/dist/logger.js.map +1 -1
- package/dist/pdf-parse.d.js +1 -0
- package/dist/pdf-parse.d.js.map +1 -0
- package/dist/plugins/loader.d.ts +20 -0
- package/dist/plugins/loader.d.ts.map +1 -0
- package/dist/plugins/loader.js +157 -0
- package/dist/plugins/loader.js.map +1 -0
- package/dist/plugins/registry.d.ts +26 -0
- package/dist/plugins/registry.d.ts.map +1 -0
- package/dist/plugins/registry.js +71 -0
- package/dist/plugins/registry.js.map +1 -0
- package/dist/plugins/validate.d.ts +9 -0
- package/dist/plugins/validate.d.ts.map +1 -0
- package/dist/plugins/validate.js +79 -0
- package/dist/plugins/validate.js.map +1 -0
- package/dist/providers/embed-provider.d.ts +11 -0
- package/dist/providers/embed-provider.d.ts.map +1 -0
- package/dist/providers/embed-provider.js +24 -0
- package/dist/providers/embed-provider.js.map +1 -0
- package/dist/providers/extract-provider.d.ts +23 -0
- package/dist/providers/extract-provider.d.ts.map +1 -0
- package/dist/providers/extract-provider.js +25 -0
- package/dist/providers/extract-provider.js.map +1 -0
- package/dist/providers/rerank-provider.d.ts +17 -0
- package/dist/providers/rerank-provider.d.ts.map +1 -0
- package/dist/providers/rerank-provider.js +41 -0
- package/dist/providers/rerank-provider.js.map +1 -0
- package/dist/providers/search-provider.d.ts +25 -0
- package/dist/providers/search-provider.d.ts.map +1 -0
- package/dist/providers/search-provider.js +44 -0
- package/dist/providers/search-provider.js.map +1 -0
- package/dist/providers/vector-store.d.ts +27 -0
- package/dist/providers/vector-store.d.ts.map +1 -0
- package/dist/providers/vector-store.js +27 -0
- package/dist/providers/vector-store.js.map +1 -0
- package/dist/python-env.d.ts +9 -0
- package/dist/python-env.d.ts.map +1 -0
- package/dist/python-env.js +13 -0
- package/dist/python-env.js.map +1 -0
- package/dist/repl/commands/agent.d.ts +5 -0
- package/dist/repl/commands/agent.d.ts.map +1 -0
- package/dist/repl/commands/agent.js +62 -0
- package/dist/repl/commands/agent.js.map +1 -0
- package/dist/repl/commands/cache.d.ts +4 -0
- package/dist/repl/commands/cache.d.ts.map +1 -0
- package/dist/repl/commands/cache.js +43 -0
- package/dist/repl/commands/cache.js.map +1 -0
- package/dist/repl/commands/crawl.d.ts +7 -0
- package/dist/repl/commands/crawl.d.ts.map +1 -0
- package/dist/repl/commands/crawl.js +44 -0
- package/dist/repl/commands/crawl.js.map +1 -0
- package/dist/repl/commands/extract.d.ts +5 -0
- package/dist/repl/commands/extract.d.ts.map +1 -0
- package/dist/repl/commands/extract.js +47 -0
- package/dist/repl/commands/extract.js.map +1 -0
- package/dist/repl/commands/fetch.d.ts +5 -0
- package/dist/repl/commands/fetch.d.ts.map +1 -0
- package/dist/repl/commands/fetch.js +67 -0
- package/dist/repl/commands/fetch.js.map +1 -0
- package/dist/repl/commands/find-similar.d.ts +5 -0
- package/dist/repl/commands/find-similar.d.ts.map +1 -0
- package/dist/repl/commands/find-similar.js +74 -0
- package/dist/repl/commands/find-similar.js.map +1 -0
- package/dist/repl/commands/research.d.ts +5 -0
- package/dist/repl/commands/research.d.ts.map +1 -0
- package/dist/repl/commands/research.js +65 -0
- package/dist/repl/commands/research.js.map +1 -0
- package/dist/repl/commands/search.d.ts +5 -0
- package/dist/repl/commands/search.d.ts.map +1 -0
- package/dist/repl/commands/search.js +74 -0
- package/dist/repl/commands/search.js.map +1 -0
- package/dist/repl/commands/types.d.ts +9 -0
- package/dist/repl/commands/types.d.ts.map +1 -0
- package/dist/repl/commands/types.js +1 -0
- package/dist/repl/commands/types.js.map +1 -0
- package/dist/repl/formatters.d.ts +13 -0
- package/dist/repl/formatters.d.ts.map +1 -0
- package/dist/repl/formatters.js +283 -0
- package/dist/repl/formatters.js.map +1 -0
- package/dist/repl/parser.d.ts +9 -0
- package/dist/repl/parser.d.ts.map +1 -0
- package/dist/repl/parser.js +86 -0
- package/dist/repl/parser.js.map +1 -0
- package/dist/repl/shell.d.ts +8 -0
- package/dist/repl/shell.d.ts.map +1 -0
- package/dist/repl/shell.js +184 -0
- package/dist/repl/shell.js.map +1 -0
- package/dist/research/branch-exploration.d.ts +14 -0
- package/dist/research/branch-exploration.d.ts.map +1 -0
- package/dist/research/branch-exploration.js +100 -0
- package/dist/research/branch-exploration.js.map +1 -0
- package/dist/research/brief.d.ts +6 -0
- package/dist/research/brief.d.ts.map +1 -0
- package/dist/research/brief.js +246 -0
- package/dist/research/brief.js.map +1 -0
- package/dist/research/citation-graph.d.ts +9 -0
- package/dist/research/citation-graph.d.ts.map +1 -0
- package/dist/research/citation-graph.js +114 -0
- package/dist/research/citation-graph.js.map +1 -0
- package/dist/research/decompose.d.ts +14 -0
- package/dist/research/decompose.d.ts.map +1 -0
- package/dist/research/decompose.js +439 -0
- package/dist/research/decompose.js.map +1 -0
- package/dist/research/pipeline.d.ts +5 -0
- package/dist/research/pipeline.d.ts.map +1 -0
- package/dist/research/pipeline.js +269 -0
- package/dist/research/pipeline.js.map +1 -0
- package/dist/research/synthesis-local.d.ts +19 -0
- package/dist/research/synthesis-local.d.ts.map +1 -0
- package/dist/research/synthesis-local.js +62 -0
- package/dist/research/synthesis-local.js.map +1 -0
- package/dist/research/synthesize.d.ts +10 -0
- package/dist/research/synthesize.d.ts.map +1 -0
- package/dist/research/synthesize.js +137 -0
- package/dist/research/synthesize.js.map +1 -0
- package/dist/search/answer-synthesis.d.ts +33 -0
- package/dist/search/answer-synthesis.d.ts.map +1 -0
- package/dist/search/answer-synthesis.js +244 -0
- package/dist/search/answer-synthesis.js.map +1 -0
- package/dist/search/context-formatter.d.ts +3 -0
- package/dist/search/context-formatter.d.ts.map +1 -0
- package/dist/search/context-formatter.js +56 -0
- package/dist/search/context-formatter.js.map +1 -0
- package/dist/search/dedup.d.ts +1 -0
- package/dist/search/dedup.d.ts.map +1 -1
- package/dist/search/dedup.js +40 -32
- package/dist/search/dedup.js.map +1 -1
- package/dist/search/engines/arxiv.d.ts +7 -0
- package/dist/search/engines/arxiv.d.ts.map +1 -0
- package/dist/search/engines/arxiv.js +70 -0
- package/dist/search/engines/arxiv.js.map +1 -0
- package/dist/search/engines/bing-news.d.ts +7 -0
- package/dist/search/engines/bing-news.d.ts.map +1 -0
- package/dist/search/engines/bing-news.js +97 -0
- package/dist/search/engines/bing-news.js.map +1 -0
- package/dist/search/engines/bing.d.ts +1 -0
- package/dist/search/engines/bing.d.ts.map +1 -1
- package/dist/search/engines/bing.js +100 -44
- package/dist/search/engines/bing.js.map +1 -1
- package/dist/search/engines/devdocs.d.ts +6 -0
- package/dist/search/engines/devdocs.d.ts.map +1 -0
- package/dist/search/engines/devdocs.js +56 -0
- package/dist/search/engines/devdocs.js.map +1 -0
- package/dist/search/engines/duckduckgo.d.ts.map +1 -1
- package/dist/search/engines/duckduckgo.js +56 -44
- package/dist/search/engines/duckduckgo.js.map +1 -1
- package/dist/search/engines/github-code.d.ts +7 -0
- package/dist/search/engines/github-code.d.ts.map +1 -0
- package/dist/search/engines/github-code.js +55 -0
- package/dist/search/engines/github-code.js.map +1 -0
- package/dist/search/engines/hn-algolia.d.ts +7 -0
- package/dist/search/engines/hn-algolia.d.ts.map +1 -0
- package/dist/search/engines/hn-algolia.js +76 -0
- package/dist/search/engines/hn-algolia.js.map +1 -0
- package/dist/search/engines/lobsters.d.ts +7 -0
- package/dist/search/engines/lobsters.d.ts.map +1 -0
- package/dist/search/engines/lobsters.js +83 -0
- package/dist/search/engines/lobsters.js.map +1 -0
- package/dist/search/engines/mdn.d.ts +7 -0
- package/dist/search/engines/mdn.d.ts.map +1 -0
- package/dist/search/engines/mdn.js +48 -0
- package/dist/search/engines/mdn.js.map +1 -0
- package/dist/search/engines/semantic-scholar.d.ts +7 -0
- package/dist/search/engines/semantic-scholar.d.ts.map +1 -0
- package/dist/search/engines/semantic-scholar.js +69 -0
- package/dist/search/engines/semantic-scholar.js.map +1 -0
- package/dist/search/engines/stackoverflow.d.ts +7 -0
- package/dist/search/engines/stackoverflow.d.ts.map +1 -0
- package/dist/search/engines/stackoverflow.js +73 -0
- package/dist/search/engines/stackoverflow.js.map +1 -0
- package/dist/search/engines/startpage.d.ts.map +1 -1
- package/dist/search/engines/startpage.js +65 -46
- package/dist/search/engines/startpage.js.map +1 -1
- package/dist/search/evidence.d.ts +25 -0
- package/dist/search/evidence.d.ts.map +1 -0
- package/dist/search/evidence.js +220 -0
- package/dist/search/evidence.js.map +1 -0
- package/dist/search/filters.d.ts.map +1 -1
- package/dist/search/filters.js +58 -54
- package/dist/search/filters.js.map +1 -1
- package/dist/search/find-similar/crawl-rank.d.ts +9 -0
- package/dist/search/find-similar/crawl-rank.d.ts.map +1 -0
- package/dist/search/find-similar/crawl-rank.js +272 -0
- package/dist/search/find-similar/crawl-rank.js.map +1 -0
- package/dist/search/find-similar/mode.d.ts +4 -0
- package/dist/search/find-similar/mode.d.ts.map +1 -0
- package/dist/search/find-similar/mode.js +12 -0
- package/dist/search/find-similar/mode.js.map +1 -0
- package/dist/search/find-similar.d.ts +5 -0
- package/dist/search/find-similar.d.ts.map +1 -0
- package/dist/search/find-similar.js +509 -0
- package/dist/search/find-similar.js.map +1 -0
- package/dist/search/highlights.d.ts +19 -0
- package/dist/search/highlights.d.ts.map +1 -0
- package/dist/search/highlights.js +167 -0
- package/dist/search/highlights.js.map +1 -0
- package/dist/search/language-filter.d.ts +29 -0
- package/dist/search/language-filter.d.ts.map +1 -0
- package/dist/search/language-filter.js +126 -0
- package/dist/search/language-filter.js.map +1 -0
- package/dist/search/legacy/searxng-orchestrator.d.ts +4 -0
- package/dist/search/legacy/searxng-orchestrator.d.ts.map +1 -0
- package/dist/search/legacy/searxng-orchestrator.js +501 -0
- package/dist/search/legacy/searxng-orchestrator.js.map +1 -0
- package/dist/search/legacy/searxng-provider.d.ts +7 -0
- package/dist/search/legacy/searxng-provider.d.ts.map +1 -0
- package/dist/search/legacy/searxng-provider.js +11 -0
- package/dist/search/legacy/searxng-provider.js.map +1 -0
- package/dist/search/multi-query.d.ts +25 -0
- package/dist/search/multi-query.d.ts.map +1 -0
- package/dist/search/multi-query.js +228 -0
- package/dist/search/multi-query.js.map +1 -0
- package/dist/search/query.js +32 -34
- package/dist/search/query.js.map +1 -1
- package/dist/search/rerank.d.ts +3 -1
- package/dist/search/rerank.d.ts.map +1 -1
- package/dist/search/rerank.js +44 -35
- package/dist/search/rerank.js.map +1 -1
- package/dist/search/reranker/authority-boost.d.ts +3 -0
- package/dist/search/reranker/authority-boost.d.ts.map +1 -0
- package/dist/search/reranker/authority-boost.js +179 -0
- package/dist/search/reranker/authority-boost.js.map +1 -0
- package/dist/search/reranker/consensus-boost.d.ts +3 -0
- package/dist/search/reranker/consensus-boost.d.ts.map +1 -0
- package/dist/search/reranker/consensus-boost.js +27 -0
- package/dist/search/reranker/consensus-boost.js.map +1 -0
- package/dist/search/reranker/recency-boost.d.ts +3 -0
- package/dist/search/reranker/recency-boost.d.ts.map +1 -0
- package/dist/search/reranker/recency-boost.js +13 -0
- package/dist/search/reranker/recency-boost.js.map +1 -0
- package/dist/search/reranker/recency.d.ts +3 -0
- package/dist/search/reranker/recency.d.ts.map +1 -0
- package/dist/search/reranker/recency.js +23 -0
- package/dist/search/reranker/recency.js.map +1 -0
- package/dist/search/reranker/transformers-rerank-provider.d.ts +13 -0
- package/dist/search/reranker/transformers-rerank-provider.d.ts.map +1 -0
- package/dist/search/reranker/transformers-rerank-provider.js +94 -0
- package/dist/search/reranker/transformers-rerank-provider.js.map +1 -0
- package/dist/search/rrf.d.ts +17 -0
- package/dist/search/rrf.d.ts.map +1 -0
- package/dist/search/rrf.js +39 -0
- package/dist/search/rrf.js.map +1 -0
- package/dist/search/sampling.d.ts +25 -0
- package/dist/search/sampling.d.ts.map +1 -0
- package/dist/search/sampling.js +52 -0
- package/dist/search/sampling.js.map +1 -0
- package/dist/search/searxng.d.ts.map +1 -1
- package/dist/search/searxng.js +69 -79
- package/dist/search/searxng.js.map +1 -1
- package/dist/search/tokens.d.ts +3 -0
- package/dist/search/tokens.d.ts.map +1 -0
- package/dist/search/tokens.js +39 -0
- package/dist/search/tokens.js.map +1 -0
- package/dist/search/truncate.d.ts +6 -0
- package/dist/search/truncate.d.ts.map +1 -0
- package/dist/search/truncate.js +26 -0
- package/dist/search/truncate.js.map +1 -0
- package/dist/search/url-unwrap.d.ts +3 -0
- package/dist/search/url-unwrap.d.ts.map +1 -0
- package/dist/search/url-unwrap.js +43 -0
- package/dist/search/url-unwrap.js.map +1 -0
- package/dist/search/v1/context-rank.d.ts +13 -0
- package/dist/search/v1/context-rank.d.ts.map +1 -0
- package/dist/search/v1/context-rank.js +74 -0
- package/dist/search/v1/context-rank.js.map +1 -0
- package/dist/search/v1/engine-base.d.ts +27 -0
- package/dist/search/v1/engine-base.d.ts.map +1 -0
- package/dist/search/v1/engine-base.js +110 -0
- package/dist/search/v1/engine-base.js.map +1 -0
- package/dist/search/v1/intent-router.d.ts +22 -0
- package/dist/search/v1/intent-router.d.ts.map +1 -0
- package/dist/search/v1/intent-router.js +138 -0
- package/dist/search/v1/intent-router.js.map +1 -0
- package/dist/search/v1/orchestrator.d.ts +24 -0
- package/dist/search/v1/orchestrator.d.ts.map +1 -0
- package/dist/search/v1/orchestrator.js +163 -0
- package/dist/search/v1/orchestrator.js.map +1 -0
- package/dist/search/v1/recency-boost.d.ts +9 -0
- package/dist/search/v1/recency-boost.d.ts.map +1 -0
- package/dist/search/v1/recency-boost.js +37 -0
- package/dist/search/v1/recency-boost.js.map +1 -0
- package/dist/search/v1/recent-cache-dedup.d.ts +6 -0
- package/dist/search/v1/recent-cache-dedup.d.ts.map +1 -0
- package/dist/search/v1/recent-cache-dedup.js +85 -0
- package/dist/search/v1/recent-cache-dedup.js.map +1 -0
- package/dist/search/v1/rss/feed-config.d.ts +21 -0
- package/dist/search/v1/rss/feed-config.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-config.js +90 -0
- package/dist/search/v1/rss/feed-config.js.map +1 -0
- package/dist/search/v1/rss/feed-parser.d.ts +14 -0
- package/dist/search/v1/rss/feed-parser.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-parser.js +104 -0
- package/dist/search/v1/rss/feed-parser.js.map +1 -0
- package/dist/search/v1/rss/feed-poller.d.ts +22 -0
- package/dist/search/v1/rss/feed-poller.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-poller.js +102 -0
- package/dist/search/v1/rss/feed-poller.js.map +1 -0
- package/dist/search/v1/rss/feed-store.d.ts +30 -0
- package/dist/search/v1/rss/feed-store.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-store.js +134 -0
- package/dist/search/v1/rss/feed-store.js.map +1 -0
- package/dist/search/v1/rss/rss-engine.d.ts +6 -0
- package/dist/search/v1/rss/rss-engine.d.ts.map +1 -0
- package/dist/search/v1/rss/rss-engine.js +28 -0
- package/dist/search/v1/rss/rss-engine.js.map +1 -0
- package/dist/search/v1/v1-provider.d.ts +7 -0
- package/dist/search/v1/v1-provider.d.ts.map +1 -0
- package/dist/search/v1/v1-provider.js +68 -0
- package/dist/search/v1/v1-provider.js.map +1 -0
- package/dist/search/v1/verticals/code.d.ts +4 -0
- package/dist/search/v1/verticals/code.d.ts.map +1 -0
- package/dist/search/v1/verticals/code.js +20 -0
- package/dist/search/v1/verticals/code.js.map +1 -0
- package/dist/search/v1/verticals/docs.d.ts +4 -0
- package/dist/search/v1/verticals/docs.d.ts.map +1 -0
- package/dist/search/v1/verticals/docs.js +20 -0
- package/dist/search/v1/verticals/docs.js.map +1 -0
- package/dist/search/v1/verticals/general.d.ts +4 -0
- package/dist/search/v1/verticals/general.d.ts.map +1 -0
- package/dist/search/v1/verticals/general.js +22 -0
- package/dist/search/v1/verticals/general.js.map +1 -0
- package/dist/search/v1/verticals/news.d.ts +10 -0
- package/dist/search/v1/verticals/news.d.ts.map +1 -0
- package/dist/search/v1/verticals/news.js +52 -0
- package/dist/search/v1/verticals/news.js.map +1 -0
- package/dist/search/v1/verticals/papers.d.ts +4 -0
- package/dist/search/v1/verticals/papers.d.ts.map +1 -0
- package/dist/search/v1/verticals/papers.js +23 -0
- package/dist/search/v1/verticals/papers.js.map +1 -0
- package/dist/search/validator.js +31 -31
- package/dist/search/validator.js.map +1 -1
- package/dist/searxng/bootstrap.d.ts +30 -0
- package/dist/searxng/bootstrap.d.ts.map +1 -1
- package/dist/searxng/bootstrap.js +223 -85
- package/dist/searxng/bootstrap.js.map +1 -1
- package/dist/searxng/docker.d.ts.map +1 -1
- package/dist/searxng/docker.js +69 -60
- package/dist/searxng/docker.js.map +1 -1
- package/dist/searxng/process.d.ts +13 -1
- package/dist/searxng/process.d.ts.map +1 -1
- package/dist/searxng/process.js +231 -164
- package/dist/searxng/process.js.map +1 -1
- package/dist/server/backend-status.d.ts +13 -0
- package/dist/server/backend-status.d.ts.map +1 -0
- package/dist/server/backend-status.js +40 -0
- package/dist/server/backend-status.js.map +1 -0
- package/dist/server/tool-schemas.d.ts +549 -0
- package/dist/server/tool-schemas.d.ts.map +1 -0
- package/dist/server/tool-schemas.js +464 -0
- package/dist/server/tool-schemas.js.map +1 -0
- package/dist/server/warmup-on-start.d.ts +9 -0
- package/dist/server/warmup-on-start.d.ts.map +1 -0
- package/dist/server/warmup-on-start.js +55 -0
- package/dist/server/warmup-on-start.js.map +1 -0
- package/dist/server.d.ts +17 -0
- package/dist/server.d.ts.map +1 -1
- package/dist/server.js +454 -297
- package/dist/server.js.map +1 -1
- package/dist/tools/agent.d.ts +5 -0
- package/dist/tools/agent.d.ts.map +1 -0
- package/dist/tools/agent.js +128 -0
- package/dist/tools/agent.js.map +1 -0
- package/dist/tools/cache.d.ts +2 -1
- package/dist/tools/cache.d.ts.map +1 -1
- package/dist/tools/cache.js +177 -44
- package/dist/tools/cache.js.map +1 -1
- package/dist/tools/crawl.d.ts.map +1 -1
- package/dist/tools/crawl.js +171 -88
- package/dist/tools/crawl.js.map +1 -1
- package/dist/tools/extract.d.ts +2 -2
- package/dist/tools/extract.d.ts.map +1 -1
- package/dist/tools/extract.js +175 -59
- package/dist/tools/extract.js.map +1 -1
- package/dist/tools/fetch.d.ts +2 -2
- package/dist/tools/fetch.d.ts.map +1 -1
- package/dist/tools/fetch.js +174 -68
- package/dist/tools/fetch.js.map +1 -1
- package/dist/tools/find-similar.d.ts +5 -0
- package/dist/tools/find-similar.d.ts.map +1 -0
- package/dist/tools/find-similar.js +127 -0
- package/dist/tools/find-similar.js.map +1 -0
- package/dist/tools/research.d.ts +5 -0
- package/dist/tools/research.d.ts.map +1 -0
- package/dist/tools/research.js +107 -0
- package/dist/tools/research.js.map +1 -0
- package/dist/tools/search.d.ts +10 -2
- package/dist/tools/search.d.ts.map +1 -1
- package/dist/tools/search.js +13 -158
- package/dist/tools/search.js.map +1 -1
- package/dist/types.d.ts +350 -7
- package/dist/types.d.ts.map +1 -1
- package/dist/types.js +6 -1
- package/dist/types.js.map +1 -1
- package/dist/util/mode.d.ts +4 -0
- package/dist/util/mode.d.ts.map +1 -0
- package/dist/util/mode.js +34 -0
- package/dist/util/mode.js.map +1 -0
- package/package.json +78 -8
- package/dist/extraction/trafilatura.d.ts +0 -6
- package/dist/extraction/trafilatura.d.ts.map +0 -1
- package/dist/extraction/trafilatura.js +0 -105
- package/dist/extraction/trafilatura.js.map +0 -1
- package/dist/search/flashrank.d.ts +0 -12
- package/dist/search/flashrank.d.ts.map +0 -1
- package/dist/search/flashrank.js +0 -63
- package/dist/search/flashrank.js.map +0 -1
|
@@ -0,0 +1,272 @@
|
|
|
1
|
+
import { getExtractProvider } from "../../providers/extract-provider.js";
|
|
2
|
+
import { getEmbedProvider } from "../../providers/embed-provider.js";
|
|
3
|
+
import { createLogger } from "../../logger.js";
|
|
4
|
+
const log = createLogger("search");
|
|
5
|
+
const DEFAULT_MAX_PAGES = 20;
|
|
6
|
+
const DEFAULT_CONCURRENCY = 4;
|
|
7
|
+
const DEFAULT_FETCH_TIMEOUT_MS = 1e4;
|
|
8
|
+
const DEFAULT_MAX_RESULTS = 10;
|
|
9
|
+
const SEED_TEXT_CHARS = 500;
|
|
10
|
+
async function crawlRank(seedUrl, input, router, options = {}) {
|
|
11
|
+
const start = Date.now();
|
|
12
|
+
const maxPages = options.maxPages ?? DEFAULT_MAX_PAGES;
|
|
13
|
+
const concurrency = options.concurrency ?? DEFAULT_CONCURRENCY;
|
|
14
|
+
const fetchTimeoutMs = options.fetchTimeoutMs ?? DEFAULT_FETCH_TIMEOUT_MS;
|
|
15
|
+
const maxResults = input.max_results ?? DEFAULT_MAX_RESULTS;
|
|
16
|
+
let seedHost;
|
|
17
|
+
try {
|
|
18
|
+
seedHost = new URL(seedUrl).hostname;
|
|
19
|
+
} catch {
|
|
20
|
+
return emptyOutput({
|
|
21
|
+
error: "Invalid seed URL",
|
|
22
|
+
embeddingAvailable: false,
|
|
23
|
+
elapsed: Date.now() - start
|
|
24
|
+
});
|
|
25
|
+
}
|
|
26
|
+
let seedRaw;
|
|
27
|
+
try {
|
|
28
|
+
seedRaw = await router.fetch(seedUrl, { renderJs: "auto" });
|
|
29
|
+
} catch (err) {
|
|
30
|
+
return emptyOutput({
|
|
31
|
+
error: `Seed fetch failed: ${err instanceof Error ? err.message : String(err)}`,
|
|
32
|
+
embeddingAvailable: false,
|
|
33
|
+
elapsed: Date.now() - start
|
|
34
|
+
});
|
|
35
|
+
}
|
|
36
|
+
if (!seedRaw || typeof seedRaw.statusCode !== "number" || seedRaw.statusCode < 200 || seedRaw.statusCode >= 300) {
|
|
37
|
+
return emptyOutput({
|
|
38
|
+
error: `Seed fetch failed: ${seedRaw?.statusCode ?? "unknown"}`,
|
|
39
|
+
embeddingAvailable: false,
|
|
40
|
+
elapsed: Date.now() - start
|
|
41
|
+
});
|
|
42
|
+
}
|
|
43
|
+
const extractor = await getExtractProvider();
|
|
44
|
+
const seedExtraction = await extractor.extract(seedRaw.html, seedRaw.finalUrl, {
|
|
45
|
+
contentType: seedRaw.contentType
|
|
46
|
+
});
|
|
47
|
+
const includeDomains = input.include_domains;
|
|
48
|
+
const excludeDomains = input.exclude_domains;
|
|
49
|
+
const allowedLinks = filterLinks(
|
|
50
|
+
seedExtraction.links ?? [],
|
|
51
|
+
seedHost,
|
|
52
|
+
includeDomains,
|
|
53
|
+
excludeDomains,
|
|
54
|
+
maxPages
|
|
55
|
+
);
|
|
56
|
+
let embedProvider;
|
|
57
|
+
let embeddingAvailable = false;
|
|
58
|
+
try {
|
|
59
|
+
embedProvider = await getEmbedProvider();
|
|
60
|
+
embeddingAvailable = true;
|
|
61
|
+
} catch (err) {
|
|
62
|
+
log.debug("embedding provider unavailable for crawl-rank", { error: String(err) });
|
|
63
|
+
embeddingAvailable = false;
|
|
64
|
+
}
|
|
65
|
+
if (allowedLinks.length === 0) {
|
|
66
|
+
return emptyOutput({
|
|
67
|
+
error: "No same-host links found from seed",
|
|
68
|
+
embeddingAvailable,
|
|
69
|
+
elapsed: Date.now() - start
|
|
70
|
+
});
|
|
71
|
+
}
|
|
72
|
+
if (!embeddingAvailable || !embedProvider) {
|
|
73
|
+
const degraded = degradedResults(allowedLinks, maxResults);
|
|
74
|
+
return {
|
|
75
|
+
results: degraded,
|
|
76
|
+
method: "fts5",
|
|
77
|
+
cache_hits: 0,
|
|
78
|
+
search_hits: degraded.length,
|
|
79
|
+
embedding_available: false,
|
|
80
|
+
error: "Embedding unavailable \u2014 returned link order",
|
|
81
|
+
total_time_ms: Date.now() - start
|
|
82
|
+
};
|
|
83
|
+
}
|
|
84
|
+
const fetched = await fetchPagesInChunks(
|
|
85
|
+
allowedLinks,
|
|
86
|
+
router,
|
|
87
|
+
extractor,
|
|
88
|
+
concurrency,
|
|
89
|
+
fetchTimeoutMs
|
|
90
|
+
);
|
|
91
|
+
if (fetched.length === 0) {
|
|
92
|
+
return emptyOutput({
|
|
93
|
+
error: "No linked pages could be fetched",
|
|
94
|
+
embeddingAvailable: true,
|
|
95
|
+
elapsed: Date.now() - start
|
|
96
|
+
});
|
|
97
|
+
}
|
|
98
|
+
const seedText = buildPageText(seedExtraction.title, seedExtraction.markdown);
|
|
99
|
+
const pageTexts = fetched.map((p) => p.text);
|
|
100
|
+
let vectors;
|
|
101
|
+
try {
|
|
102
|
+
vectors = await embedProvider.embed([seedText, ...pageTexts]);
|
|
103
|
+
} catch (err) {
|
|
104
|
+
log.warn("embedding batch failed; falling back to link order", { error: String(err) });
|
|
105
|
+
const degraded = degradedResults(allowedLinks, maxResults);
|
|
106
|
+
return {
|
|
107
|
+
results: degraded,
|
|
108
|
+
method: "fts5",
|
|
109
|
+
cache_hits: 0,
|
|
110
|
+
search_hits: degraded.length,
|
|
111
|
+
embedding_available: true,
|
|
112
|
+
error: `Embedding batch failed: ${err instanceof Error ? err.message : String(err)}`,
|
|
113
|
+
total_time_ms: Date.now() - start
|
|
114
|
+
};
|
|
115
|
+
}
|
|
116
|
+
const seedVec = vectors[0];
|
|
117
|
+
const pageVecs = vectors.slice(1);
|
|
118
|
+
const scored = fetched.map((page, i) => ({
|
|
119
|
+
page,
|
|
120
|
+
score: cosineSimilarity(seedVec, pageVecs[i])
|
|
121
|
+
}));
|
|
122
|
+
scored.sort((a, b) => b.score - a.score);
|
|
123
|
+
const final = scored.slice(0, maxResults).map(({ page, score }) => ({
|
|
124
|
+
url: page.url,
|
|
125
|
+
title: page.title,
|
|
126
|
+
markdown: page.markdown.slice(0, 5e3),
|
|
127
|
+
relevance_score: score,
|
|
128
|
+
source: "search",
|
|
129
|
+
match_signals: {
|
|
130
|
+
fused_score: score
|
|
131
|
+
}
|
|
132
|
+
}));
|
|
133
|
+
return {
|
|
134
|
+
results: final,
|
|
135
|
+
method: "embedding",
|
|
136
|
+
cache_hits: 0,
|
|
137
|
+
search_hits: final.length,
|
|
138
|
+
embedding_available: true,
|
|
139
|
+
total_time_ms: Date.now() - start
|
|
140
|
+
};
|
|
141
|
+
}
|
|
142
|
+
function filterLinks(links, seedHost, includeDomains, excludeDomains, maxPages) {
|
|
143
|
+
const allowOtherHosts = (includeDomains?.length ?? 0) > 0;
|
|
144
|
+
const seen = /* @__PURE__ */ new Set();
|
|
145
|
+
const out = [];
|
|
146
|
+
for (const raw of links) {
|
|
147
|
+
let parsed;
|
|
148
|
+
try {
|
|
149
|
+
parsed = new URL(raw);
|
|
150
|
+
} catch {
|
|
151
|
+
continue;
|
|
152
|
+
}
|
|
153
|
+
const host = parsed.hostname;
|
|
154
|
+
if (!allowOtherHosts && host !== seedHost) continue;
|
|
155
|
+
if (allowOtherHosts && host !== seedHost) {
|
|
156
|
+
const widened = includeDomains.some((d) => domainMatches(host, d));
|
|
157
|
+
if (!widened) continue;
|
|
158
|
+
}
|
|
159
|
+
if (excludeDomains && excludeDomains.some((d) => domainMatches(host, d))) continue;
|
|
160
|
+
const normalized = normalize(parsed);
|
|
161
|
+
if (seen.has(normalized)) continue;
|
|
162
|
+
seen.add(normalized);
|
|
163
|
+
out.push(parsed.toString());
|
|
164
|
+
if (out.length >= maxPages) break;
|
|
165
|
+
}
|
|
166
|
+
return out;
|
|
167
|
+
}
|
|
168
|
+
function domainMatches(host, pattern) {
|
|
169
|
+
const p = pattern.toLowerCase().replace(/^\*\./, "");
|
|
170
|
+
const h = host.toLowerCase();
|
|
171
|
+
return h === p || h.endsWith(`.${p}`);
|
|
172
|
+
}
|
|
173
|
+
function normalize(parsed) {
|
|
174
|
+
const copy = new URL(parsed.toString());
|
|
175
|
+
copy.hash = "";
|
|
176
|
+
return copy.toString().replace(/\/$/, "");
|
|
177
|
+
}
|
|
178
|
+
async function fetchPagesInChunks(urls, router, extractor, concurrency, fetchTimeoutMs) {
|
|
179
|
+
const out = [];
|
|
180
|
+
for (let i = 0; i < urls.length; i += concurrency) {
|
|
181
|
+
const chunk = urls.slice(i, i + concurrency);
|
|
182
|
+
const settled = await Promise.allSettled(
|
|
183
|
+
chunk.map(async (u) => {
|
|
184
|
+
const raw = await withTimeout(
|
|
185
|
+
router.fetch(u, { renderJs: "auto" }),
|
|
186
|
+
fetchTimeoutMs
|
|
187
|
+
);
|
|
188
|
+
if (!raw || typeof raw.statusCode !== "number" || raw.statusCode < 200 || raw.statusCode >= 300) {
|
|
189
|
+
throw new Error(`bad status: ${raw?.statusCode ?? "unknown"}`);
|
|
190
|
+
}
|
|
191
|
+
const ex = await extractor.extract(raw.html, raw.finalUrl, {
|
|
192
|
+
contentType: raw.contentType
|
|
193
|
+
});
|
|
194
|
+
return {
|
|
195
|
+
url: raw.finalUrl,
|
|
196
|
+
title: ex.title || raw.finalUrl,
|
|
197
|
+
markdown: ex.markdown ?? "",
|
|
198
|
+
text: buildPageText(ex.title, ex.markdown ?? "")
|
|
199
|
+
};
|
|
200
|
+
})
|
|
201
|
+
);
|
|
202
|
+
for (const r of settled) {
|
|
203
|
+
if (r.status === "fulfilled") out.push(r.value);
|
|
204
|
+
else log.debug("crawl-rank page fetch failed", { error: String(r.reason) });
|
|
205
|
+
}
|
|
206
|
+
}
|
|
207
|
+
return out;
|
|
208
|
+
}
|
|
209
|
+
function buildPageText(title, markdown) {
|
|
210
|
+
const t = (title ?? "").trim();
|
|
211
|
+
const body = (markdown ?? "").slice(0, SEED_TEXT_CHARS);
|
|
212
|
+
return t ? `${t}
|
|
213
|
+
${body}` : body;
|
|
214
|
+
}
|
|
215
|
+
function cosineSimilarity(a, b) {
|
|
216
|
+
if (!a || !b || a.length === 0 || b.length === 0) return 0;
|
|
217
|
+
const len = Math.min(a.length, b.length);
|
|
218
|
+
let dot = 0;
|
|
219
|
+
let normA = 0;
|
|
220
|
+
let normB = 0;
|
|
221
|
+
for (let i = 0; i < len; i++) {
|
|
222
|
+
dot += a[i] * b[i];
|
|
223
|
+
normA += a[i] * a[i];
|
|
224
|
+
normB += b[i] * b[i];
|
|
225
|
+
}
|
|
226
|
+
if (normA === 0 || normB === 0) return 0;
|
|
227
|
+
return dot / (Math.sqrt(normA) * Math.sqrt(normB));
|
|
228
|
+
}
|
|
229
|
+
function degradedResults(links, maxResults) {
|
|
230
|
+
const limited = links.slice(0, maxResults);
|
|
231
|
+
const n = limited.length;
|
|
232
|
+
return limited.map((url, i) => ({
|
|
233
|
+
url,
|
|
234
|
+
title: url,
|
|
235
|
+
markdown: "",
|
|
236
|
+
relevance_score: n > 0 ? 1 - i / n : 0,
|
|
237
|
+
source: "search",
|
|
238
|
+
match_signals: {
|
|
239
|
+
fused_score: n > 0 ? 1 - i / n : 0
|
|
240
|
+
}
|
|
241
|
+
}));
|
|
242
|
+
}
|
|
243
|
+
function withTimeout(p, ms) {
|
|
244
|
+
return new Promise((resolve, reject) => {
|
|
245
|
+
const t = setTimeout(() => reject(new Error(`timeout after ${ms}ms`)), ms);
|
|
246
|
+
p.then(
|
|
247
|
+
(v) => {
|
|
248
|
+
clearTimeout(t);
|
|
249
|
+
resolve(v);
|
|
250
|
+
},
|
|
251
|
+
(e) => {
|
|
252
|
+
clearTimeout(t);
|
|
253
|
+
reject(e);
|
|
254
|
+
}
|
|
255
|
+
);
|
|
256
|
+
});
|
|
257
|
+
}
|
|
258
|
+
function emptyOutput(args) {
|
|
259
|
+
return {
|
|
260
|
+
results: [],
|
|
261
|
+
method: "fts5",
|
|
262
|
+
cache_hits: 0,
|
|
263
|
+
search_hits: 0,
|
|
264
|
+
embedding_available: args.embeddingAvailable,
|
|
265
|
+
error: args.error,
|
|
266
|
+
total_time_ms: args.elapsed
|
|
267
|
+
};
|
|
268
|
+
}
|
|
269
|
+
export {
|
|
270
|
+
crawlRank
|
|
271
|
+
};
|
|
272
|
+
//# sourceMappingURL=crawl-rank.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../../src/search/find-similar/crawl-rank.ts"],"sourcesContent":["import type {\n FindSimilarInput,\n FindSimilarOutput,\n FindSimilarResult,\n} from '../../types.js';\nimport type { SmartRouter } from '../../fetch/router.js';\nimport { getExtractProvider } from '../../providers/extract-provider.js';\nimport { getEmbedProvider } from '../../providers/embed-provider.js';\nimport { createLogger } from '../../logger.js';\n\nconst log = createLogger('search');\n\nconst DEFAULT_MAX_PAGES = 20;\nconst DEFAULT_CONCURRENCY = 4;\nconst DEFAULT_FETCH_TIMEOUT_MS = 10000;\nconst DEFAULT_MAX_RESULTS = 10;\nconst SEED_TEXT_CHARS = 500;\n\nexport interface CrawlRankOptions {\n maxPages?: number;\n concurrency?: number;\n fetchTimeoutMs?: number;\n}\n\ninterface FetchedPage {\n url: string;\n title: string;\n markdown: string;\n text: string;\n}\n\nexport async function crawlRank(\n seedUrl: string,\n input: FindSimilarInput,\n router: SmartRouter,\n options: CrawlRankOptions = {},\n): Promise<FindSimilarOutput> {\n const start = Date.now();\n const maxPages = options.maxPages ?? DEFAULT_MAX_PAGES;\n const concurrency = options.concurrency ?? DEFAULT_CONCURRENCY;\n const fetchTimeoutMs = options.fetchTimeoutMs ?? DEFAULT_FETCH_TIMEOUT_MS;\n const maxResults = input.max_results ?? DEFAULT_MAX_RESULTS;\n\n let seedHost: string;\n try {\n seedHost = new URL(seedUrl).hostname;\n } catch {\n return emptyOutput({\n error: 'Invalid seed URL',\n embeddingAvailable: false,\n elapsed: Date.now() - start,\n });\n }\n\n // 1. Fetch seed\n let seedRaw;\n try {\n seedRaw = await router.fetch(seedUrl, { renderJs: 'auto' });\n } catch (err) {\n return emptyOutput({\n error: `Seed fetch failed: ${err instanceof Error ? err.message : String(err)}`,\n embeddingAvailable: false,\n elapsed: Date.now() - start,\n });\n }\n\n if (!seedRaw || typeof seedRaw.statusCode !== 'number' || seedRaw.statusCode < 200 || seedRaw.statusCode >= 300) {\n return emptyOutput({\n error: `Seed fetch failed: ${seedRaw?.statusCode ?? 'unknown'}`,\n embeddingAvailable: false,\n elapsed: Date.now() - start,\n });\n }\n\n // 2. Extract seed\n const extractor = await getExtractProvider();\n const seedExtraction = await extractor.extract(seedRaw.html, seedRaw.finalUrl, {\n contentType: seedRaw.contentType,\n });\n\n // 3. Filter links: same-host (unless explicitly widened), domain filters, dedup, cap\n const includeDomains = input.include_domains;\n const excludeDomains = input.exclude_domains;\n const allowedLinks = filterLinks(\n seedExtraction.links ?? [],\n seedHost,\n includeDomains,\n excludeDomains,\n maxPages,\n );\n\n // 6. Probe embedding (before failing on empty links so error messaging reflects\n // capability). If no links AND no embedding, the empty-links error is still\n // the more useful signal.\n let embedProvider;\n let embeddingAvailable = false;\n try {\n embedProvider = await getEmbedProvider();\n embeddingAvailable = true;\n } catch (err) {\n log.debug('embedding provider unavailable for crawl-rank', { error: String(err) });\n embeddingAvailable = false;\n }\n\n if (allowedLinks.length === 0) {\n return emptyOutput({\n error: 'No same-host links found from seed',\n embeddingAvailable,\n elapsed: Date.now() - start,\n });\n }\n\n // Degraded mode: no embeddings, return link order\n if (!embeddingAvailable || !embedProvider) {\n const degraded = degradedResults(allowedLinks, maxResults);\n return {\n results: degraded,\n method: 'fts5',\n cache_hits: 0,\n search_hits: degraded.length,\n embedding_available: false,\n error: 'Embedding unavailable — returned link order',\n total_time_ms: Date.now() - start,\n };\n }\n\n // 7. Fetch + extract each link with concurrency cap\n const fetched = await fetchPagesInChunks(\n allowedLinks,\n router,\n extractor,\n concurrency,\n fetchTimeoutMs,\n );\n\n if (fetched.length === 0) {\n return emptyOutput({\n error: 'No linked pages could be fetched',\n embeddingAvailable: true,\n elapsed: Date.now() - start,\n });\n }\n\n // 8. Build text per page\n const seedText = buildPageText(seedExtraction.title, seedExtraction.markdown);\n const pageTexts = fetched.map(p => p.text);\n\n // 9. Embed seed + pages in one batch\n let vectors: Float32Array[];\n try {\n vectors = await embedProvider.embed([seedText, ...pageTexts]);\n } catch (err) {\n log.warn('embedding batch failed; falling back to link order', { error: String(err) });\n const degraded = degradedResults(allowedLinks, maxResults);\n return {\n results: degraded,\n method: 'fts5',\n cache_hits: 0,\n search_hits: degraded.length,\n embedding_available: true,\n error: `Embedding batch failed: ${err instanceof Error ? err.message : String(err)}`,\n total_time_ms: Date.now() - start,\n };\n }\n\n const seedVec = vectors[0];\n const pageVecs = vectors.slice(1);\n\n // 10. Cosine + sort\n const scored = fetched.map((page, i) => ({\n page,\n score: cosineSimilarity(seedVec, pageVecs[i]),\n }));\n scored.sort((a, b) => b.score - a.score);\n\n // 11. Cap + map\n const final: FindSimilarResult[] = scored.slice(0, maxResults).map(({ page, score }) => ({\n url: page.url,\n title: page.title,\n markdown: page.markdown.slice(0, 5000),\n relevance_score: score,\n source: 'search',\n match_signals: {\n fused_score: score,\n },\n }));\n\n return {\n results: final,\n method: 'embedding',\n cache_hits: 0,\n search_hits: final.length,\n embedding_available: true,\n total_time_ms: Date.now() - start,\n };\n}\n\nfunction filterLinks(\n links: string[],\n seedHost: string,\n includeDomains: string[] | undefined,\n excludeDomains: string[] | undefined,\n maxPages: number,\n): string[] {\n const allowOtherHosts = (includeDomains?.length ?? 0) > 0;\n const seen = new Set<string>();\n const out: string[] = [];\n\n for (const raw of links) {\n let parsed: URL;\n try {\n parsed = new URL(raw);\n } catch {\n continue;\n }\n\n const host = parsed.hostname;\n\n if (!allowOtherHosts && host !== seedHost) continue;\n if (allowOtherHosts && host !== seedHost) {\n const widened = includeDomains!.some(d => domainMatches(host, d));\n if (!widened) continue;\n }\n if (excludeDomains && excludeDomains.some(d => domainMatches(host, d))) continue;\n\n const normalized = normalize(parsed);\n if (seen.has(normalized)) continue;\n seen.add(normalized);\n out.push(parsed.toString());\n if (out.length >= maxPages) break;\n }\n\n return out;\n}\n\nfunction domainMatches(host: string, pattern: string): boolean {\n const p = pattern.toLowerCase().replace(/^\\*\\./, '');\n const h = host.toLowerCase();\n return h === p || h.endsWith(`.${p}`);\n}\n\nfunction normalize(parsed: URL): string {\n const copy = new URL(parsed.toString());\n copy.hash = '';\n return copy.toString().replace(/\\/$/, '');\n}\n\nasync function fetchPagesInChunks(\n urls: string[],\n router: SmartRouter,\n extractor: Awaited<ReturnType<typeof getExtractProvider>>,\n concurrency: number,\n fetchTimeoutMs: number,\n): Promise<FetchedPage[]> {\n const out: FetchedPage[] = [];\n for (let i = 0; i < urls.length; i += concurrency) {\n const chunk = urls.slice(i, i + concurrency);\n const settled = await Promise.allSettled(\n chunk.map(async u => {\n const raw = await withTimeout(\n router.fetch(u, { renderJs: 'auto' }),\n fetchTimeoutMs,\n );\n if (\n !raw ||\n typeof raw.statusCode !== 'number' ||\n raw.statusCode < 200 ||\n raw.statusCode >= 300\n ) {\n throw new Error(`bad status: ${raw?.statusCode ?? 'unknown'}`);\n }\n const ex = await extractor.extract(raw.html, raw.finalUrl, {\n contentType: raw.contentType,\n });\n return {\n url: raw.finalUrl,\n title: ex.title || raw.finalUrl,\n markdown: ex.markdown ?? '',\n text: buildPageText(ex.title, ex.markdown ?? ''),\n } satisfies FetchedPage;\n }),\n );\n for (const r of settled) {\n if (r.status === 'fulfilled') out.push(r.value);\n else log.debug('crawl-rank page fetch failed', { error: String(r.reason) });\n }\n }\n return out;\n}\n\nfunction buildPageText(title: string, markdown: string): string {\n const t = (title ?? '').trim();\n const body = (markdown ?? '').slice(0, SEED_TEXT_CHARS);\n return t ? `${t}\\n${body}` : body;\n}\n\nfunction cosineSimilarity(a: Float32Array, b: Float32Array): number {\n if (!a || !b || a.length === 0 || b.length === 0) return 0;\n const len = Math.min(a.length, b.length);\n let dot = 0;\n let normA = 0;\n let normB = 0;\n for (let i = 0; i < len; i++) {\n dot += a[i] * b[i];\n normA += a[i] * a[i];\n normB += b[i] * b[i];\n }\n if (normA === 0 || normB === 0) return 0;\n return dot / (Math.sqrt(normA) * Math.sqrt(normB));\n}\n\nfunction degradedResults(links: string[], maxResults: number): FindSimilarResult[] {\n const limited = links.slice(0, maxResults);\n const n = limited.length;\n return limited.map((url, i) => ({\n url,\n title: url,\n markdown: '',\n relevance_score: n > 0 ? 1 - i / n : 0,\n source: 'search',\n match_signals: {\n fused_score: n > 0 ? 1 - i / n : 0,\n },\n }));\n}\n\nfunction withTimeout<T>(p: Promise<T>, ms: number): Promise<T> {\n return new Promise<T>((resolve, reject) => {\n const t = setTimeout(() => reject(new Error(`timeout after ${ms}ms`)), ms);\n p.then(\n v => {\n clearTimeout(t);\n resolve(v);\n },\n e => {\n clearTimeout(t);\n reject(e);\n },\n );\n });\n}\n\nfunction emptyOutput(args: {\n error: string;\n embeddingAvailable: boolean;\n elapsed: number;\n}): FindSimilarOutput {\n return {\n results: [],\n method: 'fts5',\n cache_hits: 0,\n search_hits: 0,\n embedding_available: args.embeddingAvailable,\n error: args.error,\n total_time_ms: args.elapsed,\n };\n}\n"],"mappings":"AAMA,SAAS,0BAA0B;AACnC,SAAS,wBAAwB;AACjC,SAAS,oBAAoB;AAE7B,MAAM,MAAM,aAAa,QAAQ;AAEjC,MAAM,oBAAoB;AAC1B,MAAM,sBAAsB;AAC5B,MAAM,2BAA2B;AACjC,MAAM,sBAAsB;AAC5B,MAAM,kBAAkB;AAexB,eAAsB,UACpB,SACA,OACA,QACA,UAA4B,CAAC,GACD;AAC5B,QAAM,QAAQ,KAAK,IAAI;AACvB,QAAM,WAAW,QAAQ,YAAY;AACrC,QAAM,cAAc,QAAQ,eAAe;AAC3C,QAAM,iBAAiB,QAAQ,kBAAkB;AACjD,QAAM,aAAa,MAAM,eAAe;AAExC,MAAI;AACJ,MAAI;AACF,eAAW,IAAI,IAAI,OAAO,EAAE;AAAA,EAC9B,QAAQ;AACN,WAAO,YAAY;AAAA,MACjB,OAAO;AAAA,MACP,oBAAoB;AAAA,MACpB,SAAS,KAAK,IAAI,IAAI;AAAA,IACxB,CAAC;AAAA,EACH;AAGA,MAAI;AACJ,MAAI;AACF,cAAU,MAAM,OAAO,MAAM,SAAS,EAAE,UAAU,OAAO,CAAC;AAAA,EAC5D,SAAS,KAAK;AACZ,WAAO,YAAY;AAAA,MACjB,OAAO,sBAAsB,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG,CAAC;AAAA,MAC7E,oBAAoB;AAAA,MACpB,SAAS,KAAK,IAAI,IAAI;AAAA,IACxB,CAAC;AAAA,EACH;AAEA,MAAI,CAAC,WAAW,OAAO,QAAQ,eAAe,YAAY,QAAQ,aAAa,OAAO,QAAQ,cAAc,KAAK;AAC/G,WAAO,YAAY;AAAA,MACjB,OAAO,sBAAsB,SAAS,cAAc,SAAS;AAAA,MAC7D,oBAAoB;AAAA,MACpB,SAAS,KAAK,IAAI,IAAI;AAAA,IACxB,CAAC;AAAA,EACH;AAGA,QAAM,YAAY,MAAM,mBAAmB;AAC3C,QAAM,iBAAiB,MAAM,UAAU,QAAQ,QAAQ,MAAM,QAAQ,UAAU;AAAA,IAC7E,aAAa,QAAQ;AAAA,EACvB,CAAC;AAGD,QAAM,iBAAiB,MAAM;AAC7B,QAAM,iBAAiB,MAAM;AAC7B,QAAM,eAAe;AAAA,IACnB,eAAe,SAAS,CAAC;AAAA,IACzB;AAAA,IACA;AAAA,IACA;AAAA,IACA;AAAA,EACF;AAKA,MAAI;AACJ,MAAI,qBAAqB;AACzB,MAAI;AACF,oBAAgB,MAAM,iBAAiB;AACvC,yBAAqB;AAAA,EACvB,SAAS,KAAK;AACZ,QAAI,MAAM,iDAAiD,EAAE,OAAO,OAAO,GAAG,EAAE,CAAC;AACjF,yBAAqB;AAAA,EACvB;AAEA,MAAI,aAAa,WAAW,GAAG;AAC7B,WAAO,YAAY;AAAA,MACjB,OAAO;AAAA,MACP;AAAA,MACA,SAAS,KAAK,IAAI,IAAI;AAAA,IACxB,CAAC;AAAA,EACH;AAGA,MAAI,CAAC,sBAAsB,CAAC,eAAe;AACzC,UAAM,WAAW,gBAAgB,cAAc,UAAU;AACzD,WAAO;AAAA,MACL,SAAS;AAAA,MACT,QAAQ;AAAA,MACR,YAAY;AAAA,MACZ,aAAa,SAAS;AAAA,MACtB,qBAAqB;AAAA,MACrB,OAAO;AAAA,MACP,eAAe,KAAK,IAAI,IAAI;AAAA,IAC9B;AAAA,EACF;AAGA,QAAM,UAAU,MAAM;AAAA,IACpB;AAAA,IACA;AAAA,IACA;AAAA,IACA;AAAA,IACA;AAAA,EACF;AAEA,MAAI,QAAQ,WAAW,GAAG;AACxB,WAAO,YAAY;AAAA,MACjB,OAAO;AAAA,MACP,oBAAoB;AAAA,MACpB,SAAS,KAAK,IAAI,IAAI;AAAA,IACxB,CAAC;AAAA,EACH;AAGA,QAAM,WAAW,cAAc,eAAe,OAAO,eAAe,QAAQ;AAC5E,QAAM,YAAY,QAAQ,IAAI,OAAK,EAAE,IAAI;AAGzC,MAAI;AACJ,MAAI;AACF,cAAU,MAAM,cAAc,MAAM,CAAC,UAAU,GAAG,SAAS,CAAC;AAAA,EAC9D,SAAS,KAAK;AACZ,QAAI,KAAK,sDAAsD,EAAE,OAAO,OAAO,GAAG,EAAE,CAAC;AACrF,UAAM,WAAW,gBAAgB,cAAc,UAAU;AACzD,WAAO;AAAA,MACL,SAAS;AAAA,MACT,QAAQ;AAAA,MACR,YAAY;AAAA,MACZ,aAAa,SAAS;AAAA,MACtB,qBAAqB;AAAA,MACrB,OAAO,2BAA2B,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG,CAAC;AAAA,MAClF,eAAe,KAAK,IAAI,IAAI;AAAA,IAC9B;AAAA,EACF;AAEA,QAAM,UAAU,QAAQ,CAAC;AACzB,QAAM,WAAW,QAAQ,MAAM,CAAC;AAGhC,QAAM,SAAS,QAAQ,IAAI,CAAC,MAAM,OAAO;AAAA,IACvC;AAAA,IACA,OAAO,iBAAiB,SAAS,SAAS,CAAC,CAAC;AAAA,EAC9C,EAAE;AACF,SAAO,KAAK,CAAC,GAAG,MAAM,EAAE,QAAQ,EAAE,KAAK;AAGvC,QAAM,QAA6B,OAAO,MAAM,GAAG,UAAU,EAAE,IAAI,CAAC,EAAE,MAAM,MAAM,OAAO;AAAA,IACvF,KAAK,KAAK;AAAA,IACV,OAAO,KAAK;AAAA,IACZ,UAAU,KAAK,SAAS,MAAM,GAAG,GAAI;AAAA,IACrC,iBAAiB;AAAA,IACjB,QAAQ;AAAA,IACR,eAAe;AAAA,MACb,aAAa;AAAA,IACf;AAAA,EACF,EAAE;AAEF,SAAO;AAAA,IACL,SAAS;AAAA,IACT,QAAQ;AAAA,IACR,YAAY;AAAA,IACZ,aAAa,MAAM;AAAA,IACnB,qBAAqB;AAAA,IACrB,eAAe,KAAK,IAAI,IAAI;AAAA,EAC9B;AACF;AAEA,SAAS,YACP,OACA,UACA,gBACA,gBACA,UACU;AACV,QAAM,mBAAmB,gBAAgB,UAAU,KAAK;AACxD,QAAM,OAAO,oBAAI,IAAY;AAC7B,QAAM,MAAgB,CAAC;AAEvB,aAAW,OAAO,OAAO;AACvB,QAAI;AACJ,QAAI;AACF,eAAS,IAAI,IAAI,GAAG;AAAA,IACtB,QAAQ;AACN;AAAA,IACF;AAEA,UAAM,OAAO,OAAO;AAEpB,QAAI,CAAC,mBAAmB,SAAS,SAAU;AAC3C,QAAI,mBAAmB,SAAS,UAAU;AACxC,YAAM,UAAU,eAAgB,KAAK,OAAK,cAAc,MAAM,CAAC,CAAC;AAChE,UAAI,CAAC,QAAS;AAAA,IAChB;AACA,QAAI,kBAAkB,eAAe,KAAK,OAAK,cAAc,MAAM,CAAC,CAAC,EAAG;AAExE,UAAM,aAAa,UAAU,MAAM;AACnC,QAAI,KAAK,IAAI,UAAU,EAAG;AAC1B,SAAK,IAAI,UAAU;AACnB,QAAI,KAAK,OAAO,SAAS,CAAC;AAC1B,QAAI,IAAI,UAAU,SAAU;AAAA,EAC9B;AAEA,SAAO;AACT;AAEA,SAAS,cAAc,MAAc,SAA0B;AAC7D,QAAM,IAAI,QAAQ,YAAY,EAAE,QAAQ,SAAS,EAAE;AACnD,QAAM,IAAI,KAAK,YAAY;AAC3B,SAAO,MAAM,KAAK,EAAE,SAAS,IAAI,CAAC,EAAE;AACtC;AAEA,SAAS,UAAU,QAAqB;AACtC,QAAM,OAAO,IAAI,IAAI,OAAO,SAAS,CAAC;AACtC,OAAK,OAAO;AACZ,SAAO,KAAK,SAAS,EAAE,QAAQ,OAAO,EAAE;AAC1C;AAEA,eAAe,mBACb,MACA,QACA,WACA,aACA,gBACwB;AACxB,QAAM,MAAqB,CAAC;AAC5B,WAAS,IAAI,GAAG,IAAI,KAAK,QAAQ,KAAK,aAAa;AACjD,UAAM,QAAQ,KAAK,MAAM,GAAG,IAAI,WAAW;AAC3C,UAAM,UAAU,MAAM,QAAQ;AAAA,MAC5B,MAAM,IAAI,OAAM,MAAK;AACnB,cAAM,MAAM,MAAM;AAAA,UAChB,OAAO,MAAM,GAAG,EAAE,UAAU,OAAO,CAAC;AAAA,UACpC;AAAA,QACF;AACA,YACE,CAAC,OACD,OAAO,IAAI,eAAe,YAC1B,IAAI,aAAa,OACjB,IAAI,cAAc,KAClB;AACA,gBAAM,IAAI,MAAM,eAAe,KAAK,cAAc,SAAS,EAAE;AAAA,QAC/D;AACA,cAAM,KAAK,MAAM,UAAU,QAAQ,IAAI,MAAM,IAAI,UAAU;AAAA,UACzD,aAAa,IAAI;AAAA,QACnB,CAAC;AACD,eAAO;AAAA,UACL,KAAK,IAAI;AAAA,UACT,OAAO,GAAG,SAAS,IAAI;AAAA,UACvB,UAAU,GAAG,YAAY;AAAA,UACzB,MAAM,cAAc,GAAG,OAAO,GAAG,YAAY,EAAE;AAAA,QACjD;AAAA,MACF,CAAC;AAAA,IACH;AACA,eAAW,KAAK,SAAS;AACvB,UAAI,EAAE,WAAW,YAAa,KAAI,KAAK,EAAE,KAAK;AAAA,UACzC,KAAI,MAAM,gCAAgC,EAAE,OAAO,OAAO,EAAE,MAAM,EAAE,CAAC;AAAA,IAC5E;AAAA,EACF;AACA,SAAO;AACT;AAEA,SAAS,cAAc,OAAe,UAA0B;AAC9D,QAAM,KAAK,SAAS,IAAI,KAAK;AAC7B,QAAM,QAAQ,YAAY,IAAI,MAAM,GAAG,eAAe;AACtD,SAAO,IAAI,GAAG,CAAC;AAAA,EAAK,IAAI,KAAK;AAC/B;AAEA,SAAS,iBAAiB,GAAiB,GAAyB;AAClE,MAAI,CAAC,KAAK,CAAC,KAAK,EAAE,WAAW,KAAK,EAAE,WAAW,EAAG,QAAO;AACzD,QAAM,MAAM,KAAK,IAAI,EAAE,QAAQ,EAAE,MAAM;AACvC,MAAI,MAAM;AACV,MAAI,QAAQ;AACZ,MAAI,QAAQ;AACZ,WAAS,IAAI,GAAG,IAAI,KAAK,KAAK;AAC5B,WAAO,EAAE,CAAC,IAAI,EAAE,CAAC;AACjB,aAAS,EAAE,CAAC,IAAI,EAAE,CAAC;AACnB,aAAS,EAAE,CAAC,IAAI,EAAE,CAAC;AAAA,EACrB;AACA,MAAI,UAAU,KAAK,UAAU,EAAG,QAAO;AACvC,SAAO,OAAO,KAAK,KAAK,KAAK,IAAI,KAAK,KAAK,KAAK;AAClD;AAEA,SAAS,gBAAgB,OAAiB,YAAyC;AACjF,QAAM,UAAU,MAAM,MAAM,GAAG,UAAU;AACzC,QAAM,IAAI,QAAQ;AAClB,SAAO,QAAQ,IAAI,CAAC,KAAK,OAAO;AAAA,IAC9B;AAAA,IACA,OAAO;AAAA,IACP,UAAU;AAAA,IACV,iBAAiB,IAAI,IAAI,IAAI,IAAI,IAAI;AAAA,IACrC,QAAQ;AAAA,IACR,eAAe;AAAA,MACb,aAAa,IAAI,IAAI,IAAI,IAAI,IAAI;AAAA,IACnC;AAAA,EACF,EAAE;AACJ;AAEA,SAAS,YAAe,GAAe,IAAwB;AAC7D,SAAO,IAAI,QAAW,CAAC,SAAS,WAAW;AACzC,UAAM,IAAI,WAAW,MAAM,OAAO,IAAI,MAAM,iBAAiB,EAAE,IAAI,CAAC,GAAG,EAAE;AACzE,MAAE;AAAA,MACA,OAAK;AACH,qBAAa,CAAC;AACd,gBAAQ,CAAC;AAAA,MACX;AAAA,MACA,OAAK;AACH,qBAAa,CAAC;AACd,eAAO,CAAC;AAAA,MACV;AAAA,IACF;AAAA,EACF,CAAC;AACH;AAEA,SAAS,YAAY,MAIC;AACpB,SAAO;AAAA,IACL,SAAS,CAAC;AAAA,IACV,QAAQ;AAAA,IACR,YAAY;AAAA,IACZ,aAAa;AAAA,IACb,qBAAqB,KAAK;AAAA,IAC1B,OAAO,KAAK;AAAA,IACZ,eAAe,KAAK;AAAA,EACtB;AACF;","names":[]}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"mode.d.ts","sourceRoot":"","sources":["../../../src/search/find-similar/mode.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,gBAAgB,EAAE,MAAM,gBAAgB,CAAC;AAEvD,MAAM,MAAM,eAAe,GAAG,MAAM,GAAG,OAAO,GAAG,eAAe,GAAG,YAAY,CAAC;AAMhF,wBAAgB,UAAU,CAAC,KAAK,EAAE,gBAAgB,GAAG,eAAe,CAOnE"}
|
|
@@ -0,0 +1,12 @@
|
|
|
1
|
+
function selectMode(input) {
|
|
2
|
+
if (input.mode === "crawl-rank") {
|
|
3
|
+
if (input.url && input.url.trim().length > 0) return "crawl-rank";
|
|
4
|
+
return "cache";
|
|
5
|
+
}
|
|
6
|
+
if (input.mode === "cache" || input.mode === "web-expansion") return input.mode;
|
|
7
|
+
return "cache";
|
|
8
|
+
}
|
|
9
|
+
export {
|
|
10
|
+
selectMode
|
|
11
|
+
};
|
|
12
|
+
//# sourceMappingURL=mode.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../../src/search/find-similar/mode.ts"],"sourcesContent":["import type { FindSimilarInput } from '../../types.js';\n\nexport type FindSimilarMode = 'auto' | 'cache' | 'web-expansion' | 'crawl-rank';\n\n// Dispatcher only branches on 'crawl-rank' today. 'cache' / 'web-expansion' /\n// 'auto' all fall through to the legacy hybrid flow in find-similar.ts so\n// existing callers keep their behavior. Crawl-rank requires an explicit\n// opt-in and a seed URL — concept-only inputs have nothing to crawl from.\nexport function selectMode(input: FindSimilarInput): FindSimilarMode {\n if (input.mode === 'crawl-rank') {\n if (input.url && input.url.trim().length > 0) return 'crawl-rank';\n return 'cache';\n }\n if (input.mode === 'cache' || input.mode === 'web-expansion') return input.mode;\n return 'cache';\n}\n"],"mappings":"AAQO,SAAS,WAAW,OAA0C;AACnE,MAAI,MAAM,SAAS,cAAc;AAC/B,QAAI,MAAM,OAAO,MAAM,IAAI,KAAK,EAAE,SAAS,EAAG,QAAO;AACrD,WAAO;AAAA,EACT;AACA,MAAI,MAAM,SAAS,WAAW,MAAM,SAAS,gBAAiB,QAAO,MAAM;AAC3E,SAAO;AACT;","names":[]}
|
|
@@ -0,0 +1,5 @@
|
|
|
1
|
+
import type { FindSimilarInput, FindSimilarOutput, SearchEngine } from '../types.js';
|
|
2
|
+
import type { SmartRouter } from '../fetch/router.js';
|
|
3
|
+
import type { BackendStatus } from '../server/backend-status.js';
|
|
4
|
+
export declare function findSimilar(input: FindSimilarInput, engines: SearchEngine[], router: SmartRouter, backendStatus?: BackendStatus): Promise<FindSimilarOutput>;
|
|
5
|
+
//# sourceMappingURL=find-similar.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"find-similar.d.ts","sourceRoot":"","sources":["../../src/search/find-similar.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EACV,gBAAgB,EAChB,iBAAiB,EAEjB,YAAY,EAEb,MAAM,aAAa,CAAC;AACrB,OAAO,KAAK,EAAE,WAAW,EAAE,MAAM,oBAAoB,CAAC;AACtD,OAAO,KAAK,EAAE,aAAa,EAAE,MAAM,6BAA6B,CAAC;AA2BjE,wBAAsB,WAAW,CAC/B,KAAK,EAAE,gBAAgB,EACvB,OAAO,EAAE,YAAY,EAAE,EACvB,MAAM,EAAE,WAAW,EACnB,aAAa,CAAC,EAAE,aAAa,GAC5B,OAAO,CAAC,iBAAiB,CAAC,CA0M5B"}
|