@staticn0va/wigolo 0.1.0 → 0.1.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +1 -1
- package/README.md +146 -227
- package/SKILL.md +382 -0
- package/assets/blocks/claude-code/CLAUDE.md.block +20 -0
- package/assets/blocks/claude-code/wigolo-command.md +40 -0
- package/assets/blocks/cursor/wigolo.mdc +46 -0
- package/assets/blocks/gemini-cli/GEMINI.md.block +18 -0
- package/assets/blocks/vscode/copilot-instructions.md.block +18 -0
- package/assets/skills/wigolo/SKILL.md +50 -0
- package/assets/skills/wigolo/rules/cache-first.md +30 -0
- package/assets/skills/wigolo/rules/synthesis.md +43 -0
- package/assets/skills/wigolo-agent/SKILL.md +73 -0
- package/assets/skills/wigolo-crawl/SKILL.md +60 -0
- package/assets/skills/wigolo-extract/SKILL.md +59 -0
- package/assets/skills/wigolo-fetch/SKILL.md +65 -0
- package/assets/skills/wigolo-find-similar/SKILL.md +72 -0
- package/assets/skills/wigolo-research/SKILL.md +77 -0
- package/assets/skills/wigolo-search/SKILL.md +78 -0
- package/dist/agent/executor.d.ts +33 -0
- package/dist/agent/executor.d.ts.map +1 -0
- package/dist/agent/executor.js +233 -0
- package/dist/agent/executor.js.map +1 -0
- package/dist/agent/pipeline.d.ts +5 -0
- package/dist/agent/pipeline.d.ts.map +1 -0
- package/dist/agent/pipeline.js +238 -0
- package/dist/agent/pipeline.js.map +1 -0
- package/dist/agent/planner.d.ts +13 -0
- package/dist/agent/planner.d.ts.map +1 -0
- package/dist/agent/planner.js +271 -0
- package/dist/agent/planner.js.map +1 -0
- package/dist/agent/relevance.d.ts +15 -0
- package/dist/agent/relevance.d.ts.map +1 -0
- package/dist/agent/relevance.js +60 -0
- package/dist/agent/relevance.js.map +1 -0
- package/dist/cache/backfill-embeddings.d.ts +23 -0
- package/dist/cache/backfill-embeddings.d.ts.map +1 -0
- package/dist/cache/backfill-embeddings.js +105 -0
- package/dist/cache/backfill-embeddings.js.map +1 -0
- package/dist/cache/change-detector.d.ts +7 -0
- package/dist/cache/change-detector.d.ts.map +1 -0
- package/dist/cache/change-detector.js +43 -0
- package/dist/cache/change-detector.js.map +1 -0
- package/dist/cache/db.d.ts +1 -0
- package/dist/cache/db.d.ts.map +1 -1
- package/dist/cache/db.js +94 -22
- package/dist/cache/db.js.map +1 -1
- package/dist/cache/diff-summary.d.ts +2 -0
- package/dist/cache/diff-summary.d.ts.map +1 -0
- package/dist/cache/diff-summary.js +82 -0
- package/dist/cache/diff-summary.js.map +1 -0
- package/dist/cache/migrations/runner.d.ts +29 -0
- package/dist/cache/migrations/runner.d.ts.map +1 -0
- package/dist/cache/migrations/runner.js +147 -0
- package/dist/cache/migrations/runner.js.map +1 -0
- package/dist/cache/sqlite-vec-store.d.ts +42 -0
- package/dist/cache/sqlite-vec-store.d.ts.map +1 -0
- package/dist/cache/sqlite-vec-store.js +176 -0
- package/dist/cache/sqlite-vec-store.js.map +1 -0
- package/dist/cache/store.d.ts +47 -1
- package/dist/cache/store.d.ts.map +1 -1
- package/dist/cache/store.js +364 -168
- package/dist/cache/store.js.map +1 -1
- package/dist/cli/agents/antigravity.d.ts +20 -0
- package/dist/cli/agents/antigravity.d.ts.map +1 -0
- package/dist/cli/agents/antigravity.js +49 -0
- package/dist/cli/agents/antigravity.js.map +1 -0
- package/dist/cli/agents/claude-code.d.ts +25 -0
- package/dist/cli/agents/claude-code.d.ts.map +1 -0
- package/dist/cli/agents/claude-code.js +111 -0
- package/dist/cli/agents/claude-code.js.map +1 -0
- package/dist/cli/agents/cursor.d.ts +21 -0
- package/dist/cli/agents/cursor.d.ts.map +1 -0
- package/dist/cli/agents/cursor.js +58 -0
- package/dist/cli/agents/cursor.js.map +1 -0
- package/dist/cli/agents/gemini-cli.d.ts +21 -0
- package/dist/cli/agents/gemini-cli.d.ts.map +1 -0
- package/dist/cli/agents/gemini-cli.js +55 -0
- package/dist/cli/agents/gemini-cli.js.map +1 -0
- package/dist/cli/agents/registry.d.ts +21 -0
- package/dist/cli/agents/registry.d.ts.map +1 -0
- package/dist/cli/agents/registry.js +27 -0
- package/dist/cli/agents/registry.js.map +1 -0
- package/dist/cli/agents/utils.d.ts +26 -0
- package/dist/cli/agents/utils.d.ts.map +1 -0
- package/dist/cli/agents/utils.js +136 -0
- package/dist/cli/agents/utils.js.map +1 -0
- package/dist/cli/agents/vscode.d.ts +21 -0
- package/dist/cli/agents/vscode.d.ts.map +1 -0
- package/dist/cli/agents/vscode.js +62 -0
- package/dist/cli/agents/vscode.js.map +1 -0
- package/dist/cli/auth.d.ts +2 -0
- package/dist/cli/auth.d.ts.map +1 -0
- package/dist/cli/auth.js +94 -0
- package/dist/cli/auth.js.map +1 -0
- package/dist/cli/backfill.d.ts +2 -0
- package/dist/cli/backfill.d.ts.map +1 -0
- package/dist/cli/backfill.js +58 -0
- package/dist/cli/backfill.js.map +1 -0
- package/dist/cli/daemon.d.ts +6 -1
- package/dist/cli/daemon.d.ts.map +1 -1
- package/dist/cli/daemon.js +61 -3
- package/dist/cli/daemon.js.map +1 -1
- package/dist/cli/doctor.d.ts +8 -0
- package/dist/cli/doctor.d.ts.map +1 -0
- package/dist/cli/doctor.js +344 -0
- package/dist/cli/doctor.js.map +1 -0
- package/dist/cli/health.d.ts +1 -1
- package/dist/cli/health.d.ts.map +1 -1
- package/dist/cli/health.js +42 -3
- package/dist/cli/health.js.map +1 -1
- package/dist/cli/help.d.ts +6 -0
- package/dist/cli/help.d.ts.map +1 -0
- package/dist/cli/help.js +63 -0
- package/dist/cli/help.js.map +1 -0
- package/dist/cli/index.d.ts +1 -1
- package/dist/cli/index.d.ts.map +1 -1
- package/dist/cli/index.js +35 -7
- package/dist/cli/index.js.map +1 -1
- package/dist/cli/init.d.ts +2 -0
- package/dist/cli/init.d.ts.map +1 -0
- package/dist/cli/init.js +201 -0
- package/dist/cli/init.js.map +1 -0
- package/dist/cli/plugin.d.ts +5 -0
- package/dist/cli/plugin.d.ts.map +1 -0
- package/dist/cli/plugin.js +185 -0
- package/dist/cli/plugin.js.map +1 -0
- package/dist/cli/setup-mcp.d.ts +2 -0
- package/dist/cli/setup-mcp.d.ts.map +1 -0
- package/dist/cli/setup-mcp.js +114 -0
- package/dist/cli/setup-mcp.js.map +1 -0
- package/dist/cli/shell.d.ts +2 -0
- package/dist/cli/shell.d.ts.map +1 -0
- package/dist/cli/shell.js +86 -0
- package/dist/cli/shell.js.map +1 -0
- package/dist/cli/shutdown.d.ts +2 -0
- package/dist/cli/shutdown.d.ts.map +1 -0
- package/dist/cli/shutdown.js +26 -0
- package/dist/cli/shutdown.js.map +1 -0
- package/dist/cli/status.d.ts +2 -0
- package/dist/cli/status.d.ts.map +1 -0
- package/dist/cli/status.js +31 -0
- package/dist/cli/status.js.map +1 -0
- package/dist/cli/telemetry.d.ts +10 -0
- package/dist/cli/telemetry.d.ts.map +1 -0
- package/dist/cli/telemetry.js +56 -0
- package/dist/cli/telemetry.js.map +1 -0
- package/dist/cli/tui/agents-types.d.ts +28 -0
- package/dist/cli/tui/agents-types.d.ts.map +1 -0
- package/dist/cli/tui/agents-types.js +1 -0
- package/dist/cli/tui/agents-types.js.map +1 -0
- package/dist/cli/tui/agents.d.ts +11 -0
- package/dist/cli/tui/agents.d.ts.map +1 -0
- package/dist/cli/tui/agents.js +93 -0
- package/dist/cli/tui/agents.js.map +1 -0
- package/dist/cli/tui/banner.d.ts +3 -0
- package/dist/cli/tui/banner.d.ts.map +1 -0
- package/dist/cli/tui/banner.js +30 -0
- package/dist/cli/tui/banner.js.map +1 -0
- package/dist/cli/tui/components/AgentSelect.d.ts +13 -0
- package/dist/cli/tui/components/AgentSelect.d.ts.map +1 -0
- package/dist/cli/tui/components/AgentSelect.js +116 -0
- package/dist/cli/tui/components/AgentSelect.js.map +1 -0
- package/dist/cli/tui/components/Banner.d.ts +6 -0
- package/dist/cli/tui/components/Banner.d.ts.map +1 -0
- package/dist/cli/tui/components/Banner.js +25 -0
- package/dist/cli/tui/components/Banner.js.map +1 -0
- package/dist/cli/tui/components/BrowserSelect.d.ts +7 -0
- package/dist/cli/tui/components/BrowserSelect.d.ts.map +1 -0
- package/dist/cli/tui/components/BrowserSelect.js +19 -0
- package/dist/cli/tui/components/BrowserSelect.js.map +1 -0
- package/dist/cli/tui/components/InstallProgress.d.ts +9 -0
- package/dist/cli/tui/components/InstallProgress.d.ts.map +1 -0
- package/dist/cli/tui/components/InstallProgress.js +67 -0
- package/dist/cli/tui/components/InstallProgress.js.map +1 -0
- package/dist/cli/tui/components/SkillInstall.d.ts +14 -0
- package/dist/cli/tui/components/SkillInstall.d.ts.map +1 -0
- package/dist/cli/tui/components/SkillInstall.js +94 -0
- package/dist/cli/tui/components/SkillInstall.js.map +1 -0
- package/dist/cli/tui/components/Summary.d.ts +22 -0
- package/dist/cli/tui/components/Summary.d.ts.map +1 -0
- package/dist/cli/tui/components/Summary.js +135 -0
- package/dist/cli/tui/components/Summary.js.map +1 -0
- package/dist/cli/tui/components/SystemCheck.d.ts +8 -0
- package/dist/cli/tui/components/SystemCheck.d.ts.map +1 -0
- package/dist/cli/tui/components/SystemCheck.js +71 -0
- package/dist/cli/tui/components/SystemCheck.js.map +1 -0
- package/dist/cli/tui/components/Verification.d.ts +8 -0
- package/dist/cli/tui/components/Verification.d.ts.map +1 -0
- package/dist/cli/tui/components/Verification.js +63 -0
- package/dist/cli/tui/components/Verification.js.map +1 -0
- package/dist/cli/tui/config-writer-cli.d.ts +12 -0
- package/dist/cli/tui/config-writer-cli.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-cli.js +39 -0
- package/dist/cli/tui/config-writer-cli.js.map +1 -0
- package/dist/cli/tui/config-writer-json.d.ts +16 -0
- package/dist/cli/tui/config-writer-json.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-json.js +86 -0
- package/dist/cli/tui/config-writer-json.js.map +1 -0
- package/dist/cli/tui/config-writer-toml.d.ts +16 -0
- package/dist/cli/tui/config-writer-toml.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-toml.js +83 -0
- package/dist/cli/tui/config-writer-toml.js.map +1 -0
- package/dist/cli/tui/config-writer.d.ts +25 -0
- package/dist/cli/tui/config-writer.d.ts.map +1 -0
- package/dist/cli/tui/config-writer.js +101 -0
- package/dist/cli/tui/config-writer.js.map +1 -0
- package/dist/cli/tui/detect-helpers.d.ts +6 -0
- package/dist/cli/tui/detect-helpers.d.ts.map +1 -0
- package/dist/cli/tui/detect-helpers.js +45 -0
- package/dist/cli/tui/detect-helpers.js.map +1 -0
- package/dist/cli/tui/extras-prompt.d.ts +7 -0
- package/dist/cli/tui/extras-prompt.d.ts.map +1 -0
- package/dist/cli/tui/extras-prompt.js +42 -0
- package/dist/cli/tui/extras-prompt.js.map +1 -0
- package/dist/cli/tui/flags-types.d.ts +19 -0
- package/dist/cli/tui/flags-types.d.ts.map +1 -0
- package/dist/cli/tui/flags-types.js +23 -0
- package/dist/cli/tui/flags-types.js.map +1 -0
- package/dist/cli/tui/flags.d.ts +5 -0
- package/dist/cli/tui/flags.d.ts.map +1 -0
- package/dist/cli/tui/flags.js +132 -0
- package/dist/cli/tui/flags.js.map +1 -0
- package/dist/cli/tui/format.d.ts +14 -0
- package/dist/cli/tui/format.d.ts.map +1 -0
- package/dist/cli/tui/format.js +37 -0
- package/dist/cli/tui/format.js.map +1 -0
- package/dist/cli/tui/hooks/useAgentDetect.d.ts +6 -0
- package/dist/cli/tui/hooks/useAgentDetect.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useAgentDetect.js +19 -0
- package/dist/cli/tui/hooks/useAgentDetect.js.map +1 -0
- package/dist/cli/tui/hooks/useInstall.d.ts +14 -0
- package/dist/cli/tui/hooks/useInstall.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useInstall.js +90 -0
- package/dist/cli/tui/hooks/useInstall.js.map +1 -0
- package/dist/cli/tui/hooks/useSystemCheck.d.ts +13 -0
- package/dist/cli/tui/hooks/useSystemCheck.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useSystemCheck.js +95 -0
- package/dist/cli/tui/hooks/useSystemCheck.js.map +1 -0
- package/dist/cli/tui/hooks/useVerify.d.ts +14 -0
- package/dist/cli/tui/hooks/useVerify.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useVerify.js +71 -0
- package/dist/cli/tui/hooks/useVerify.js.map +1 -0
- package/dist/cli/tui/ink-init.d.ts +2 -0
- package/dist/cli/tui/ink-init.d.ts.map +1 -0
- package/dist/cli/tui/ink-init.js +198 -0
- package/dist/cli/tui/ink-init.js.map +1 -0
- package/dist/cli/tui/reporter-auto.d.ts +7 -0
- package/dist/cli/tui/reporter-auto.d.ts.map +1 -0
- package/dist/cli/tui/reporter-auto.js +15 -0
- package/dist/cli/tui/reporter-auto.js.map +1 -0
- package/dist/cli/tui/reporter.d.ts +26 -0
- package/dist/cli/tui/reporter.d.ts.map +1 -0
- package/dist/cli/tui/reporter.js +32 -0
- package/dist/cli/tui/reporter.js.map +1 -0
- package/dist/cli/tui/run-command.d.ts +14 -0
- package/dist/cli/tui/run-command.d.ts.map +1 -0
- package/dist/cli/tui/run-command.js +72 -0
- package/dist/cli/tui/run-command.js.map +1 -0
- package/dist/cli/tui/select-agents.d.ts +6 -0
- package/dist/cli/tui/select-agents.d.ts.map +1 -0
- package/dist/cli/tui/select-agents.js +32 -0
- package/dist/cli/tui/select-agents.js.map +1 -0
- package/dist/cli/tui/status-agents.d.ts +11 -0
- package/dist/cli/tui/status-agents.d.ts.map +1 -0
- package/dist/cli/tui/status-agents.js +53 -0
- package/dist/cli/tui/status-agents.js.map +1 -0
- package/dist/cli/tui/status-cache.d.ts +6 -0
- package/dist/cli/tui/status-cache.d.ts.map +1 -0
- package/dist/cli/tui/status-cache.js +39 -0
- package/dist/cli/tui/status-cache.js.map +1 -0
- package/dist/cli/tui/status-format.d.ts +14 -0
- package/dist/cli/tui/status-format.d.ts.map +1 -0
- package/dist/cli/tui/status-format.js +41 -0
- package/dist/cli/tui/status-format.js.map +1 -0
- package/dist/cli/tui/status-python.d.ts +6 -0
- package/dist/cli/tui/status-python.d.ts.map +1 -0
- package/dist/cli/tui/status-python.js +30 -0
- package/dist/cli/tui/status-python.js.map +1 -0
- package/dist/cli/tui/system-check.d.ts +24 -0
- package/dist/cli/tui/system-check.d.ts.map +1 -0
- package/dist/cli/tui/system-check.js +103 -0
- package/dist/cli/tui/system-check.js.map +1 -0
- package/dist/cli/tui/tui-reporter.d.ts +19 -0
- package/dist/cli/tui/tui-reporter.d.ts.map +1 -0
- package/dist/cli/tui/tui-reporter.js +95 -0
- package/dist/cli/tui/tui-reporter.js.map +1 -0
- package/dist/cli/tui/utils/config-writer.d.ts +3 -0
- package/dist/cli/tui/utils/config-writer.d.ts.map +1 -0
- package/dist/cli/tui/utils/config-writer.js +22 -0
- package/dist/cli/tui/utils/config-writer.js.map +1 -0
- package/dist/cli/tui/utils/suppress-logs.d.ts +3 -0
- package/dist/cli/tui/utils/suppress-logs.d.ts.map +1 -0
- package/dist/cli/tui/utils/suppress-logs.js +11 -0
- package/dist/cli/tui/utils/suppress-logs.js.map +1 -0
- package/dist/cli/tui/verify-suggestions.d.ts +5 -0
- package/dist/cli/tui/verify-suggestions.d.ts.map +1 -0
- package/dist/cli/tui/verify-suggestions.js +20 -0
- package/dist/cli/tui/verify-suggestions.js.map +1 -0
- package/dist/cli/tui/verify.d.ts +14 -0
- package/dist/cli/tui/verify.d.ts.map +1 -0
- package/dist/cli/tui/verify.js +101 -0
- package/dist/cli/tui/verify.js.map +1 -0
- package/dist/cli/tui/version.d.ts +2 -0
- package/dist/cli/tui/version.d.ts.map +1 -0
- package/dist/cli/tui/version.js +14 -0
- package/dist/cli/tui/version.js.map +1 -0
- package/dist/cli/uninstall.d.ts +2 -0
- package/dist/cli/uninstall.d.ts.map +1 -0
- package/dist/cli/uninstall.js +57 -0
- package/dist/cli/uninstall.js.map +1 -0
- package/dist/cli/warmup.d.ts +10 -2
- package/dist/cli/warmup.d.ts.map +1 -1
- package/dist/cli/warmup.js +226 -93
- package/dist/cli/warmup.js.map +1 -1
- package/dist/config.d.ts +28 -2
- package/dist/config.d.ts.map +1 -1
- package/dist/config.js +106 -56
- package/dist/config.js.map +1 -1
- package/dist/crawl/crawler.d.ts +6 -0
- package/dist/crawl/crawler.d.ts.map +1 -1
- package/dist/crawl/crawler.js +210 -209
- package/dist/crawl/crawler.js.map +1 -1
- package/dist/crawl/dedup.d.ts +1 -0
- package/dist/crawl/dedup.d.ts.map +1 -1
- package/dist/crawl/dedup.js +124 -81
- package/dist/crawl/dedup.js.map +1 -1
- package/dist/crawl/etag-incremental.d.ts +43 -0
- package/dist/crawl/etag-incremental.d.ts.map +1 -0
- package/dist/crawl/etag-incremental.js +94 -0
- package/dist/crawl/etag-incremental.js.map +1 -0
- package/dist/crawl/index-to-vec.d.ts +10 -0
- package/dist/crawl/index-to-vec.d.ts.map +1 -0
- package/dist/crawl/index-to-vec.js +44 -0
- package/dist/crawl/index-to-vec.js.map +1 -0
- package/dist/crawl/mapper.js +136 -164
- package/dist/crawl/mapper.js.map +1 -1
- package/dist/crawl/rate-limiter.js +63 -66
- package/dist/crawl/rate-limiter.js.map +1 -1
- package/dist/crawl/robots.js +58 -57
- package/dist/crawl/robots.js.map +1 -1
- package/dist/crawl/sitemap-first.d.ts +12 -0
- package/dist/crawl/sitemap-first.d.ts.map +1 -0
- package/dist/crawl/sitemap-first.js +47 -0
- package/dist/crawl/sitemap-first.js.map +1 -0
- package/dist/crawl/sitemap.js +33 -32
- package/dist/crawl/sitemap.js.map +1 -1
- package/dist/crawl/url-utils.d.ts +1 -0
- package/dist/crawl/url-utils.d.ts.map +1 -1
- package/dist/crawl/url-utils.js +49 -37
- package/dist/crawl/url-utils.js.map +1 -1
- package/dist/daemon/health-check.d.ts +16 -0
- package/dist/daemon/health-check.d.ts.map +1 -0
- package/dist/daemon/health-check.js +33 -0
- package/dist/daemon/health-check.js.map +1 -0
- package/dist/daemon/http-server.d.ts +26 -0
- package/dist/daemon/http-server.d.ts.map +1 -0
- package/dist/daemon/http-server.js +275 -0
- package/dist/daemon/http-server.js.map +1 -0
- package/dist/daemon/proxy.d.ts +10 -0
- package/dist/daemon/proxy.d.ts.map +1 -0
- package/dist/daemon/proxy.js +93 -0
- package/dist/daemon/proxy.js.map +1 -0
- package/dist/embedding/embed.d.ts +59 -0
- package/dist/embedding/embed.d.ts.map +1 -0
- package/dist/embedding/embed.js +233 -0
- package/dist/embedding/embed.js.map +1 -0
- package/dist/embedding/fastembed-provider.d.ts +19 -0
- package/dist/embedding/fastembed-provider.d.ts.map +1 -0
- package/dist/embedding/fastembed-provider.js +51 -0
- package/dist/embedding/fastembed-provider.js.map +1 -0
- package/dist/embedding/key-terms.d.ts +12 -0
- package/dist/embedding/key-terms.d.ts.map +1 -0
- package/dist/embedding/key-terms.js +234 -0
- package/dist/embedding/key-terms.js.map +1 -0
- package/dist/extraction/boilerplate.d.ts +15 -0
- package/dist/extraction/boilerplate.d.ts.map +1 -0
- package/dist/extraction/boilerplate.js +52 -0
- package/dist/extraction/boilerplate.js.map +1 -0
- package/dist/extraction/defuddle.d.ts.map +1 -1
- package/dist/extraction/defuddle.js +27 -23
- package/dist/extraction/defuddle.js.map +1 -1
- package/dist/extraction/extract.d.ts.map +1 -1
- package/dist/extraction/extract.js +76 -76
- package/dist/extraction/extract.js.map +1 -1
- package/dist/extraction/jsonld.js +50 -54
- package/dist/extraction/jsonld.js.map +1 -1
- package/dist/extraction/lang-hints.d.ts +2 -0
- package/dist/extraction/lang-hints.d.ts.map +1 -0
- package/dist/extraction/lang-hints.js +30 -0
- package/dist/extraction/lang-hints.js.map +1 -0
- package/dist/extraction/llm-fallback.d.ts +17 -0
- package/dist/extraction/llm-fallback.d.ts.map +1 -0
- package/dist/extraction/llm-fallback.js +130 -0
- package/dist/extraction/llm-fallback.js.map +1 -0
- package/dist/extraction/markdown-sanitize.d.ts +2 -0
- package/dist/extraction/markdown-sanitize.d.ts.map +1 -0
- package/dist/extraction/markdown-sanitize.js +151 -0
- package/dist/extraction/markdown-sanitize.js.map +1 -0
- package/dist/extraction/markdown.d.ts +11 -0
- package/dist/extraction/markdown.d.ts.map +1 -1
- package/dist/extraction/markdown.js +195 -91
- package/dist/extraction/markdown.js.map +1 -1
- package/dist/extraction/pipeline.d.ts +8 -0
- package/dist/extraction/pipeline.d.ts.map +1 -1
- package/dist/extraction/pipeline.js +57 -91
- package/dist/extraction/pipeline.js.map +1 -1
- package/dist/extraction/readability.d.ts +1 -1
- package/dist/extraction/readability.d.ts.map +1 -1
- package/dist/extraction/readability.js +28 -29
- package/dist/extraction/readability.js.map +1 -1
- package/dist/extraction/schema.d.ts +12 -0
- package/dist/extraction/schema.d.ts.map +1 -1
- package/dist/extraction/schema.js +135 -72
- package/dist/extraction/schema.js.map +1 -1
- package/dist/extraction/site-extractors/docs-generic.d.ts.map +1 -1
- package/dist/extraction/site-extractors/docs-generic.js +81 -91
- package/dist/extraction/site-extractors/docs-generic.js.map +1 -1
- package/dist/extraction/site-extractors/github.d.ts.map +1 -1
- package/dist/extraction/site-extractors/github.js +87 -95
- package/dist/extraction/site-extractors/github.js.map +1 -1
- package/dist/extraction/site-extractors/mdn.d.ts.map +1 -1
- package/dist/extraction/site-extractors/mdn.js +46 -54
- package/dist/extraction/site-extractors/mdn.js.map +1 -1
- package/dist/extraction/site-extractors/stackoverflow.d.ts.map +1 -1
- package/dist/extraction/site-extractors/stackoverflow.js +71 -80
- package/dist/extraction/site-extractors/stackoverflow.js.map +1 -1
- package/dist/extraction/structured-data.d.ts +4 -0
- package/dist/extraction/structured-data.d.ts.map +1 -0
- package/dist/extraction/structured-data.js +173 -0
- package/dist/extraction/structured-data.js.map +1 -0
- package/dist/extraction/structured.d.ts +4 -0
- package/dist/extraction/structured.d.ts.map +1 -0
- package/dist/extraction/structured.js +163 -0
- package/dist/extraction/structured.js.map +1 -0
- package/dist/extraction/v1/classifier.d.ts +3 -0
- package/dist/extraction/v1/classifier.d.ts.map +1 -0
- package/dist/extraction/v1/classifier.js +110 -0
- package/dist/extraction/v1/classifier.js.map +1 -0
- package/dist/extraction/v1/extract-provider.d.ts +16 -0
- package/dist/extraction/v1/extract-provider.d.ts.map +1 -0
- package/dist/extraction/v1/extract-provider.js +43 -0
- package/dist/extraction/v1/extract-provider.js.map +1 -0
- package/dist/extraction/v1/local-llm.d.ts +8 -0
- package/dist/extraction/v1/local-llm.d.ts.map +1 -0
- package/dist/extraction/v1/local-llm.js +34 -0
- package/dist/extraction/v1/local-llm.js.map +1 -0
- package/dist/extraction/v1/news.d.ts +3 -0
- package/dist/extraction/v1/news.d.ts.map +1 -0
- package/dist/extraction/v1/news.js +61 -0
- package/dist/extraction/v1/news.js.map +1 -0
- package/dist/extraction/v1/product.d.ts +3 -0
- package/dist/extraction/v1/product.d.ts.map +1 -0
- package/dist/extraction/v1/product.js +166 -0
- package/dist/extraction/v1/product.js.map +1 -0
- package/dist/extraction/v1/recipe.d.ts +3 -0
- package/dist/extraction/v1/recipe.d.ts.map +1 -0
- package/dist/extraction/v1/recipe.js +136 -0
- package/dist/extraction/v1/recipe.js.map +1 -0
- package/dist/extraction/v1/routed.d.ts +17 -0
- package/dist/extraction/v1/routed.d.ts.map +1 -0
- package/dist/extraction/v1/routed.js +68 -0
- package/dist/extraction/v1/routed.js.map +1 -0
- package/dist/extraction/v1/schemas/Article.d.ts +11 -0
- package/dist/extraction/v1/schemas/Article.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Article.js +23 -0
- package/dist/extraction/v1/schemas/Article.js.map +1 -0
- package/dist/extraction/v1/schemas/CodeSnippet.d.ts +9 -0
- package/dist/extraction/v1/schemas/CodeSnippet.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/CodeSnippet.js +90 -0
- package/dist/extraction/v1/schemas/CodeSnippet.js.map +1 -0
- package/dist/extraction/v1/schemas/EventListing.d.ts +10 -0
- package/dist/extraction/v1/schemas/EventListing.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/EventListing.js +122 -0
- package/dist/extraction/v1/schemas/EventListing.js.map +1 -0
- package/dist/extraction/v1/schemas/Paper.d.ts +10 -0
- package/dist/extraction/v1/schemas/Paper.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Paper.js +156 -0
- package/dist/extraction/v1/schemas/Paper.js.map +1 -0
- package/dist/extraction/v1/schemas/Product.d.ts +17 -0
- package/dist/extraction/v1/schemas/Product.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Product.js +149 -0
- package/dist/extraction/v1/schemas/Product.js.map +1 -0
- package/dist/extraction/v1/schemas/Recipe.d.ts +14 -0
- package/dist/extraction/v1/schemas/Recipe.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Recipe.js +160 -0
- package/dist/extraction/v1/schemas/Recipe.js.map +1 -0
- package/dist/extraction/v1/schemas/index.d.ts +13 -0
- package/dist/extraction/v1/schemas/index.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/index.js +44 -0
- package/dist/extraction/v1/schemas/index.js.map +1 -0
- package/dist/extraction/v1/site-extractors.d.ts +5 -0
- package/dist/extraction/v1/site-extractors.d.ts.map +1 -0
- package/dist/extraction/v1/site-extractors.js +31 -0
- package/dist/extraction/v1/site-extractors.js.map +1 -0
- package/dist/fetch/action-executor.d.ts +28 -0
- package/dist/fetch/action-executor.d.ts.map +1 -0
- package/dist/fetch/action-executor.js +88 -0
- package/dist/fetch/action-executor.js.map +1 -0
- package/dist/fetch/auth.d.ts +2 -1
- package/dist/fetch/auth.d.ts.map +1 -1
- package/dist/fetch/auth.js +56 -26
- package/dist/fetch/auth.js.map +1 -1
- package/dist/fetch/browser-pool.d.ts +30 -11
- package/dist/fetch/browser-pool.d.ts.map +1 -1
- package/dist/fetch/browser-pool.js +303 -127
- package/dist/fetch/browser-pool.js.map +1 -1
- package/dist/fetch/browser-selector.d.ts +17 -0
- package/dist/fetch/browser-selector.d.ts.map +1 -0
- package/dist/fetch/browser-selector.js +72 -0
- package/dist/fetch/browser-selector.js.map +1 -0
- package/dist/fetch/browser-types.d.ts +3 -0
- package/dist/fetch/browser-types.d.ts.map +1 -0
- package/dist/fetch/browser-types.js +45 -0
- package/dist/fetch/browser-types.js.map +1 -0
- package/dist/fetch/cdp-client.d.ts +9 -0
- package/dist/fetch/cdp-client.d.ts.map +1 -0
- package/dist/fetch/cdp-client.js +89 -0
- package/dist/fetch/cdp-client.js.map +1 -0
- package/dist/fetch/content-check.js +39 -46
- package/dist/fetch/content-check.js.map +1 -1
- package/dist/fetch/error-describe.d.ts +7 -0
- package/dist/fetch/error-describe.d.ts.map +1 -0
- package/dist/fetch/error-describe.js +37 -0
- package/dist/fetch/error-describe.js.map +1 -0
- package/dist/fetch/http-client.d.ts +4 -0
- package/dist/fetch/http-client.d.ts.map +1 -1
- package/dist/fetch/http-client.js +147 -128
- package/dist/fetch/http-client.js.map +1 -1
- package/dist/fetch/lightpanda.d.ts +28 -0
- package/dist/fetch/lightpanda.d.ts.map +1 -0
- package/dist/fetch/lightpanda.js +174 -0
- package/dist/fetch/lightpanda.js.map +1 -0
- package/dist/fetch/playwright-tier.d.ts +19 -0
- package/dist/fetch/playwright-tier.d.ts.map +1 -0
- package/dist/fetch/playwright-tier.js +76 -0
- package/dist/fetch/playwright-tier.js.map +1 -0
- package/dist/fetch/router.d.ts +49 -3
- package/dist/fetch/router.d.ts.map +1 -1
- package/dist/fetch/router.js +187 -81
- package/dist/fetch/router.js.map +1 -1
- package/dist/index.js +102 -17
- package/dist/index.js.map +1 -1
- package/dist/instructions.d.ts +31 -0
- package/dist/instructions.d.ts.map +1 -0
- package/dist/instructions.js +245 -0
- package/dist/instructions.js.map +1 -0
- package/dist/integrations/cloud/llm/anthropic.d.ts +3 -0
- package/dist/integrations/cloud/llm/anthropic.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/anthropic.js +41 -0
- package/dist/integrations/cloud/llm/anthropic.js.map +1 -0
- package/dist/integrations/cloud/llm/cache.d.ts +5 -0
- package/dist/integrations/cloud/llm/cache.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/cache.js +49 -0
- package/dist/integrations/cloud/llm/cache.js.map +1 -0
- package/dist/integrations/cloud/llm/gemini.d.ts +3 -0
- package/dist/integrations/cloud/llm/gemini.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/gemini.js +37 -0
- package/dist/integrations/cloud/llm/gemini.js.map +1 -0
- package/dist/integrations/cloud/llm/groq.d.ts +3 -0
- package/dist/integrations/cloud/llm/groq.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/groq.js +74 -0
- package/dist/integrations/cloud/llm/groq.js.map +1 -0
- package/dist/integrations/cloud/llm/hash.d.ts +3 -0
- package/dist/integrations/cloud/llm/hash.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/hash.js +26 -0
- package/dist/integrations/cloud/llm/hash.js.map +1 -0
- package/dist/integrations/cloud/llm/model-select.d.ts +5 -0
- package/dist/integrations/cloud/llm/model-select.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/model-select.js +32 -0
- package/dist/integrations/cloud/llm/model-select.js.map +1 -0
- package/dist/integrations/cloud/llm/openai.d.ts +3 -0
- package/dist/integrations/cloud/llm/openai.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/openai.js +43 -0
- package/dist/integrations/cloud/llm/openai.js.map +1 -0
- package/dist/integrations/cloud/llm/run.d.ts +27 -0
- package/dist/integrations/cloud/llm/run.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/run.js +99 -0
- package/dist/integrations/cloud/llm/run.js.map +1 -0
- package/dist/integrations/cloud/llm/select.d.ts +5 -0
- package/dist/integrations/cloud/llm/select.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/select.js +30 -0
- package/dist/integrations/cloud/llm/select.js.map +1 -0
- package/dist/integrations/cloud/llm/text-adapters.d.ts +19 -0
- package/dist/integrations/cloud/llm/text-adapters.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/text-adapters.js +103 -0
- package/dist/integrations/cloud/llm/text-adapters.js.map +1 -0
- package/dist/integrations/cloud/llm/types.d.ts +24 -0
- package/dist/integrations/cloud/llm/types.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/types.js +1 -0
- package/dist/integrations/cloud/llm/types.js.map +1 -0
- package/dist/integrations/cloud/llm/validate.d.ts +6 -0
- package/dist/integrations/cloud/llm/validate.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/validate.js +63 -0
- package/dist/integrations/cloud/llm/validate.js.map +1 -0
- package/dist/logger.d.ts +4 -1
- package/dist/logger.d.ts.map +1 -1
- package/dist/logger.js +71 -30
- package/dist/logger.js.map +1 -1
- package/dist/pdf-parse.d.js +1 -0
- package/dist/pdf-parse.d.js.map +1 -0
- package/dist/plugins/loader.d.ts +20 -0
- package/dist/plugins/loader.d.ts.map +1 -0
- package/dist/plugins/loader.js +157 -0
- package/dist/plugins/loader.js.map +1 -0
- package/dist/plugins/registry.d.ts +26 -0
- package/dist/plugins/registry.d.ts.map +1 -0
- package/dist/plugins/registry.js +71 -0
- package/dist/plugins/registry.js.map +1 -0
- package/dist/plugins/validate.d.ts +9 -0
- package/dist/plugins/validate.d.ts.map +1 -0
- package/dist/plugins/validate.js +79 -0
- package/dist/plugins/validate.js.map +1 -0
- package/dist/providers/embed-provider.d.ts +11 -0
- package/dist/providers/embed-provider.d.ts.map +1 -0
- package/dist/providers/embed-provider.js +24 -0
- package/dist/providers/embed-provider.js.map +1 -0
- package/dist/providers/extract-provider.d.ts +23 -0
- package/dist/providers/extract-provider.d.ts.map +1 -0
- package/dist/providers/extract-provider.js +25 -0
- package/dist/providers/extract-provider.js.map +1 -0
- package/dist/providers/rerank-provider.d.ts +17 -0
- package/dist/providers/rerank-provider.d.ts.map +1 -0
- package/dist/providers/rerank-provider.js +41 -0
- package/dist/providers/rerank-provider.js.map +1 -0
- package/dist/providers/search-provider.d.ts +25 -0
- package/dist/providers/search-provider.d.ts.map +1 -0
- package/dist/providers/search-provider.js +44 -0
- package/dist/providers/search-provider.js.map +1 -0
- package/dist/providers/vector-store.d.ts +27 -0
- package/dist/providers/vector-store.d.ts.map +1 -0
- package/dist/providers/vector-store.js +27 -0
- package/dist/providers/vector-store.js.map +1 -0
- package/dist/python-env.d.ts +9 -0
- package/dist/python-env.d.ts.map +1 -0
- package/dist/python-env.js +13 -0
- package/dist/python-env.js.map +1 -0
- package/dist/repl/commands/agent.d.ts +5 -0
- package/dist/repl/commands/agent.d.ts.map +1 -0
- package/dist/repl/commands/agent.js +62 -0
- package/dist/repl/commands/agent.js.map +1 -0
- package/dist/repl/commands/cache.d.ts +4 -0
- package/dist/repl/commands/cache.d.ts.map +1 -0
- package/dist/repl/commands/cache.js +43 -0
- package/dist/repl/commands/cache.js.map +1 -0
- package/dist/repl/commands/crawl.d.ts +7 -0
- package/dist/repl/commands/crawl.d.ts.map +1 -0
- package/dist/repl/commands/crawl.js +44 -0
- package/dist/repl/commands/crawl.js.map +1 -0
- package/dist/repl/commands/extract.d.ts +5 -0
- package/dist/repl/commands/extract.d.ts.map +1 -0
- package/dist/repl/commands/extract.js +47 -0
- package/dist/repl/commands/extract.js.map +1 -0
- package/dist/repl/commands/fetch.d.ts +5 -0
- package/dist/repl/commands/fetch.d.ts.map +1 -0
- package/dist/repl/commands/fetch.js +67 -0
- package/dist/repl/commands/fetch.js.map +1 -0
- package/dist/repl/commands/find-similar.d.ts +5 -0
- package/dist/repl/commands/find-similar.d.ts.map +1 -0
- package/dist/repl/commands/find-similar.js +74 -0
- package/dist/repl/commands/find-similar.js.map +1 -0
- package/dist/repl/commands/research.d.ts +5 -0
- package/dist/repl/commands/research.d.ts.map +1 -0
- package/dist/repl/commands/research.js +65 -0
- package/dist/repl/commands/research.js.map +1 -0
- package/dist/repl/commands/search.d.ts +5 -0
- package/dist/repl/commands/search.d.ts.map +1 -0
- package/dist/repl/commands/search.js +74 -0
- package/dist/repl/commands/search.js.map +1 -0
- package/dist/repl/commands/types.d.ts +9 -0
- package/dist/repl/commands/types.d.ts.map +1 -0
- package/dist/repl/commands/types.js +1 -0
- package/dist/repl/commands/types.js.map +1 -0
- package/dist/repl/formatters.d.ts +13 -0
- package/dist/repl/formatters.d.ts.map +1 -0
- package/dist/repl/formatters.js +283 -0
- package/dist/repl/formatters.js.map +1 -0
- package/dist/repl/parser.d.ts +9 -0
- package/dist/repl/parser.d.ts.map +1 -0
- package/dist/repl/parser.js +86 -0
- package/dist/repl/parser.js.map +1 -0
- package/dist/repl/shell.d.ts +8 -0
- package/dist/repl/shell.d.ts.map +1 -0
- package/dist/repl/shell.js +184 -0
- package/dist/repl/shell.js.map +1 -0
- package/dist/research/branch-exploration.d.ts +14 -0
- package/dist/research/branch-exploration.d.ts.map +1 -0
- package/dist/research/branch-exploration.js +100 -0
- package/dist/research/branch-exploration.js.map +1 -0
- package/dist/research/brief.d.ts +6 -0
- package/dist/research/brief.d.ts.map +1 -0
- package/dist/research/brief.js +246 -0
- package/dist/research/brief.js.map +1 -0
- package/dist/research/citation-graph.d.ts +9 -0
- package/dist/research/citation-graph.d.ts.map +1 -0
- package/dist/research/citation-graph.js +114 -0
- package/dist/research/citation-graph.js.map +1 -0
- package/dist/research/decompose.d.ts +14 -0
- package/dist/research/decompose.d.ts.map +1 -0
- package/dist/research/decompose.js +439 -0
- package/dist/research/decompose.js.map +1 -0
- package/dist/research/pipeline.d.ts +5 -0
- package/dist/research/pipeline.d.ts.map +1 -0
- package/dist/research/pipeline.js +269 -0
- package/dist/research/pipeline.js.map +1 -0
- package/dist/research/synthesis-local.d.ts +19 -0
- package/dist/research/synthesis-local.d.ts.map +1 -0
- package/dist/research/synthesis-local.js +62 -0
- package/dist/research/synthesis-local.js.map +1 -0
- package/dist/research/synthesize.d.ts +10 -0
- package/dist/research/synthesize.d.ts.map +1 -0
- package/dist/research/synthesize.js +137 -0
- package/dist/research/synthesize.js.map +1 -0
- package/dist/search/answer-synthesis.d.ts +33 -0
- package/dist/search/answer-synthesis.d.ts.map +1 -0
- package/dist/search/answer-synthesis.js +244 -0
- package/dist/search/answer-synthesis.js.map +1 -0
- package/dist/search/context-formatter.d.ts +3 -0
- package/dist/search/context-formatter.d.ts.map +1 -0
- package/dist/search/context-formatter.js +56 -0
- package/dist/search/context-formatter.js.map +1 -0
- package/dist/search/dedup.d.ts +1 -0
- package/dist/search/dedup.d.ts.map +1 -1
- package/dist/search/dedup.js +40 -32
- package/dist/search/dedup.js.map +1 -1
- package/dist/search/engines/arxiv.d.ts +7 -0
- package/dist/search/engines/arxiv.d.ts.map +1 -0
- package/dist/search/engines/arxiv.js +70 -0
- package/dist/search/engines/arxiv.js.map +1 -0
- package/dist/search/engines/bing-news.d.ts +7 -0
- package/dist/search/engines/bing-news.d.ts.map +1 -0
- package/dist/search/engines/bing-news.js +97 -0
- package/dist/search/engines/bing-news.js.map +1 -0
- package/dist/search/engines/bing.d.ts +1 -0
- package/dist/search/engines/bing.d.ts.map +1 -1
- package/dist/search/engines/bing.js +100 -44
- package/dist/search/engines/bing.js.map +1 -1
- package/dist/search/engines/devdocs.d.ts +6 -0
- package/dist/search/engines/devdocs.d.ts.map +1 -0
- package/dist/search/engines/devdocs.js +56 -0
- package/dist/search/engines/devdocs.js.map +1 -0
- package/dist/search/engines/duckduckgo.d.ts.map +1 -1
- package/dist/search/engines/duckduckgo.js +56 -44
- package/dist/search/engines/duckduckgo.js.map +1 -1
- package/dist/search/engines/github-code.d.ts +7 -0
- package/dist/search/engines/github-code.d.ts.map +1 -0
- package/dist/search/engines/github-code.js +55 -0
- package/dist/search/engines/github-code.js.map +1 -0
- package/dist/search/engines/hn-algolia.d.ts +7 -0
- package/dist/search/engines/hn-algolia.d.ts.map +1 -0
- package/dist/search/engines/hn-algolia.js +76 -0
- package/dist/search/engines/hn-algolia.js.map +1 -0
- package/dist/search/engines/lobsters.d.ts +7 -0
- package/dist/search/engines/lobsters.d.ts.map +1 -0
- package/dist/search/engines/lobsters.js +83 -0
- package/dist/search/engines/lobsters.js.map +1 -0
- package/dist/search/engines/mdn.d.ts +7 -0
- package/dist/search/engines/mdn.d.ts.map +1 -0
- package/dist/search/engines/mdn.js +48 -0
- package/dist/search/engines/mdn.js.map +1 -0
- package/dist/search/engines/semantic-scholar.d.ts +7 -0
- package/dist/search/engines/semantic-scholar.d.ts.map +1 -0
- package/dist/search/engines/semantic-scholar.js +69 -0
- package/dist/search/engines/semantic-scholar.js.map +1 -0
- package/dist/search/engines/stackoverflow.d.ts +7 -0
- package/dist/search/engines/stackoverflow.d.ts.map +1 -0
- package/dist/search/engines/stackoverflow.js +73 -0
- package/dist/search/engines/stackoverflow.js.map +1 -0
- package/dist/search/engines/startpage.d.ts.map +1 -1
- package/dist/search/engines/startpage.js +65 -46
- package/dist/search/engines/startpage.js.map +1 -1
- package/dist/search/evidence.d.ts +25 -0
- package/dist/search/evidence.d.ts.map +1 -0
- package/dist/search/evidence.js +220 -0
- package/dist/search/evidence.js.map +1 -0
- package/dist/search/filters.d.ts.map +1 -1
- package/dist/search/filters.js +58 -54
- package/dist/search/filters.js.map +1 -1
- package/dist/search/find-similar/crawl-rank.d.ts +9 -0
- package/dist/search/find-similar/crawl-rank.d.ts.map +1 -0
- package/dist/search/find-similar/crawl-rank.js +272 -0
- package/dist/search/find-similar/crawl-rank.js.map +1 -0
- package/dist/search/find-similar/mode.d.ts +4 -0
- package/dist/search/find-similar/mode.d.ts.map +1 -0
- package/dist/search/find-similar/mode.js +12 -0
- package/dist/search/find-similar/mode.js.map +1 -0
- package/dist/search/find-similar.d.ts +5 -0
- package/dist/search/find-similar.d.ts.map +1 -0
- package/dist/search/find-similar.js +509 -0
- package/dist/search/find-similar.js.map +1 -0
- package/dist/search/highlights.d.ts +19 -0
- package/dist/search/highlights.d.ts.map +1 -0
- package/dist/search/highlights.js +167 -0
- package/dist/search/highlights.js.map +1 -0
- package/dist/search/language-filter.d.ts +29 -0
- package/dist/search/language-filter.d.ts.map +1 -0
- package/dist/search/language-filter.js +126 -0
- package/dist/search/language-filter.js.map +1 -0
- package/dist/search/legacy/searxng-orchestrator.d.ts +4 -0
- package/dist/search/legacy/searxng-orchestrator.d.ts.map +1 -0
- package/dist/search/legacy/searxng-orchestrator.js +501 -0
- package/dist/search/legacy/searxng-orchestrator.js.map +1 -0
- package/dist/search/legacy/searxng-provider.d.ts +7 -0
- package/dist/search/legacy/searxng-provider.d.ts.map +1 -0
- package/dist/search/legacy/searxng-provider.js +11 -0
- package/dist/search/legacy/searxng-provider.js.map +1 -0
- package/dist/search/multi-query.d.ts +25 -0
- package/dist/search/multi-query.d.ts.map +1 -0
- package/dist/search/multi-query.js +228 -0
- package/dist/search/multi-query.js.map +1 -0
- package/dist/search/query.js +32 -34
- package/dist/search/query.js.map +1 -1
- package/dist/search/rerank.d.ts +3 -1
- package/dist/search/rerank.d.ts.map +1 -1
- package/dist/search/rerank.js +44 -35
- package/dist/search/rerank.js.map +1 -1
- package/dist/search/reranker/authority-boost.d.ts +3 -0
- package/dist/search/reranker/authority-boost.d.ts.map +1 -0
- package/dist/search/reranker/authority-boost.js +179 -0
- package/dist/search/reranker/authority-boost.js.map +1 -0
- package/dist/search/reranker/consensus-boost.d.ts +3 -0
- package/dist/search/reranker/consensus-boost.d.ts.map +1 -0
- package/dist/search/reranker/consensus-boost.js +27 -0
- package/dist/search/reranker/consensus-boost.js.map +1 -0
- package/dist/search/reranker/recency-boost.d.ts +3 -0
- package/dist/search/reranker/recency-boost.d.ts.map +1 -0
- package/dist/search/reranker/recency-boost.js +13 -0
- package/dist/search/reranker/recency-boost.js.map +1 -0
- package/dist/search/reranker/recency.d.ts +3 -0
- package/dist/search/reranker/recency.d.ts.map +1 -0
- package/dist/search/reranker/recency.js +23 -0
- package/dist/search/reranker/recency.js.map +1 -0
- package/dist/search/reranker/transformers-rerank-provider.d.ts +13 -0
- package/dist/search/reranker/transformers-rerank-provider.d.ts.map +1 -0
- package/dist/search/reranker/transformers-rerank-provider.js +94 -0
- package/dist/search/reranker/transformers-rerank-provider.js.map +1 -0
- package/dist/search/rrf.d.ts +17 -0
- package/dist/search/rrf.d.ts.map +1 -0
- package/dist/search/rrf.js +39 -0
- package/dist/search/rrf.js.map +1 -0
- package/dist/search/sampling.d.ts +25 -0
- package/dist/search/sampling.d.ts.map +1 -0
- package/dist/search/sampling.js +52 -0
- package/dist/search/sampling.js.map +1 -0
- package/dist/search/searxng.d.ts.map +1 -1
- package/dist/search/searxng.js +69 -79
- package/dist/search/searxng.js.map +1 -1
- package/dist/search/tokens.d.ts +3 -0
- package/dist/search/tokens.d.ts.map +1 -0
- package/dist/search/tokens.js +39 -0
- package/dist/search/tokens.js.map +1 -0
- package/dist/search/truncate.d.ts +6 -0
- package/dist/search/truncate.d.ts.map +1 -0
- package/dist/search/truncate.js +26 -0
- package/dist/search/truncate.js.map +1 -0
- package/dist/search/url-unwrap.d.ts +3 -0
- package/dist/search/url-unwrap.d.ts.map +1 -0
- package/dist/search/url-unwrap.js +43 -0
- package/dist/search/url-unwrap.js.map +1 -0
- package/dist/search/v1/context-rank.d.ts +13 -0
- package/dist/search/v1/context-rank.d.ts.map +1 -0
- package/dist/search/v1/context-rank.js +74 -0
- package/dist/search/v1/context-rank.js.map +1 -0
- package/dist/search/v1/engine-base.d.ts +27 -0
- package/dist/search/v1/engine-base.d.ts.map +1 -0
- package/dist/search/v1/engine-base.js +110 -0
- package/dist/search/v1/engine-base.js.map +1 -0
- package/dist/search/v1/intent-router.d.ts +22 -0
- package/dist/search/v1/intent-router.d.ts.map +1 -0
- package/dist/search/v1/intent-router.js +138 -0
- package/dist/search/v1/intent-router.js.map +1 -0
- package/dist/search/v1/orchestrator.d.ts +24 -0
- package/dist/search/v1/orchestrator.d.ts.map +1 -0
- package/dist/search/v1/orchestrator.js +163 -0
- package/dist/search/v1/orchestrator.js.map +1 -0
- package/dist/search/v1/recency-boost.d.ts +9 -0
- package/dist/search/v1/recency-boost.d.ts.map +1 -0
- package/dist/search/v1/recency-boost.js +37 -0
- package/dist/search/v1/recency-boost.js.map +1 -0
- package/dist/search/v1/recent-cache-dedup.d.ts +6 -0
- package/dist/search/v1/recent-cache-dedup.d.ts.map +1 -0
- package/dist/search/v1/recent-cache-dedup.js +85 -0
- package/dist/search/v1/recent-cache-dedup.js.map +1 -0
- package/dist/search/v1/rss/feed-config.d.ts +21 -0
- package/dist/search/v1/rss/feed-config.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-config.js +90 -0
- package/dist/search/v1/rss/feed-config.js.map +1 -0
- package/dist/search/v1/rss/feed-parser.d.ts +14 -0
- package/dist/search/v1/rss/feed-parser.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-parser.js +104 -0
- package/dist/search/v1/rss/feed-parser.js.map +1 -0
- package/dist/search/v1/rss/feed-poller.d.ts +22 -0
- package/dist/search/v1/rss/feed-poller.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-poller.js +102 -0
- package/dist/search/v1/rss/feed-poller.js.map +1 -0
- package/dist/search/v1/rss/feed-store.d.ts +30 -0
- package/dist/search/v1/rss/feed-store.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-store.js +134 -0
- package/dist/search/v1/rss/feed-store.js.map +1 -0
- package/dist/search/v1/rss/rss-engine.d.ts +6 -0
- package/dist/search/v1/rss/rss-engine.d.ts.map +1 -0
- package/dist/search/v1/rss/rss-engine.js +28 -0
- package/dist/search/v1/rss/rss-engine.js.map +1 -0
- package/dist/search/v1/v1-provider.d.ts +7 -0
- package/dist/search/v1/v1-provider.d.ts.map +1 -0
- package/dist/search/v1/v1-provider.js +68 -0
- package/dist/search/v1/v1-provider.js.map +1 -0
- package/dist/search/v1/verticals/code.d.ts +4 -0
- package/dist/search/v1/verticals/code.d.ts.map +1 -0
- package/dist/search/v1/verticals/code.js +20 -0
- package/dist/search/v1/verticals/code.js.map +1 -0
- package/dist/search/v1/verticals/docs.d.ts +4 -0
- package/dist/search/v1/verticals/docs.d.ts.map +1 -0
- package/dist/search/v1/verticals/docs.js +20 -0
- package/dist/search/v1/verticals/docs.js.map +1 -0
- package/dist/search/v1/verticals/general.d.ts +4 -0
- package/dist/search/v1/verticals/general.d.ts.map +1 -0
- package/dist/search/v1/verticals/general.js +22 -0
- package/dist/search/v1/verticals/general.js.map +1 -0
- package/dist/search/v1/verticals/news.d.ts +10 -0
- package/dist/search/v1/verticals/news.d.ts.map +1 -0
- package/dist/search/v1/verticals/news.js +52 -0
- package/dist/search/v1/verticals/news.js.map +1 -0
- package/dist/search/v1/verticals/papers.d.ts +4 -0
- package/dist/search/v1/verticals/papers.d.ts.map +1 -0
- package/dist/search/v1/verticals/papers.js +23 -0
- package/dist/search/v1/verticals/papers.js.map +1 -0
- package/dist/search/validator.js +31 -31
- package/dist/search/validator.js.map +1 -1
- package/dist/searxng/bootstrap.d.ts +30 -0
- package/dist/searxng/bootstrap.d.ts.map +1 -1
- package/dist/searxng/bootstrap.js +223 -85
- package/dist/searxng/bootstrap.js.map +1 -1
- package/dist/searxng/docker.d.ts.map +1 -1
- package/dist/searxng/docker.js +69 -60
- package/dist/searxng/docker.js.map +1 -1
- package/dist/searxng/process.d.ts +13 -1
- package/dist/searxng/process.d.ts.map +1 -1
- package/dist/searxng/process.js +231 -164
- package/dist/searxng/process.js.map +1 -1
- package/dist/server/backend-status.d.ts +13 -0
- package/dist/server/backend-status.d.ts.map +1 -0
- package/dist/server/backend-status.js +40 -0
- package/dist/server/backend-status.js.map +1 -0
- package/dist/server/tool-schemas.d.ts +549 -0
- package/dist/server/tool-schemas.d.ts.map +1 -0
- package/dist/server/tool-schemas.js +464 -0
- package/dist/server/tool-schemas.js.map +1 -0
- package/dist/server/warmup-on-start.d.ts +9 -0
- package/dist/server/warmup-on-start.d.ts.map +1 -0
- package/dist/server/warmup-on-start.js +55 -0
- package/dist/server/warmup-on-start.js.map +1 -0
- package/dist/server.d.ts +17 -0
- package/dist/server.d.ts.map +1 -1
- package/dist/server.js +454 -297
- package/dist/server.js.map +1 -1
- package/dist/tools/agent.d.ts +5 -0
- package/dist/tools/agent.d.ts.map +1 -0
- package/dist/tools/agent.js +128 -0
- package/dist/tools/agent.js.map +1 -0
- package/dist/tools/cache.d.ts +2 -1
- package/dist/tools/cache.d.ts.map +1 -1
- package/dist/tools/cache.js +177 -44
- package/dist/tools/cache.js.map +1 -1
- package/dist/tools/crawl.d.ts.map +1 -1
- package/dist/tools/crawl.js +171 -88
- package/dist/tools/crawl.js.map +1 -1
- package/dist/tools/extract.d.ts +2 -2
- package/dist/tools/extract.d.ts.map +1 -1
- package/dist/tools/extract.js +175 -59
- package/dist/tools/extract.js.map +1 -1
- package/dist/tools/fetch.d.ts +2 -2
- package/dist/tools/fetch.d.ts.map +1 -1
- package/dist/tools/fetch.js +174 -68
- package/dist/tools/fetch.js.map +1 -1
- package/dist/tools/find-similar.d.ts +5 -0
- package/dist/tools/find-similar.d.ts.map +1 -0
- package/dist/tools/find-similar.js +127 -0
- package/dist/tools/find-similar.js.map +1 -0
- package/dist/tools/research.d.ts +5 -0
- package/dist/tools/research.d.ts.map +1 -0
- package/dist/tools/research.js +107 -0
- package/dist/tools/research.js.map +1 -0
- package/dist/tools/search.d.ts +10 -2
- package/dist/tools/search.d.ts.map +1 -1
- package/dist/tools/search.js +13 -158
- package/dist/tools/search.js.map +1 -1
- package/dist/types.d.ts +350 -7
- package/dist/types.d.ts.map +1 -1
- package/dist/types.js +6 -1
- package/dist/types.js.map +1 -1
- package/dist/util/mode.d.ts +4 -0
- package/dist/util/mode.d.ts.map +1 -0
- package/dist/util/mode.js +34 -0
- package/dist/util/mode.js.map +1 -0
- package/package.json +78 -8
- package/dist/extraction/trafilatura.d.ts +0 -6
- package/dist/extraction/trafilatura.d.ts.map +0 -1
- package/dist/extraction/trafilatura.js +0 -105
- package/dist/extraction/trafilatura.js.map +0 -1
- package/dist/search/flashrank.d.ts +0 -12
- package/dist/search/flashrank.d.ts.map +0 -1
- package/dist/search/flashrank.js +0 -63
- package/dist/search/flashrank.js.map +0 -1
|
@@ -0,0 +1,167 @@
|
|
|
1
|
+
import { getRerankProvider } from "../providers/rerank-provider.js";
|
|
2
|
+
import { getConfig } from "../config.js";
|
|
3
|
+
import { createLogger } from "../logger.js";
|
|
4
|
+
import { parseHeadings, lineStartCharOffsets } from "../extraction/markdown.js";
|
|
5
|
+
// Logger created with the "search" label; within this module it is only used
// to emit a debug message when the rerank provider throws.
const log = createLogger("search");
|
|
6
|
+
// Longest passage text, in UTF-16 code units (String.prototype.length);
// longer blocks and snippets are cut to this length with slice().
const MAX_PASSAGE_LENGTH = 500;
|
|
7
|
+
// Trimmed blocks shorter than this many code units are rejected by shouldKeep().
const MIN_PASSAGE_LENGTH = 50;
|
|
8
|
+
// Default value of extractHighlights()'s `maxHighlights` parameter.
const DEFAULT_MAX_HIGHLIGHTS = 10;
|
|
9
|
+
/**
 * Decides whether an already-trimmed markdown block is worth offering as a
 * highlight passage.
 *
 * A block is rejected when it is shorter than MIN_PASSAGE_LENGTH, when it
 * starts with "#", "|" or "```" (the markdown markers for headings, table
 * rows and code fences), or when it starts with "- " and is at most 120
 * characters long.
 *
 * @param {string} trimmed Block text with surrounding whitespace removed.
 * @returns {boolean} true when the block should be kept as a passage.
 */
function shouldKeep(trimmed) {
  if (trimmed.length < MIN_PASSAGE_LENGTH) {
    return false;
  }
  const structuralPrefixes = ["#", "|", "```"];
  if (structuralPrefixes.some((prefix) => trimmed.startsWith(prefix))) {
    return false;
  }
  // Short "- " items are dropped; longer ones are kept.
  const isShortBullet = trimmed.startsWith("- ") && trimmed.length <= 120;
  return !isShortBullet;
}
|
|
17
|
+
/**
 * Splits markdown into blank-line-separated blocks and returns the ones that
 * pass shouldKeep(), each with its position in the original string.
 *
 * Offsets are UTF-16 code-unit indices into `markdown`, so
 * `markdown.slice(charStart, charEnd) === text` for every returned passage.
 *
 * Changes from the previous implementation:
 *  - A block separator is now any run of blank lines, where a blank line may
 *    end in "\n" or "\r\n" and may contain only spaces/tabs. Previously only
 *    consecutive "\n" characters separated blocks, so CRLF documents were
 *    treated as a single block and cut down to one passage.
 *  - Truncation to MAX_PASSAGE_LENGTH no longer cuts a surrogate pair in
 *    half; the passage is shortened by one code unit instead.
 *
 * @param {string} markdown Source text; falsy input yields an empty array.
 * @returns {{ text: string, charStart: number, charEnd: number }[]}
 *   Passages in document order.
 */
function splitIntoPassages(markdown) {
  if (!markdown) return [];
  const passages = [];
  // One line break followed by at least one line that is empty or holds only
  // spaces/tabs. Each repetition must consume a line break, so matching is linear.
  const blankLineRun = /\r?\n(?:[ \t]*\r?\n)+/g;

  const consider = (rawStart, rawEnd) => {
    const raw = markdown.slice(rawStart, rawEnd);
    const withoutLeading = raw.trimStart();
    const trimmed = withoutLeading.trimEnd();
    if (!trimmed) return;
    if (!shouldKeep(trimmed)) return;
    // Leading whitespace removed by trimStart() shifts the passage start.
    const charStart = rawStart + (raw.length - withoutLeading.length);
    let text = trimmed;
    if (text.length > MAX_PASSAGE_LENGTH) {
      let cut = MAX_PASSAGE_LENGTH;
      const lastUnit = text.charCodeAt(cut - 1);
      // A high surrogate at the cut point would be separated from its low
      // surrogate; drop it so the passage stays well-formed UTF-16.
      if (lastUnit >= 0xd800 && lastUnit <= 0xdbff) cut -= 1;
      text = text.slice(0, cut);
    }
    passages.push({ text, charStart, charEnd: charStart + text.length });
  };

  let blockStart = 0;
  for (const separator of markdown.matchAll(blankLineRun)) {
    consider(blockStart, separator.index);
    blockStart = separator.index + separator[0].length;
  }
  // The text after the last separator (or the whole input when there is none).
  consider(blockStart, markdown.length);
  return passages;
}
|
|
46
|
+
/**
 * Text-only variant of splitIntoPassages(): returns just the passage strings,
 * without their offsets. It is not part of this module's export list.
 *
 * @param {string} markdown Source text.
 * @returns {string[]} Passage texts in document order.
 */
function splitIntoPassageStrings(markdown) {
  const texts = [];
  for (const passage of splitIntoPassages(markdown)) {
    texts.push(passage.text);
  }
  return texts;
}
|
|
49
|
+
/**
 * Adds a `sectionHeading` property to every passage: the text of the last
 * heading whose start offset is at or before the passage's `charStart`, or
 * null when no heading qualifies.
 *
 * Headings come from parseHeadings() and their character offsets from
 * lineStartCharOffsets(), both applied to `markdown` split on "\n".
 *
 * NOTE(review): the scan stops at the first heading that starts after the
 * passage, which presumes parseHeadings() returns headings in document
 * order — confirm against extraction/markdown.js.
 *
 * @param {string} markdown The text the passages were taken from.
 * @param {{ text: string, charStart: number, charEnd: number }[]} passages
 * @returns {object[]} Shallow copies of the passages with `sectionHeading` set.
 */
function mapPassageHeadings(markdown, passages) {
  const lines = markdown.split("\n");
  const headings = parseHeadings(lines);
  const lineOffsets = lineStartCharOffsets(lines);
  const anchors = headings.map((heading) => {
    return { text: heading.text, charStart: lineOffsets[heading.lineIndex] };
  });

  // Walks the anchors from the top and remembers the last one that starts at
  // or before `position`.
  const headingAt = (position) => {
    let label = null;
    for (let i = 0; i < anchors.length; i++) {
      if (!(anchors[i].charStart <= position)) break;
      label = anchors[i].text;
    }
    return label;
  };

  return passages.map((passage) => ({
    ...passage,
    sectionHeading: headingAt(passage.charStart)
  }));
}
|
|
63
|
+
/**
 * Builds citations for every result and picks highlight passages across all
 * of them.
 *
 * Each result contributes one citation (1-based `index`) and zero or more
 * candidate passages taken from its `markdown_content`, or from its `snippet`
 * when the markdown is missing or empty. When the configured reranker is
 * "onnx", candidates are scored by the rerank provider and the first
 * `maxHighlights` entries of its answer become the highlights. In every other
 * case (no candidates, a different reranker setting, an empty answer, or an
 * error) the result comes from fallbackHighlights().
 *
 * Change from the previous implementation: an empty-string `markdown_content`
 * now falls through to the snippet (`||` instead of `??`). This matches
 * fallbackHighlights(), which already treats empty markdown as absent.
 *
 * @param {string} query Text the passages are ranked against.
 * @param {object[]} results Search results; `url`, `title`, `snippet`,
 *   `markdown_content` and `relevance_score` are read.
 * @param {number} [maxHighlights=DEFAULT_MAX_HIGHLIGHTS] Upper bound on the
 *   number of highlights returned.
 * @returns {Promise<{ highlights: object[], citations: object[], reranker_used: boolean }>}
 *   `reranker_used` is true only when the highlights came from the rerank provider.
 */
async function extractHighlights(query, results, maxHighlights = DEFAULT_MAX_HIGHLIGHTS) {
  const citations = [];
  const candidates = [];
  for (let i = 0; i < results.length; i++) {
    const r = results[i];
    citations.push({
      index: i + 1,
      url: r.url,
      title: r.title,
      snippet: r.snippet
    });
    // `||` rather than `??`: an empty markdown body has no passages, so use
    // the snippet instead of contributing nothing for this result.
    const source = r.markdown_content || r.snippet || "";
    const passages = splitIntoPassages(source);
    for (const p of mapPassageHeadings(source, passages)) {
      candidates.push({
        text: p.text,
        sourceIndex: i + 1,
        sourceUrl: r.url,
        sourceTitle: r.title,
        charStart: p.charStart,
        charEnd: p.charEnd,
        sectionHeading: p.sectionHeading
      });
    }
  }
  if (candidates.length === 0) {
    return {
      highlights: fallbackHighlights(results, maxHighlights),
      citations,
      reranker_used: false
    };
  }
  const cfg = getConfig();
  if (cfg.reranker === "onnx") {
    try {
      const provider = await getRerankProvider();
      // Each candidate is identified by its position in `candidates`.
      const scored = await provider.rerank(
        query,
        candidates.map((c, i) => ({ id: String(i), text: c.text }))
      );
      if (scored.length > 0) {
        const ranked = scored.slice(0, maxHighlights);
        const highlights = ranked.map((s) => {
          // An id that does not map back to a candidate makes `cand`
          // undefined; the resulting TypeError is caught below and the
          // fallback path is used.
          const cand = candidates[Number(s.id)];
          return {
            text: cand.text,
            source_index: cand.sourceIndex,
            relevance_score: s.score,
            source_url: cand.sourceUrl,
            source_title: cand.sourceTitle,
            section_heading: cand.sectionHeading,
            source_span: { start: cand.charStart, end: cand.charEnd }
          };
        });
        return { highlights, citations, reranker_used: true };
      }
    } catch (err) {
      // Best effort: a reranker failure is logged and the fallback is used.
      log.debug("rerank provider failed, using fallback passages", { error: String(err) });
    }
  }
  return { highlights: fallbackHighlights(results, maxHighlights), citations, reranker_used: false };
}
|
|
126
|
+
/**
 * Produces highlights without a reranker: at most one per result, taken in
 * the order of `results`, until `maxHighlights` have been collected.
 *
 * For each result the first passage of its `markdown_content` is used. When
 * there is no markdown or it yields no passage, the result's `snippet` is
 * used instead, with a null section heading and a span starting at 0.
 * Results with neither are skipped. `source_index` is the result's 1-based
 * position in `results`, so skipped results leave gaps in the numbering.
 *
 * @param {object[]} results Search results; `markdown_content`, `snippet`,
 *   `relevance_score`, `url` and `title` are read.
 * @param {number} maxHighlights Upper bound on the number of highlights.
 * @returns {object[]} Highlights in result order.
 */
function fallbackHighlights(results, maxHighlights) {
  const highlights = [];
  let position = 0;
  while (position < results.length && highlights.length < maxHighlights) {
    const result = results[position];
    const sourceIndex = position + 1;
    position += 1;

    // Builds one highlight for the current result; the span end is derived
    // from the text actually emitted.
    const build = (text, sectionHeading, start) => ({
      text,
      source_index: sourceIndex,
      relevance_score: result.relevance_score,
      source_url: result.url,
      source_title: result.title,
      section_heading: sectionHeading,
      source_span: { start, end: start + text.length }
    });

    const markdown = result.markdown_content ?? "";
    const firstPassage = markdown ? splitIntoPassages(markdown)[0] : undefined;
    if (firstPassage !== undefined) {
      const [annotated] = mapPassageHeadings(markdown, [firstPassage]);
      const clipped = annotated.text.slice(0, MAX_PASSAGE_LENGTH);
      highlights.push(build(clipped, annotated.sectionHeading, annotated.charStart));
      continue;
    }

    const snippet = result.snippet ?? "";
    if (snippet) {
      highlights.push(build(snippet.slice(0, MAX_PASSAGE_LENGTH), null, 0));
    }
  }
  return highlights;
}
|
|
161
|
+
export {
|
|
162
|
+
extractHighlights,
|
|
163
|
+
fallbackHighlights,
|
|
164
|
+
mapPassageHeadings,
|
|
165
|
+
splitIntoPassages
|
|
166
|
+
};
|
|
167
|
+
//# sourceMappingURL=highlights.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../src/search/highlights.ts"],"sourcesContent":["import type { SearchResultItem, Citation, Highlight } from '../types.js';\nimport { getRerankProvider } from '../providers/rerank-provider.js';\nimport { getConfig } from '../config.js';\nimport { createLogger } from '../logger.js';\nimport { parseHeadings, lineStartCharOffsets } from '../extraction/markdown.js';\n\nconst log = createLogger('search');\n\nconst MAX_PASSAGE_LENGTH = 500;\nconst MIN_PASSAGE_LENGTH = 50;\nconst DEFAULT_MAX_HIGHLIGHTS = 10;\n\nexport interface HighlightSynthesisResult {\n highlights: Highlight[];\n citations: Citation[];\n reranker_used: boolean;\n}\n\nexport interface Passage {\n text: string;\n charStart: number;\n charEnd: number;\n}\n\ninterface PassageCandidate {\n text: string;\n sourceIndex: number;\n sourceUrl: string;\n sourceTitle: string;\n charStart: number;\n charEnd: number;\n sectionHeading: string | null;\n}\n\nfunction shouldKeep(trimmed: string): boolean {\n if (trimmed.length < MIN_PASSAGE_LENGTH) return false;\n if (trimmed.startsWith('#')) return false;\n if (trimmed.startsWith('|')) return false;\n if (trimmed.startsWith('```')) return false;\n if (trimmed.startsWith('- ') && trimmed.length <= 120) return false;\n return true;\n}\n\n// Walk the source markdown block-by-block (separated by blank lines) tracking\n// char offsets so each surviving passage carries an accurate {charStart,\n// charEnd} range pointing back into the original markdown.\nexport function splitIntoPassages(markdown: string): Passage[] {\n if (!markdown) return [];\n const out: Passage[] = [];\n const re = /\\n\\n+/g;\n let blockStart = 0;\n let m: RegExpExecArray | null;\n const consider = (rawStart: number, rawEnd: number) => {\n // raw block is markdown.slice(rawStart, rawEnd); compute trimmed range.\n const raw = markdown.slice(rawStart, rawEnd);\n if (!raw) return;\n let leading = 0;\n while (leading < raw.length && /\\s/.test(raw[leading])) leading++;\n let 
trailing = raw.length;\n while (trailing > leading && /\\s/.test(raw[trailing - 1])) trailing--;\n if (trailing <= leading) return;\n const trimmedStart = rawStart + leading;\n const trimmedEnd = rawStart + trailing;\n const trimmed = markdown.slice(trimmedStart, trimmedEnd);\n if (!shouldKeep(trimmed)) return;\n const text = trimmed.length > MAX_PASSAGE_LENGTH ? trimmed.slice(0, MAX_PASSAGE_LENGTH) : trimmed;\n const charEnd = trimmedStart + text.length;\n out.push({ text, charStart: trimmedStart, charEnd });\n };\n while ((m = re.exec(markdown)) !== null) {\n consider(blockStart, m.index);\n blockStart = m.index + m[0].length;\n }\n consider(blockStart, markdown.length);\n return out;\n}\n\n// Internal helper preserved for callers that only need the text strings.\nfunction splitIntoPassageStrings(markdown: string): string[] {\n return splitIntoPassages(markdown).map((p) => p.text);\n}\n\nexport interface AnnotatedPassage extends Passage {\n sectionHeading: string | null;\n}\n\n// Annotate each passage with the nearest preceding markdown heading. Uses\n// `parseHeadings` and a char-offset prefix sum so the lookup is O(passages\n// * headings) without re-parsing markdown for every passage.\nexport function mapPassageHeadings(\n markdown: string,\n passages: Passage[],\n): AnnotatedPassage[] {\n const lines = markdown.split('\\n');\n const headings = parseHeadings(lines);\n const offsets = lineStartCharOffsets(lines);\n const headingOffsets = headings.map((h) => ({ text: h.text, charStart: offsets[h.lineIndex] }));\n return passages.map((p) => {\n let nearest: string | null = null;\n for (const h of headingOffsets) {\n if (h.charStart <= p.charStart) nearest = h.text;\n else break;\n }\n return { ...p, sectionHeading: nearest };\n });\n}\n\n// Score passages across all results and return the top N using the\n// cross-encoder rerank provider, with a graceful first-paragraph fallback\n// when reranking is disabled or fails. 
Each Highlight carries a\n// source_index suitable for citing.\nexport async function extractHighlights(\n query: string,\n results: SearchResultItem[],\n maxHighlights: number = DEFAULT_MAX_HIGHLIGHTS,\n): Promise<HighlightSynthesisResult> {\n const citations: Citation[] = [];\n const candidates: PassageCandidate[] = [];\n\n for (let i = 0; i < results.length; i++) {\n const r = results[i];\n citations.push({\n index: i + 1,\n url: r.url,\n title: r.title,\n snippet: r.snippet,\n });\n\n const source = r.markdown_content ?? r.snippet ?? '';\n const passages = splitIntoPassages(source);\n const annotated = mapPassageHeadings(source, passages);\n for (const p of annotated) {\n candidates.push({\n text: p.text,\n sourceIndex: i + 1,\n sourceUrl: r.url,\n sourceTitle: r.title,\n charStart: p.charStart,\n charEnd: p.charEnd,\n sectionHeading: p.sectionHeading,\n });\n }\n }\n\n if (candidates.length === 0) {\n return {\n highlights: fallbackHighlights(results, maxHighlights),\n citations,\n reranker_used: false,\n };\n }\n\n const cfg = getConfig();\n if (cfg.reranker === 'onnx') {\n try {\n const provider = await getRerankProvider();\n const scored = await provider.rerank(\n query,\n candidates.map((c, i) => ({ id: String(i), text: c.text })),\n );\n if (scored.length > 0) {\n const ranked = scored.slice(0, maxHighlights);\n const highlights = ranked.map<Highlight>((s) => {\n const cand = candidates[Number(s.id)];\n return {\n text: cand.text,\n source_index: cand.sourceIndex,\n relevance_score: s.score,\n source_url: cand.sourceUrl,\n source_title: cand.sourceTitle,\n section_heading: cand.sectionHeading,\n source_span: { start: cand.charStart, end: cand.charEnd },\n };\n });\n return { highlights, citations, reranker_used: true };\n }\n } catch (err) {\n log.debug('rerank provider failed, using fallback passages', { error: String(err) });\n }\n }\n\n return { highlights: fallbackHighlights(results, maxHighlights), citations, reranker_used: false };\n}\n\n// Fallback 
when the cross-encoder reranker is unavailable: take the first substantive paragraph\n// from each source (ordered by engine relevance). Preserves citation indices\n// so host LLMs can still cite [N] correctly.\nexport function fallbackHighlights(\n results: SearchResultItem[],\n maxHighlights: number,\n): Highlight[] {\n const out: Highlight[] = [];\n for (let i = 0; i < results.length && out.length < maxHighlights; i++) {\n const r = results[i];\n const source = r.markdown_content ?? '';\n const passages = source ? splitIntoPassages(source) : [];\n if (passages.length > 0) {\n const annotated = mapPassageHeadings(source, [passages[0]])[0];\n const text = annotated.text.slice(0, MAX_PASSAGE_LENGTH);\n out.push({\n text,\n source_index: i + 1,\n relevance_score: r.relevance_score,\n source_url: r.url,\n source_title: r.title,\n section_heading: annotated.sectionHeading,\n source_span: { start: annotated.charStart, end: annotated.charStart + text.length },\n });\n continue;\n }\n const snippet = r.snippet ?? 
'';\n if (!snippet) continue;\n const text = snippet.slice(0, MAX_PASSAGE_LENGTH);\n out.push({\n text,\n source_index: i + 1,\n relevance_score: r.relevance_score,\n source_url: r.url,\n source_title: r.title,\n section_heading: null,\n source_span: { start: 0, end: text.length },\n });\n }\n return out;\n}\n"],"mappings":"AACA,SAAS,yBAAyB;AAClC,SAAS,iBAAiB;AAC1B,SAAS,oBAAoB;AAC7B,SAAS,eAAe,4BAA4B;AAEpD,MAAM,MAAM,aAAa,QAAQ;AAEjC,MAAM,qBAAqB;AAC3B,MAAM,qBAAqB;AAC3B,MAAM,yBAAyB;AAwB/B,SAAS,WAAW,SAA0B;AAC5C,MAAI,QAAQ,SAAS,mBAAoB,QAAO;AAChD,MAAI,QAAQ,WAAW,GAAG,EAAG,QAAO;AACpC,MAAI,QAAQ,WAAW,GAAG,EAAG,QAAO;AACpC,MAAI,QAAQ,WAAW,KAAK,EAAG,QAAO;AACtC,MAAI,QAAQ,WAAW,IAAI,KAAK,QAAQ,UAAU,IAAK,QAAO;AAC9D,SAAO;AACT;AAKO,SAAS,kBAAkB,UAA6B;AAC7D,MAAI,CAAC,SAAU,QAAO,CAAC;AACvB,QAAM,MAAiB,CAAC;AACxB,QAAM,KAAK;AACX,MAAI,aAAa;AACjB,MAAI;AACJ,QAAM,WAAW,CAAC,UAAkB,WAAmB;AAErD,UAAM,MAAM,SAAS,MAAM,UAAU,MAAM;AAC3C,QAAI,CAAC,IAAK;AACV,QAAI,UAAU;AACd,WAAO,UAAU,IAAI,UAAU,KAAK,KAAK,IAAI,OAAO,CAAC,EAAG;AACxD,QAAI,WAAW,IAAI;AACnB,WAAO,WAAW,WAAW,KAAK,KAAK,IAAI,WAAW,CAAC,CAAC,EAAG;AAC3D,QAAI,YAAY,QAAS;AACzB,UAAM,eAAe,WAAW;AAChC,UAAM,aAAa,WAAW;AAC9B,UAAM,UAAU,SAAS,MAAM,cAAc,UAAU;AACvD,QAAI,CAAC,WAAW,OAAO,EAAG;AAC1B,UAAM,OAAO,QAAQ,SAAS,qBAAqB,QAAQ,MAAM,GAAG,kBAAkB,IAAI;AAC1F,UAAM,UAAU,eAAe,KAAK;AACpC,QAAI,KAAK,EAAE,MAAM,WAAW,cAAc,QAAQ,CAAC;AAAA,EACrD;AACA,UAAQ,IAAI,GAAG,KAAK,QAAQ,OAAO,MAAM;AACvC,aAAS,YAAY,EAAE,KAAK;AAC5B,iBAAa,EAAE,QAAQ,EAAE,CAAC,EAAE;AAAA,EAC9B;AACA,WAAS,YAAY,SAAS,MAAM;AACpC,SAAO;AACT;AAGA,SAAS,wBAAwB,UAA4B;AAC3D,SAAO,kBAAkB,QAAQ,EAAE,IAAI,CAAC,MAAM,EAAE,IAAI;AACtD;AASO,SAAS,mBACd,UACA,UACoB;AACpB,QAAM,QAAQ,SAAS,MAAM,IAAI;AACjC,QAAM,WAAW,cAAc,KAAK;AACpC,QAAM,UAAU,qBAAqB,KAAK;AAC1C,QAAM,iBAAiB,SAAS,IAAI,CAAC,OAAO,EAAE,MAAM,EAAE,MAAM,WAAW,QAAQ,EAAE,SAAS,EAAE,EAAE;AAC9F,SAAO,SAAS,IAAI,CAAC,MAAM;AACzB,QAAI,UAAyB;AAC7B,eAAW,KAAK,gBAAgB;AAC9B,UAAI,EAAE,aAAa,EAAE,UAAW,WAAU,EAAE;AAAA,UACvC;AAAA,IACP;AACA,WAAO,EAAE,GAAG,GAAG,gBAAgB,QAAQ;AAAA,EACzC,CAAC;AACH;AAMA,eAAsB,kBACpB,OACA,SACA,gBAA
wB,wBACW;AACnC,QAAM,YAAwB,CAAC;AAC/B,QAAM,aAAiC,CAAC;AAExC,WAAS,IAAI,GAAG,IAAI,QAAQ,QAAQ,KAAK;AACvC,UAAM,IAAI,QAAQ,CAAC;AACnB,cAAU,KAAK;AAAA,MACb,OAAO,IAAI;AAAA,MACX,KAAK,EAAE;AAAA,MACP,OAAO,EAAE;AAAA,MACT,SAAS,EAAE;AAAA,IACb,CAAC;AAED,UAAM,SAAS,EAAE,oBAAoB,EAAE,WAAW;AAClD,UAAM,WAAW,kBAAkB,MAAM;AACzC,UAAM,YAAY,mBAAmB,QAAQ,QAAQ;AACrD,eAAW,KAAK,WAAW;AACzB,iBAAW,KAAK;AAAA,QACd,MAAM,EAAE;AAAA,QACR,aAAa,IAAI;AAAA,QACjB,WAAW,EAAE;AAAA,QACb,aAAa,EAAE;AAAA,QACf,WAAW,EAAE;AAAA,QACb,SAAS,EAAE;AAAA,QACX,gBAAgB,EAAE;AAAA,MACpB,CAAC;AAAA,IACH;AAAA,EACF;AAEA,MAAI,WAAW,WAAW,GAAG;AAC3B,WAAO;AAAA,MACL,YAAY,mBAAmB,SAAS,aAAa;AAAA,MACrD;AAAA,MACA,eAAe;AAAA,IACjB;AAAA,EACF;AAEA,QAAM,MAAM,UAAU;AACtB,MAAI,IAAI,aAAa,QAAQ;AAC3B,QAAI;AACF,YAAM,WAAW,MAAM,kBAAkB;AACzC,YAAM,SAAS,MAAM,SAAS;AAAA,QAC5B;AAAA,QACA,WAAW,IAAI,CAAC,GAAG,OAAO,EAAE,IAAI,OAAO,CAAC,GAAG,MAAM,EAAE,KAAK,EAAE;AAAA,MAC5D;AACA,UAAI,OAAO,SAAS,GAAG;AACrB,cAAM,SAAS,OAAO,MAAM,GAAG,aAAa;AAC5C,cAAM,aAAa,OAAO,IAAe,CAAC,MAAM;AAC9C,gBAAM,OAAO,WAAW,OAAO,EAAE,EAAE,CAAC;AACpC,iBAAO;AAAA,YACL,MAAM,KAAK;AAAA,YACX,cAAc,KAAK;AAAA,YACnB,iBAAiB,EAAE;AAAA,YACnB,YAAY,KAAK;AAAA,YACjB,cAAc,KAAK;AAAA,YACnB,iBAAiB,KAAK;AAAA,YACtB,aAAa,EAAE,OAAO,KAAK,WAAW,KAAK,KAAK,QAAQ;AAAA,UAC1D;AAAA,QACF,CAAC;AACD,eAAO,EAAE,YAAY,WAAW,eAAe,KAAK;AAAA,MACtD;AAAA,IACF,SAAS,KAAK;AACZ,UAAI,MAAM,mDAAmD,EAAE,OAAO,OAAO,GAAG,EAAE,CAAC;AAAA,IACrF;AAAA,EACF;AAEA,SAAO,EAAE,YAAY,mBAAmB,SAAS,aAAa,GAAG,WAAW,eAAe,MAAM;AACnG;AAKO,SAAS,mBACd,SACA,eACa;AACb,QAAM,MAAmB,CAAC;AAC1B,WAAS,IAAI,GAAG,IAAI,QAAQ,UAAU,IAAI,SAAS,eAAe,KAAK;AACrE,UAAM,IAAI,QAAQ,CAAC;AACnB,UAAM,SAAS,EAAE,oBAAoB;AACrC,UAAM,WAAW,SAAS,kBAAkB,MAAM,IAAI,CAAC;AACvD,QAAI,SAAS,SAAS,GAAG;AACvB,YAAM,YAAY,mBAAmB,QAAQ,CAAC,SAAS,CAAC,CAAC,CAAC,EAAE,CAAC;AAC7D,YAAMA,QAAO,UAAU,KAAK,MAAM,GAAG,kBAAkB;AACvD,UAAI,KAAK;AAAA,QACP,MAAAA;AAAA,QACA,cAAc,IAAI;AAAA,QAClB,iBAAiB,EAAE;AAAA,QACnB,YAAY,EAAE;AAAA,QACd,cAAc,EAAE;AAAA,QAChB,iBAAiB,UAAU;AAAA,QAC3B,aAAa,EAAE,OAAO,UAAU,WAAW,KAAK,UAAU,YAAYA,MAAK,OAAO;AAAA,MACpF,CAAC;AACD;AAAA,IACF;AACA
,UAAM,UAAU,EAAE,WAAW;AAC7B,QAAI,CAAC,QAAS;AACd,UAAM,OAAO,QAAQ,MAAM,GAAG,kBAAkB;AAChD,QAAI,KAAK;AAAA,MACP;AAAA,MACA,cAAc,IAAI;AAAA,MAClB,iBAAiB,EAAE;AAAA,MACnB,YAAY,EAAE;AAAA,MACd,cAAc,EAAE;AAAA,MAChB,iBAAiB;AAAA,MACjB,aAAa,EAAE,OAAO,GAAG,KAAK,KAAK,OAAO;AAAA,IAC5C,CAAC;AAAA,EACH;AACA,SAAO;AACT;","names":["text"]}
|
|
@@ -0,0 +1,29 @@
|
|
|
1
|
+
/**
 * Search-result shape used as the default element type of `DiscardedResult`
 * and `FilterResult`. `url`, `title`, `snippet` and `engine` are required
 * strings; the index signature admits any further properties as `unknown`.
 */
export interface RawSearchResult {
|
|
2
|
+
url: string;
|
|
3
|
+
title: string;
|
|
4
|
+
snippet: string;
|
|
5
|
+
engine: string;
|
|
6
|
+
[k: string]: unknown;
|
|
7
|
+
}
|
|
8
|
+
/**
 * A result that `filterByLanguage` removed, together with why it was removed:
 * - `'invalid_url'`: the URL did not parse or was not http/https.
 * - `'language_mismatch'`: this single result was detected as non-target.
 * - `'engine_batch_dropped'`: the whole batch from its engine was dropped.
 */
export interface DiscardedResult<T extends RawLike = RawSearchResult> {
|
|
9
|
+
result: T;
|
|
10
|
+
reason: 'invalid_url' | 'language_mismatch' | 'engine_batch_dropped';
|
|
11
|
+
}
|
|
12
|
+
/**
 * Options for `filterByLanguage`.
 * - `target`: ISO-639 language code the results should be in, e.g. 'en'.
 * - `dropThreshold`: fraction of an engine's batch that may be non-target
 *   before the whole batch is dropped, e.g. 0.4. The implementation drops
 *   only when the fraction is strictly greater than this value.
 */
export interface FilterOptions {
|
|
13
|
+
target: string;
|
|
14
|
+
dropThreshold: number;
|
|
15
|
+
}
|
|
16
|
+
/**
 * Outcome of `filterByLanguage`.
 * - `results`: the results that were kept.
 * - `discarded`: every removed result with its removal reason.
 * - `warnings`: one message for each engine batch that was dropped.
 */
export interface FilterResult<T extends RawLike = RawSearchResult> {
|
|
17
|
+
results: T[];
|
|
18
|
+
discarded: DiscardedResult<T>[];
|
|
19
|
+
warnings: string[];
|
|
20
|
+
}
|
|
21
|
+
/**
 * Minimal structural constraint on filterable results: four required string
 * fields. Not exported; it only bounds the generic parameters in this file.
 */
interface RawLike {
|
|
22
|
+
url: string;
|
|
23
|
+
title: string;
|
|
24
|
+
snippet: string;
|
|
25
|
+
engine: string;
|
|
26
|
+
}
|
|
27
|
+
/**
 * Filters search results by URL validity and detected language.
 *
 * @param results Results to filter; each needs `url`, `title`, `snippet`, `engine`.
 * @param opts Target language code and per-engine drop threshold.
 * @returns The kept results, the discarded results with reasons, and warnings.
 */
export declare function filterByLanguage<T extends RawLike>(results: T[], opts: FilterOptions): FilterResult<T>;
|
|
28
|
+
export {};
|
|
29
|
+
//# sourceMappingURL=language-filter.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"language-filter.d.ts","sourceRoot":"","sources":["../../src/search/language-filter.ts"],"names":[],"mappings":"AAgBA,MAAM,WAAW,eAAe;IAC9B,GAAG,EAAE,MAAM,CAAC;IACZ,KAAK,EAAE,MAAM,CAAC;IACd,OAAO,EAAE,MAAM,CAAC;IAChB,MAAM,EAAE,MAAM,CAAC;IACf,CAAC,CAAC,EAAE,MAAM,GAAG,OAAO,CAAC;CACtB;AAED,MAAM,WAAW,eAAe,CAAC,CAAC,SAAS,OAAO,GAAG,eAAe;IAClE,MAAM,EAAE,CAAC,CAAC;IACV,MAAM,EAAE,aAAa,GAAG,mBAAmB,GAAG,sBAAsB,CAAC;CACtE;AAED,MAAM,WAAW,aAAa;IAC5B,MAAM,EAAE,MAAM,CAAC;IACf,aAAa,EAAE,MAAM,CAAC;CACvB;AAED,MAAM,WAAW,YAAY,CAAC,CAAC,SAAS,OAAO,GAAG,eAAe;IAC/D,OAAO,EAAE,CAAC,EAAE,CAAC;IACb,SAAS,EAAE,eAAe,CAAC,CAAC,CAAC,EAAE,CAAC;IAChC,QAAQ,EAAE,MAAM,EAAE,CAAC;CACpB;AAED,UAAU,OAAO;IACf,GAAG,EAAE,MAAM,CAAC;IACZ,KAAK,EAAE,MAAM,CAAC;IACd,OAAO,EAAE,MAAM,CAAC;IAChB,MAAM,EAAE,MAAM,CAAC;CAChB;AAwBD,wBAAgB,gBAAgB,CAAC,CAAC,SAAS,OAAO,EAChD,OAAO,EAAE,CAAC,EAAE,EACZ,IAAI,EAAE,aAAa,GAClB,YAAY,CAAC,CAAC,CAAC,CA6DjB"}
|
|
@@ -0,0 +1,126 @@
|
|
|
1
|
+
import { detectAll } from "tinyld";
|
|
2
|
+
import { createLogger } from "../logger.js";
|
|
3
|
+
/** Trimmed text shorter than this many characters is never language-detected. */
const MIN_DETECT_CHARS = 12;

/** A top detection whose `accuracy` is below this value counts as undetermined. */
const MIN_CONFIDENCE = 0.1;

// Languages that use Latin script. Used to avoid false positives when the
// target language is itself Latin-script.
const LATIN_LANGS = /* @__PURE__ */ new Set([
  "en", "es", "fr", "pt", "de", "it", "nl", "da", "sv", "no", "fi", "is",
  "pl", "cs", "sk", "hu", "ro", "hr", "sl", "lt", "lv", "et", "tr", "vi",
  "id", "ms", "tl", "sw", "af", "ca", "gl", "eu", "ga", "cy", "mt", "sq",
  "lb", "fo", "ber", "so", "ha", "yo", "ig", "zu", "xh", "st", "tn"
]);
|
|
54
|
+
// Module-level logger created with the name "language-filter"; used below to
// warn when an engine's whole batch is dropped.
const log = createLogger("language-filter");
|
|
55
|
+
/**
 * Reports whether `u` parses as an absolute URL whose scheme is http or https.
 * Anything the `URL` constructor rejects is treated as invalid.
 */
function isValidUrl(u) {
  let protocol;
  try {
    ({ protocol } = new URL(u));
  } catch {
    // Unparseable input is simply not a valid URL.
    return false;
  }
  return protocol === "https:" || protocol === "http:";
}
|
|
63
|
+
/**
 * Best-effort language guess for `text`.
 *
 * Returns the `lang` of the first entry produced by `detectAll`, or "und"
 * (undetermined) when the trimmed text is shorter than MIN_DETECT_CHARS,
 * when there is no first entry, when its `accuracy` is below MIN_CONFIDENCE,
 * when its `lang` is empty, or when detection throws.
 */
function detectLang(text) {
  const trimmed = text?.trim() ?? "";
  if (trimmed.length >= MIN_DETECT_CHARS) {
    try {
      const best = detectAll(trimmed)[0];
      if (best && !(best.accuracy < MIN_CONFIDENCE)) {
        return best.lang || "und";
      }
    } catch {
      // Detection failure is not fatal; fall through to "und".
    }
  }
  return "und";
}
|
|
75
|
+
/**
 * Filters search results by URL validity and detected language.
 *
 * Processing order:
 *  1. Results whose URL is not a parseable http/https URL are discarded
 *     with reason "invalid_url".
 *  2. Remaining results are grouped by `engine`. For each group the language
 *     of "title + snippet" is detected; if the fraction of mismatching
 *     results is strictly greater than `opts.dropThreshold`, the whole group
 *     is discarded ("engine_batch_dropped") and a warning is recorded.
 *  3. Otherwise only the individual mismatching results are discarded
 *     ("language_mismatch") and the rest are kept.
 *
 * Kept results come out grouped by engine, in the order each engine first
 * appeared in the input, not in the original interleaved order.
 *
 * @param results Results to filter; each needs `url`, `title`, `snippet`, `engine`.
 * @param opts `target` language code and `dropThreshold` fraction.
 * @returns `{ results, discarded, warnings }`.
 */
function filterByLanguage(results, opts) {
  const discarded = [];
  const warnings = [];

  // Step 1: drop invalid URLs first.
  const urlValid = [];
  for (const r of results) {
    if (!isValidUrl(r.url)) {
      discarded.push({ result: r, reason: "invalid_url" });
      continue;
    }
    urlValid.push(r);
  }
  if (urlValid.length === 0) return { results: [], discarded, warnings };

  // Step 2: group by engine so each engine's batch is judged on its own.
  const byEngine = /* @__PURE__ */ new Map();
  for (const r of urlValid) {
    const arr = byEngine.get(r.engine) ?? [];
    arr.push(r);
    byEngine.set(r.engine, arr);
  }

  const targetIsLatin = LATIN_LANGS.has(opts.target);
  const isMismatch = (lang) => {
    // Exact match and undetermined text are never counted against a result.
    if (lang === opts.target || lang === "und") return false;
    // Script-aware: a Latin-script target vs. a Latin-script detection is
    // treated as a match, because short Latin-script text is easily
    // misclassified into another Latin-script language.
    if (targetIsLatin && LATIN_LANGS.has(lang)) return false;
    return true;
  };

  const kept = [];
  for (const [engine, batch] of byEngine) {
    let nonTarget = 0;
    // Coalesce missing fields to "" so an absent title/snippet is not
    // stringified to the literal word "undefined" and then language-detected.
    const langs = batch.map((r) => detectLang(`${r.title ?? ""} ${r.snippet ?? ""}`));
    for (const l of langs) if (isMismatch(l)) nonTarget += 1;
    // batch is never empty here: a group only exists once a result was pushed.
    const ratio = nonTarget / batch.length;

    if (ratio > opts.dropThreshold) {
      warnings.push(
        `engine_language_mismatch: ${engine} returned ${Math.round(ratio * 100)}% non-${opts.target}; batch dropped`
      );
      for (const r of batch) discarded.push({ result: r, reason: "engine_batch_dropped" });
      log.warn("dropped engine batch for language mismatch", { engine, ratio });
      continue;
    }

    // Drop individual non-target results inside an otherwise-fine batch.
    for (let i = 0; i < batch.length; i += 1) {
      if (isMismatch(langs[i])) {
        discarded.push({ result: batch[i], reason: "language_mismatch" });
      } else {
        kept.push(batch[i]);
      }
    }
  }

  return { results: kept, discarded, warnings };
}
|
|
123
|
+
export {
|
|
124
|
+
filterByLanguage
|
|
125
|
+
};
|
|
126
|
+
//# sourceMappingURL=language-filter.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../src/search/language-filter.ts"],"sourcesContent":["import { detectAll } from 'tinyld';\nimport { createLogger } from '../logger.js';\n\nconst MIN_DETECT_CHARS = 12;\nconst MIN_CONFIDENCE = 0.1;\n\n// Languages that use Latin script — used to avoid false positives when target is Latin.\nconst LATIN_LANGS = new Set([\n 'en', 'es', 'fr', 'pt', 'de', 'it', 'nl', 'da', 'sv', 'no', 'fi', 'is',\n 'pl', 'cs', 'sk', 'hu', 'ro', 'hr', 'sl', 'lt', 'lv', 'et', 'tr', 'vi',\n 'id', 'ms', 'tl', 'sw', 'af', 'ca', 'gl', 'eu', 'ga', 'cy', 'mt', 'sq',\n 'lb', 'fo', 'ber', 'so', 'ha', 'yo', 'ig', 'zu', 'xh', 'st', 'tn',\n]);\n\nconst log = createLogger('language-filter');\n\nexport interface RawSearchResult {\n url: string;\n title: string;\n snippet: string;\n engine: string;\n [k: string]: unknown;\n}\n\nexport interface DiscardedResult<T extends RawLike = RawSearchResult> {\n result: T;\n reason: 'invalid_url' | 'language_mismatch' | 'engine_batch_dropped';\n}\n\nexport interface FilterOptions {\n target: string; // ISO-639 code, e.g. 'en'\n dropThreshold: number; // fraction of batch non-target before drop, e.g. 0.4\n}\n\nexport interface FilterResult<T extends RawLike = RawSearchResult> {\n results: T[];\n discarded: DiscardedResult<T>[];\n warnings: string[];\n}\n\ninterface RawLike {\n url: string;\n title: string;\n snippet: string;\n engine: string;\n}\n\nfunction isValidUrl(u: string): boolean {\n try {\n const parsed = new URL(u);\n return parsed.protocol === 'http:' || parsed.protocol === 'https:';\n } catch {\n return false;\n }\n}\n\nfunction detectLang(text: string): string {\n const t = text?.trim() ?? 
'';\n if (t.length < MIN_DETECT_CHARS) return 'und';\n try {\n const ranked = detectAll(t);\n const top = ranked[0];\n if (!top || top.accuracy < MIN_CONFIDENCE) return 'und';\n return top.lang || 'und';\n } catch {\n return 'und';\n }\n}\n\nexport function filterByLanguage<T extends RawLike>(\n results: T[],\n opts: FilterOptions,\n): FilterResult<T> {\n const discarded: DiscardedResult<T>[] = [];\n const warnings: string[] = [];\n\n // Step 1: drop invalid URLs first\n const urlValid: T[] = [];\n for (const r of results) {\n if (!isValidUrl(r.url)) {\n discarded.push({ result: r, reason: 'invalid_url' });\n continue;\n }\n urlValid.push(r);\n }\n\n if (urlValid.length === 0) return { results: [], discarded, warnings };\n\n // Step 2: per-engine batch language check\n const byEngine = new Map<string, T[]>();\n for (const r of urlValid) {\n const arr = byEngine.get(r.engine) ?? [];\n arr.push(r);\n byEngine.set(r.engine, arr);\n }\n\n const targetIsLatin = LATIN_LANGS.has(opts.target);\n const isMismatch = (lang: string): boolean => {\n if (lang === opts.target || lang === 'und') return false;\n // Script-aware: Latin-target vs Latin-detected is treated as a match\n // because tinyld misclassifies short Latin-script text into other Latin\n // languages with low confidence.\n if (targetIsLatin && LATIN_LANGS.has(lang)) return false;\n return true;\n };\n\n const kept: T[] = [];\n for (const [engine, batch] of byEngine) {\n let nonTarget = 0;\n const langs = batch.map(r => detectLang(`${r.title} ${r.snippet}`));\n for (const l of langs) if (isMismatch(l)) nonTarget += 1;\n const ratio = nonTarget / batch.length;\n\n if (ratio > opts.dropThreshold) {\n warnings.push(\n `engine_language_mismatch: ${engine} returned ${Math.round(ratio * 100)}% non-${opts.target}; batch dropped`,\n );\n for (const r of batch) discarded.push({ result: r, reason: 'engine_batch_dropped' });\n log.warn('dropped engine batch for language mismatch', { engine, ratio });\n continue;\n }\n\n // 
Drop individual non-target results inside an otherwise-fine batch\n for (let i = 0; i < batch.length; i += 1) {\n if (isMismatch(langs[i])) {\n discarded.push({ result: batch[i], reason: 'language_mismatch' });\n } else {\n kept.push(batch[i]);\n }\n }\n }\n\n return { results: kept, discarded, warnings };\n}\n"],"mappings":"AAAA,SAAS,iBAAiB;AAC1B,SAAS,oBAAoB;AAE7B,MAAM,mBAAmB;AACzB,MAAM,iBAAiB;AAGvB,MAAM,cAAc,oBAAI,IAAI;AAAA,EAC1B;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAClE;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAClE;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAClE;AAAA,EAAM;AAAA,EAAM;AAAA,EAAO;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAAA,EAAM;AAC/D,CAAC;AAED,MAAM,MAAM,aAAa,iBAAiB;AAiC1C,SAAS,WAAW,GAAoB;AACtC,MAAI;AACF,UAAM,SAAS,IAAI,IAAI,CAAC;AACxB,WAAO,OAAO,aAAa,WAAW,OAAO,aAAa;AAAA,EAC5D,QAAQ;AACN,WAAO;AAAA,EACT;AACF;AAEA,SAAS,WAAW,MAAsB;AACxC,QAAM,IAAI,MAAM,KAAK,KAAK;AAC1B,MAAI,EAAE,SAAS,iBAAkB,QAAO;AACxC,MAAI;AACF,UAAM,SAAS,UAAU,CAAC;AAC1B,UAAM,MAAM,OAAO,CAAC;AACpB,QAAI,CAAC,OAAO,IAAI,WAAW,eAAgB,QAAO;AAClD,WAAO,IAAI,QAAQ;AAAA,EACrB,QAAQ;AACN,WAAO;AAAA,EACT;AACF;AAEO,SAAS,iBACd,SACA,MACiB;AACjB,QAAM,YAAkC,CAAC;AACzC,QAAM,WAAqB,CAAC;AAG5B,QAAM,WAAgB,CAAC;AACvB,aAAW,KAAK,SAAS;AACvB,QAAI,CAAC,WAAW,EAAE,GAAG,GAAG;AACtB,gBAAU,KAAK,EAAE,QAAQ,GAAG,QAAQ,cAAc,CAAC;AACnD;AAAA,IACF;AACA,aAAS,KAAK,CAAC;AAAA,EACjB;AAEA,MAAI,SAAS,WAAW,EAAG,QAAO,EAAE,SAAS,CAAC,GAAG,WAAW,SAAS;AAGrE,QAAM,WAAW,oBAAI,IAAiB;AACtC,aAAW,KAAK,UAAU;AACxB,UAAM,MAAM,SAAS,IAAI,EAAE,MAAM,KAAK,CAAC;AACvC,QAAI,KAAK,CAAC;AACV,aAAS,IAAI,EAAE,QAAQ,GAAG;AAAA,EAC5B;AAEA,QAAM,gBAAgB,YAAY,IAAI,KAAK,MAAM;AACjD,QAAM,aAAa,CAAC,SAA0B;AAC5C,QAAI,SAAS,KAAK,UAAU,SAAS,MAAO,QAAO;AAInD,QAAI,iBAAiB,YAAY,IAAI,IAAI,EAAG,QAAO;AACnD,WAAO;AAAA,EACT;AAEA,QAAM,OAAY,CAAC;AACnB,aAAW,CAAC,QAAQ,
KAAK,KAAK,UAAU;AACtC,QAAI,YAAY;AAChB,UAAM,QAAQ,MAAM,IAAI,OAAK,WAAW,GAAG,EAAE,KAAK,IAAI,EAAE,OAAO,EAAE,CAAC;AAClE,eAAW,KAAK,MAAO,KAAI,WAAW,CAAC,EAAG,cAAa;AACvD,UAAM,QAAQ,YAAY,MAAM;AAEhC,QAAI,QAAQ,KAAK,eAAe;AAC9B,eAAS;AAAA,QACP,6BAA6B,MAAM,aAAa,KAAK,MAAM,QAAQ,GAAG,CAAC,SAAS,KAAK,MAAM;AAAA,MAC7F;AACA,iBAAW,KAAK,MAAO,WAAU,KAAK,EAAE,QAAQ,GAAG,QAAQ,uBAAuB,CAAC;AACnF,UAAI,KAAK,8CAA8C,EAAE,QAAQ,MAAM,CAAC;AACxE;AAAA,IACF;AAGA,aAAS,IAAI,GAAG,IAAI,MAAM,QAAQ,KAAK,GAAG;AACxC,UAAI,WAAW,MAAM,CAAC,CAAC,GAAG;AACxB,kBAAU,KAAK,EAAE,QAAQ,MAAM,CAAC,GAAG,QAAQ,oBAAoB,CAAC;AAAA,MAClE,OAAO;AACL,aAAK,KAAK,MAAM,CAAC,CAAC;AAAA,MACpB;AAAA,IACF;AAAA,EACF;AAEA,SAAO,EAAE,SAAS,MAAM,WAAW,SAAS;AAC9C;","names":[]}
|
|
@@ -0,0 +1,4 @@
|
|
|
1
|
+
import type { SearchInput, SearchOutput, StageResult } from '../../types.js';
|
|
2
|
+
import type { SearchContext } from '../../providers/search-provider.js';
|
|
3
|
+
/**
 * Runs a search for `input` using `ctx` and resolves to a
 * `StageResult<SearchOutput>`.
 *
 * NOTE(review): the implementation is not visible from this declaration;
 * judging by the file path (search/legacy/searxng-orchestrator) this is
 * presumably the legacy SearXNG-backed search path — confirm before relying on it.
 */
export declare function runSearxngSearch(input: SearchInput, ctx: SearchContext): Promise<StageResult<SearchOutput>>;
|
|
4
|
+
//# sourceMappingURL=searxng-orchestrator.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"searxng-orchestrator.d.ts","sourceRoot":"","sources":["../../../src/search/legacy/searxng-orchestrator.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EACV,WAAW,EACX,YAAY,EAGZ,WAAW,EACZ,MAAM,gBAAgB,CAAC;AAExB,OAAO,KAAK,EAAE,aAAa,EAAE,MAAM,oCAAoC,CAAC;AA0BxE,wBAAsB,gBAAgB,CACpC,KAAK,EAAE,WAAW,EAClB,GAAG,EAAE,aAAa,GACjB,OAAO,CAAC,WAAW,CAAC,YAAY,CAAC,CAAC,CAqdpC"}
|