@staticn0va/wigolo 0.1.0 → 0.1.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +1 -1
- package/README.md +146 -227
- package/SKILL.md +382 -0
- package/assets/blocks/claude-code/CLAUDE.md.block +20 -0
- package/assets/blocks/claude-code/wigolo-command.md +40 -0
- package/assets/blocks/cursor/wigolo.mdc +46 -0
- package/assets/blocks/gemini-cli/GEMINI.md.block +18 -0
- package/assets/blocks/vscode/copilot-instructions.md.block +18 -0
- package/assets/skills/wigolo/SKILL.md +50 -0
- package/assets/skills/wigolo/rules/cache-first.md +30 -0
- package/assets/skills/wigolo/rules/synthesis.md +43 -0
- package/assets/skills/wigolo-agent/SKILL.md +73 -0
- package/assets/skills/wigolo-crawl/SKILL.md +60 -0
- package/assets/skills/wigolo-extract/SKILL.md +59 -0
- package/assets/skills/wigolo-fetch/SKILL.md +65 -0
- package/assets/skills/wigolo-find-similar/SKILL.md +72 -0
- package/assets/skills/wigolo-research/SKILL.md +77 -0
- package/assets/skills/wigolo-search/SKILL.md +78 -0
- package/dist/agent/executor.d.ts +33 -0
- package/dist/agent/executor.d.ts.map +1 -0
- package/dist/agent/executor.js +233 -0
- package/dist/agent/executor.js.map +1 -0
- package/dist/agent/pipeline.d.ts +5 -0
- package/dist/agent/pipeline.d.ts.map +1 -0
- package/dist/agent/pipeline.js +238 -0
- package/dist/agent/pipeline.js.map +1 -0
- package/dist/agent/planner.d.ts +13 -0
- package/dist/agent/planner.d.ts.map +1 -0
- package/dist/agent/planner.js +271 -0
- package/dist/agent/planner.js.map +1 -0
- package/dist/agent/relevance.d.ts +15 -0
- package/dist/agent/relevance.d.ts.map +1 -0
- package/dist/agent/relevance.js +60 -0
- package/dist/agent/relevance.js.map +1 -0
- package/dist/cache/backfill-embeddings.d.ts +23 -0
- package/dist/cache/backfill-embeddings.d.ts.map +1 -0
- package/dist/cache/backfill-embeddings.js +105 -0
- package/dist/cache/backfill-embeddings.js.map +1 -0
- package/dist/cache/change-detector.d.ts +7 -0
- package/dist/cache/change-detector.d.ts.map +1 -0
- package/dist/cache/change-detector.js +43 -0
- package/dist/cache/change-detector.js.map +1 -0
- package/dist/cache/db.d.ts +1 -0
- package/dist/cache/db.d.ts.map +1 -1
- package/dist/cache/db.js +94 -22
- package/dist/cache/db.js.map +1 -1
- package/dist/cache/diff-summary.d.ts +2 -0
- package/dist/cache/diff-summary.d.ts.map +1 -0
- package/dist/cache/diff-summary.js +82 -0
- package/dist/cache/diff-summary.js.map +1 -0
- package/dist/cache/migrations/runner.d.ts +29 -0
- package/dist/cache/migrations/runner.d.ts.map +1 -0
- package/dist/cache/migrations/runner.js +147 -0
- package/dist/cache/migrations/runner.js.map +1 -0
- package/dist/cache/sqlite-vec-store.d.ts +42 -0
- package/dist/cache/sqlite-vec-store.d.ts.map +1 -0
- package/dist/cache/sqlite-vec-store.js +176 -0
- package/dist/cache/sqlite-vec-store.js.map +1 -0
- package/dist/cache/store.d.ts +47 -1
- package/dist/cache/store.d.ts.map +1 -1
- package/dist/cache/store.js +364 -168
- package/dist/cache/store.js.map +1 -1
- package/dist/cli/agents/antigravity.d.ts +20 -0
- package/dist/cli/agents/antigravity.d.ts.map +1 -0
- package/dist/cli/agents/antigravity.js +49 -0
- package/dist/cli/agents/antigravity.js.map +1 -0
- package/dist/cli/agents/claude-code.d.ts +25 -0
- package/dist/cli/agents/claude-code.d.ts.map +1 -0
- package/dist/cli/agents/claude-code.js +111 -0
- package/dist/cli/agents/claude-code.js.map +1 -0
- package/dist/cli/agents/cursor.d.ts +21 -0
- package/dist/cli/agents/cursor.d.ts.map +1 -0
- package/dist/cli/agents/cursor.js +58 -0
- package/dist/cli/agents/cursor.js.map +1 -0
- package/dist/cli/agents/gemini-cli.d.ts +21 -0
- package/dist/cli/agents/gemini-cli.d.ts.map +1 -0
- package/dist/cli/agents/gemini-cli.js +55 -0
- package/dist/cli/agents/gemini-cli.js.map +1 -0
- package/dist/cli/agents/registry.d.ts +21 -0
- package/dist/cli/agents/registry.d.ts.map +1 -0
- package/dist/cli/agents/registry.js +27 -0
- package/dist/cli/agents/registry.js.map +1 -0
- package/dist/cli/agents/utils.d.ts +26 -0
- package/dist/cli/agents/utils.d.ts.map +1 -0
- package/dist/cli/agents/utils.js +136 -0
- package/dist/cli/agents/utils.js.map +1 -0
- package/dist/cli/agents/vscode.d.ts +21 -0
- package/dist/cli/agents/vscode.d.ts.map +1 -0
- package/dist/cli/agents/vscode.js +62 -0
- package/dist/cli/agents/vscode.js.map +1 -0
- package/dist/cli/auth.d.ts +2 -0
- package/dist/cli/auth.d.ts.map +1 -0
- package/dist/cli/auth.js +94 -0
- package/dist/cli/auth.js.map +1 -0
- package/dist/cli/backfill.d.ts +2 -0
- package/dist/cli/backfill.d.ts.map +1 -0
- package/dist/cli/backfill.js +58 -0
- package/dist/cli/backfill.js.map +1 -0
- package/dist/cli/daemon.d.ts +6 -1
- package/dist/cli/daemon.d.ts.map +1 -1
- package/dist/cli/daemon.js +61 -3
- package/dist/cli/daemon.js.map +1 -1
- package/dist/cli/doctor.d.ts +8 -0
- package/dist/cli/doctor.d.ts.map +1 -0
- package/dist/cli/doctor.js +344 -0
- package/dist/cli/doctor.js.map +1 -0
- package/dist/cli/health.d.ts +1 -1
- package/dist/cli/health.d.ts.map +1 -1
- package/dist/cli/health.js +42 -3
- package/dist/cli/health.js.map +1 -1
- package/dist/cli/help.d.ts +6 -0
- package/dist/cli/help.d.ts.map +1 -0
- package/dist/cli/help.js +63 -0
- package/dist/cli/help.js.map +1 -0
- package/dist/cli/index.d.ts +1 -1
- package/dist/cli/index.d.ts.map +1 -1
- package/dist/cli/index.js +35 -7
- package/dist/cli/index.js.map +1 -1
- package/dist/cli/init.d.ts +2 -0
- package/dist/cli/init.d.ts.map +1 -0
- package/dist/cli/init.js +201 -0
- package/dist/cli/init.js.map +1 -0
- package/dist/cli/plugin.d.ts +5 -0
- package/dist/cli/plugin.d.ts.map +1 -0
- package/dist/cli/plugin.js +185 -0
- package/dist/cli/plugin.js.map +1 -0
- package/dist/cli/setup-mcp.d.ts +2 -0
- package/dist/cli/setup-mcp.d.ts.map +1 -0
- package/dist/cli/setup-mcp.js +114 -0
- package/dist/cli/setup-mcp.js.map +1 -0
- package/dist/cli/shell.d.ts +2 -0
- package/dist/cli/shell.d.ts.map +1 -0
- package/dist/cli/shell.js +86 -0
- package/dist/cli/shell.js.map +1 -0
- package/dist/cli/shutdown.d.ts +2 -0
- package/dist/cli/shutdown.d.ts.map +1 -0
- package/dist/cli/shutdown.js +26 -0
- package/dist/cli/shutdown.js.map +1 -0
- package/dist/cli/status.d.ts +2 -0
- package/dist/cli/status.d.ts.map +1 -0
- package/dist/cli/status.js +31 -0
- package/dist/cli/status.js.map +1 -0
- package/dist/cli/telemetry.d.ts +10 -0
- package/dist/cli/telemetry.d.ts.map +1 -0
- package/dist/cli/telemetry.js +56 -0
- package/dist/cli/telemetry.js.map +1 -0
- package/dist/cli/tui/agents-types.d.ts +28 -0
- package/dist/cli/tui/agents-types.d.ts.map +1 -0
- package/dist/cli/tui/agents-types.js +1 -0
- package/dist/cli/tui/agents-types.js.map +1 -0
- package/dist/cli/tui/agents.d.ts +11 -0
- package/dist/cli/tui/agents.d.ts.map +1 -0
- package/dist/cli/tui/agents.js +93 -0
- package/dist/cli/tui/agents.js.map +1 -0
- package/dist/cli/tui/banner.d.ts +3 -0
- package/dist/cli/tui/banner.d.ts.map +1 -0
- package/dist/cli/tui/banner.js +30 -0
- package/dist/cli/tui/banner.js.map +1 -0
- package/dist/cli/tui/components/AgentSelect.d.ts +13 -0
- package/dist/cli/tui/components/AgentSelect.d.ts.map +1 -0
- package/dist/cli/tui/components/AgentSelect.js +116 -0
- package/dist/cli/tui/components/AgentSelect.js.map +1 -0
- package/dist/cli/tui/components/Banner.d.ts +6 -0
- package/dist/cli/tui/components/Banner.d.ts.map +1 -0
- package/dist/cli/tui/components/Banner.js +25 -0
- package/dist/cli/tui/components/Banner.js.map +1 -0
- package/dist/cli/tui/components/BrowserSelect.d.ts +7 -0
- package/dist/cli/tui/components/BrowserSelect.d.ts.map +1 -0
- package/dist/cli/tui/components/BrowserSelect.js +19 -0
- package/dist/cli/tui/components/BrowserSelect.js.map +1 -0
- package/dist/cli/tui/components/InstallProgress.d.ts +9 -0
- package/dist/cli/tui/components/InstallProgress.d.ts.map +1 -0
- package/dist/cli/tui/components/InstallProgress.js +67 -0
- package/dist/cli/tui/components/InstallProgress.js.map +1 -0
- package/dist/cli/tui/components/SkillInstall.d.ts +14 -0
- package/dist/cli/tui/components/SkillInstall.d.ts.map +1 -0
- package/dist/cli/tui/components/SkillInstall.js +94 -0
- package/dist/cli/tui/components/SkillInstall.js.map +1 -0
- package/dist/cli/tui/components/Summary.d.ts +22 -0
- package/dist/cli/tui/components/Summary.d.ts.map +1 -0
- package/dist/cli/tui/components/Summary.js +135 -0
- package/dist/cli/tui/components/Summary.js.map +1 -0
- package/dist/cli/tui/components/SystemCheck.d.ts +8 -0
- package/dist/cli/tui/components/SystemCheck.d.ts.map +1 -0
- package/dist/cli/tui/components/SystemCheck.js +71 -0
- package/dist/cli/tui/components/SystemCheck.js.map +1 -0
- package/dist/cli/tui/components/Verification.d.ts +8 -0
- package/dist/cli/tui/components/Verification.d.ts.map +1 -0
- package/dist/cli/tui/components/Verification.js +63 -0
- package/dist/cli/tui/components/Verification.js.map +1 -0
- package/dist/cli/tui/config-writer-cli.d.ts +12 -0
- package/dist/cli/tui/config-writer-cli.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-cli.js +39 -0
- package/dist/cli/tui/config-writer-cli.js.map +1 -0
- package/dist/cli/tui/config-writer-json.d.ts +16 -0
- package/dist/cli/tui/config-writer-json.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-json.js +86 -0
- package/dist/cli/tui/config-writer-json.js.map +1 -0
- package/dist/cli/tui/config-writer-toml.d.ts +16 -0
- package/dist/cli/tui/config-writer-toml.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-toml.js +83 -0
- package/dist/cli/tui/config-writer-toml.js.map +1 -0
- package/dist/cli/tui/config-writer.d.ts +25 -0
- package/dist/cli/tui/config-writer.d.ts.map +1 -0
- package/dist/cli/tui/config-writer.js +101 -0
- package/dist/cli/tui/config-writer.js.map +1 -0
- package/dist/cli/tui/detect-helpers.d.ts +6 -0
- package/dist/cli/tui/detect-helpers.d.ts.map +1 -0
- package/dist/cli/tui/detect-helpers.js +45 -0
- package/dist/cli/tui/detect-helpers.js.map +1 -0
- package/dist/cli/tui/extras-prompt.d.ts +7 -0
- package/dist/cli/tui/extras-prompt.d.ts.map +1 -0
- package/dist/cli/tui/extras-prompt.js +42 -0
- package/dist/cli/tui/extras-prompt.js.map +1 -0
- package/dist/cli/tui/flags-types.d.ts +19 -0
- package/dist/cli/tui/flags-types.d.ts.map +1 -0
- package/dist/cli/tui/flags-types.js +23 -0
- package/dist/cli/tui/flags-types.js.map +1 -0
- package/dist/cli/tui/flags.d.ts +5 -0
- package/dist/cli/tui/flags.d.ts.map +1 -0
- package/dist/cli/tui/flags.js +132 -0
- package/dist/cli/tui/flags.js.map +1 -0
- package/dist/cli/tui/format.d.ts +14 -0
- package/dist/cli/tui/format.d.ts.map +1 -0
- package/dist/cli/tui/format.js +37 -0
- package/dist/cli/tui/format.js.map +1 -0
- package/dist/cli/tui/hooks/useAgentDetect.d.ts +6 -0
- package/dist/cli/tui/hooks/useAgentDetect.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useAgentDetect.js +19 -0
- package/dist/cli/tui/hooks/useAgentDetect.js.map +1 -0
- package/dist/cli/tui/hooks/useInstall.d.ts +14 -0
- package/dist/cli/tui/hooks/useInstall.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useInstall.js +90 -0
- package/dist/cli/tui/hooks/useInstall.js.map +1 -0
- package/dist/cli/tui/hooks/useSystemCheck.d.ts +13 -0
- package/dist/cli/tui/hooks/useSystemCheck.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useSystemCheck.js +95 -0
- package/dist/cli/tui/hooks/useSystemCheck.js.map +1 -0
- package/dist/cli/tui/hooks/useVerify.d.ts +14 -0
- package/dist/cli/tui/hooks/useVerify.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useVerify.js +71 -0
- package/dist/cli/tui/hooks/useVerify.js.map +1 -0
- package/dist/cli/tui/ink-init.d.ts +2 -0
- package/dist/cli/tui/ink-init.d.ts.map +1 -0
- package/dist/cli/tui/ink-init.js +198 -0
- package/dist/cli/tui/ink-init.js.map +1 -0
- package/dist/cli/tui/reporter-auto.d.ts +7 -0
- package/dist/cli/tui/reporter-auto.d.ts.map +1 -0
- package/dist/cli/tui/reporter-auto.js +15 -0
- package/dist/cli/tui/reporter-auto.js.map +1 -0
- package/dist/cli/tui/reporter.d.ts +26 -0
- package/dist/cli/tui/reporter.d.ts.map +1 -0
- package/dist/cli/tui/reporter.js +32 -0
- package/dist/cli/tui/reporter.js.map +1 -0
- package/dist/cli/tui/run-command.d.ts +14 -0
- package/dist/cli/tui/run-command.d.ts.map +1 -0
- package/dist/cli/tui/run-command.js +72 -0
- package/dist/cli/tui/run-command.js.map +1 -0
- package/dist/cli/tui/select-agents.d.ts +6 -0
- package/dist/cli/tui/select-agents.d.ts.map +1 -0
- package/dist/cli/tui/select-agents.js +32 -0
- package/dist/cli/tui/select-agents.js.map +1 -0
- package/dist/cli/tui/status-agents.d.ts +11 -0
- package/dist/cli/tui/status-agents.d.ts.map +1 -0
- package/dist/cli/tui/status-agents.js +53 -0
- package/dist/cli/tui/status-agents.js.map +1 -0
- package/dist/cli/tui/status-cache.d.ts +6 -0
- package/dist/cli/tui/status-cache.d.ts.map +1 -0
- package/dist/cli/tui/status-cache.js +39 -0
- package/dist/cli/tui/status-cache.js.map +1 -0
- package/dist/cli/tui/status-format.d.ts +14 -0
- package/dist/cli/tui/status-format.d.ts.map +1 -0
- package/dist/cli/tui/status-format.js +41 -0
- package/dist/cli/tui/status-format.js.map +1 -0
- package/dist/cli/tui/status-python.d.ts +6 -0
- package/dist/cli/tui/status-python.d.ts.map +1 -0
- package/dist/cli/tui/status-python.js +30 -0
- package/dist/cli/tui/status-python.js.map +1 -0
- package/dist/cli/tui/system-check.d.ts +24 -0
- package/dist/cli/tui/system-check.d.ts.map +1 -0
- package/dist/cli/tui/system-check.js +103 -0
- package/dist/cli/tui/system-check.js.map +1 -0
- package/dist/cli/tui/tui-reporter.d.ts +19 -0
- package/dist/cli/tui/tui-reporter.d.ts.map +1 -0
- package/dist/cli/tui/tui-reporter.js +95 -0
- package/dist/cli/tui/tui-reporter.js.map +1 -0
- package/dist/cli/tui/utils/config-writer.d.ts +3 -0
- package/dist/cli/tui/utils/config-writer.d.ts.map +1 -0
- package/dist/cli/tui/utils/config-writer.js +22 -0
- package/dist/cli/tui/utils/config-writer.js.map +1 -0
- package/dist/cli/tui/utils/suppress-logs.d.ts +3 -0
- package/dist/cli/tui/utils/suppress-logs.d.ts.map +1 -0
- package/dist/cli/tui/utils/suppress-logs.js +11 -0
- package/dist/cli/tui/utils/suppress-logs.js.map +1 -0
- package/dist/cli/tui/verify-suggestions.d.ts +5 -0
- package/dist/cli/tui/verify-suggestions.d.ts.map +1 -0
- package/dist/cli/tui/verify-suggestions.js +20 -0
- package/dist/cli/tui/verify-suggestions.js.map +1 -0
- package/dist/cli/tui/verify.d.ts +14 -0
- package/dist/cli/tui/verify.d.ts.map +1 -0
- package/dist/cli/tui/verify.js +101 -0
- package/dist/cli/tui/verify.js.map +1 -0
- package/dist/cli/tui/version.d.ts +2 -0
- package/dist/cli/tui/version.d.ts.map +1 -0
- package/dist/cli/tui/version.js +14 -0
- package/dist/cli/tui/version.js.map +1 -0
- package/dist/cli/uninstall.d.ts +2 -0
- package/dist/cli/uninstall.d.ts.map +1 -0
- package/dist/cli/uninstall.js +57 -0
- package/dist/cli/uninstall.js.map +1 -0
- package/dist/cli/warmup.d.ts +10 -2
- package/dist/cli/warmup.d.ts.map +1 -1
- package/dist/cli/warmup.js +226 -93
- package/dist/cli/warmup.js.map +1 -1
- package/dist/config.d.ts +28 -2
- package/dist/config.d.ts.map +1 -1
- package/dist/config.js +106 -56
- package/dist/config.js.map +1 -1
- package/dist/crawl/crawler.d.ts +6 -0
- package/dist/crawl/crawler.d.ts.map +1 -1
- package/dist/crawl/crawler.js +210 -209
- package/dist/crawl/crawler.js.map +1 -1
- package/dist/crawl/dedup.d.ts +1 -0
- package/dist/crawl/dedup.d.ts.map +1 -1
- package/dist/crawl/dedup.js +124 -81
- package/dist/crawl/dedup.js.map +1 -1
- package/dist/crawl/etag-incremental.d.ts +43 -0
- package/dist/crawl/etag-incremental.d.ts.map +1 -0
- package/dist/crawl/etag-incremental.js +94 -0
- package/dist/crawl/etag-incremental.js.map +1 -0
- package/dist/crawl/index-to-vec.d.ts +10 -0
- package/dist/crawl/index-to-vec.d.ts.map +1 -0
- package/dist/crawl/index-to-vec.js +44 -0
- package/dist/crawl/index-to-vec.js.map +1 -0
- package/dist/crawl/mapper.js +136 -164
- package/dist/crawl/mapper.js.map +1 -1
- package/dist/crawl/rate-limiter.js +63 -66
- package/dist/crawl/rate-limiter.js.map +1 -1
- package/dist/crawl/robots.js +58 -57
- package/dist/crawl/robots.js.map +1 -1
- package/dist/crawl/sitemap-first.d.ts +12 -0
- package/dist/crawl/sitemap-first.d.ts.map +1 -0
- package/dist/crawl/sitemap-first.js +47 -0
- package/dist/crawl/sitemap-first.js.map +1 -0
- package/dist/crawl/sitemap.js +33 -32
- package/dist/crawl/sitemap.js.map +1 -1
- package/dist/crawl/url-utils.d.ts +1 -0
- package/dist/crawl/url-utils.d.ts.map +1 -1
- package/dist/crawl/url-utils.js +49 -37
- package/dist/crawl/url-utils.js.map +1 -1
- package/dist/daemon/health-check.d.ts +16 -0
- package/dist/daemon/health-check.d.ts.map +1 -0
- package/dist/daemon/health-check.js +33 -0
- package/dist/daemon/health-check.js.map +1 -0
- package/dist/daemon/http-server.d.ts +26 -0
- package/dist/daemon/http-server.d.ts.map +1 -0
- package/dist/daemon/http-server.js +275 -0
- package/dist/daemon/http-server.js.map +1 -0
- package/dist/daemon/proxy.d.ts +10 -0
- package/dist/daemon/proxy.d.ts.map +1 -0
- package/dist/daemon/proxy.js +93 -0
- package/dist/daemon/proxy.js.map +1 -0
- package/dist/embedding/embed.d.ts +59 -0
- package/dist/embedding/embed.d.ts.map +1 -0
- package/dist/embedding/embed.js +233 -0
- package/dist/embedding/embed.js.map +1 -0
- package/dist/embedding/fastembed-provider.d.ts +19 -0
- package/dist/embedding/fastembed-provider.d.ts.map +1 -0
- package/dist/embedding/fastembed-provider.js +51 -0
- package/dist/embedding/fastembed-provider.js.map +1 -0
- package/dist/embedding/key-terms.d.ts +12 -0
- package/dist/embedding/key-terms.d.ts.map +1 -0
- package/dist/embedding/key-terms.js +234 -0
- package/dist/embedding/key-terms.js.map +1 -0
- package/dist/extraction/boilerplate.d.ts +15 -0
- package/dist/extraction/boilerplate.d.ts.map +1 -0
- package/dist/extraction/boilerplate.js +52 -0
- package/dist/extraction/boilerplate.js.map +1 -0
- package/dist/extraction/defuddle.d.ts.map +1 -1
- package/dist/extraction/defuddle.js +27 -23
- package/dist/extraction/defuddle.js.map +1 -1
- package/dist/extraction/extract.d.ts.map +1 -1
- package/dist/extraction/extract.js +76 -76
- package/dist/extraction/extract.js.map +1 -1
- package/dist/extraction/jsonld.js +50 -54
- package/dist/extraction/jsonld.js.map +1 -1
- package/dist/extraction/lang-hints.d.ts +2 -0
- package/dist/extraction/lang-hints.d.ts.map +1 -0
- package/dist/extraction/lang-hints.js +30 -0
- package/dist/extraction/lang-hints.js.map +1 -0
- package/dist/extraction/llm-fallback.d.ts +17 -0
- package/dist/extraction/llm-fallback.d.ts.map +1 -0
- package/dist/extraction/llm-fallback.js +130 -0
- package/dist/extraction/llm-fallback.js.map +1 -0
- package/dist/extraction/markdown-sanitize.d.ts +2 -0
- package/dist/extraction/markdown-sanitize.d.ts.map +1 -0
- package/dist/extraction/markdown-sanitize.js +151 -0
- package/dist/extraction/markdown-sanitize.js.map +1 -0
- package/dist/extraction/markdown.d.ts +11 -0
- package/dist/extraction/markdown.d.ts.map +1 -1
- package/dist/extraction/markdown.js +195 -91
- package/dist/extraction/markdown.js.map +1 -1
- package/dist/extraction/pipeline.d.ts +8 -0
- package/dist/extraction/pipeline.d.ts.map +1 -1
- package/dist/extraction/pipeline.js +57 -91
- package/dist/extraction/pipeline.js.map +1 -1
- package/dist/extraction/readability.d.ts +1 -1
- package/dist/extraction/readability.d.ts.map +1 -1
- package/dist/extraction/readability.js +28 -29
- package/dist/extraction/readability.js.map +1 -1
- package/dist/extraction/schema.d.ts +12 -0
- package/dist/extraction/schema.d.ts.map +1 -1
- package/dist/extraction/schema.js +135 -72
- package/dist/extraction/schema.js.map +1 -1
- package/dist/extraction/site-extractors/docs-generic.d.ts.map +1 -1
- package/dist/extraction/site-extractors/docs-generic.js +81 -91
- package/dist/extraction/site-extractors/docs-generic.js.map +1 -1
- package/dist/extraction/site-extractors/github.d.ts.map +1 -1
- package/dist/extraction/site-extractors/github.js +87 -95
- package/dist/extraction/site-extractors/github.js.map +1 -1
- package/dist/extraction/site-extractors/mdn.d.ts.map +1 -1
- package/dist/extraction/site-extractors/mdn.js +46 -54
- package/dist/extraction/site-extractors/mdn.js.map +1 -1
- package/dist/extraction/site-extractors/stackoverflow.d.ts.map +1 -1
- package/dist/extraction/site-extractors/stackoverflow.js +71 -80
- package/dist/extraction/site-extractors/stackoverflow.js.map +1 -1
- package/dist/extraction/structured-data.d.ts +4 -0
- package/dist/extraction/structured-data.d.ts.map +1 -0
- package/dist/extraction/structured-data.js +173 -0
- package/dist/extraction/structured-data.js.map +1 -0
- package/dist/extraction/structured.d.ts +4 -0
- package/dist/extraction/structured.d.ts.map +1 -0
- package/dist/extraction/structured.js +163 -0
- package/dist/extraction/structured.js.map +1 -0
- package/dist/extraction/v1/classifier.d.ts +3 -0
- package/dist/extraction/v1/classifier.d.ts.map +1 -0
- package/dist/extraction/v1/classifier.js +110 -0
- package/dist/extraction/v1/classifier.js.map +1 -0
- package/dist/extraction/v1/extract-provider.d.ts +16 -0
- package/dist/extraction/v1/extract-provider.d.ts.map +1 -0
- package/dist/extraction/v1/extract-provider.js +43 -0
- package/dist/extraction/v1/extract-provider.js.map +1 -0
- package/dist/extraction/v1/local-llm.d.ts +8 -0
- package/dist/extraction/v1/local-llm.d.ts.map +1 -0
- package/dist/extraction/v1/local-llm.js +34 -0
- package/dist/extraction/v1/local-llm.js.map +1 -0
- package/dist/extraction/v1/news.d.ts +3 -0
- package/dist/extraction/v1/news.d.ts.map +1 -0
- package/dist/extraction/v1/news.js +61 -0
- package/dist/extraction/v1/news.js.map +1 -0
- package/dist/extraction/v1/product.d.ts +3 -0
- package/dist/extraction/v1/product.d.ts.map +1 -0
- package/dist/extraction/v1/product.js +166 -0
- package/dist/extraction/v1/product.js.map +1 -0
- package/dist/extraction/v1/recipe.d.ts +3 -0
- package/dist/extraction/v1/recipe.d.ts.map +1 -0
- package/dist/extraction/v1/recipe.js +136 -0
- package/dist/extraction/v1/recipe.js.map +1 -0
- package/dist/extraction/v1/routed.d.ts +17 -0
- package/dist/extraction/v1/routed.d.ts.map +1 -0
- package/dist/extraction/v1/routed.js +68 -0
- package/dist/extraction/v1/routed.js.map +1 -0
- package/dist/extraction/v1/schemas/Article.d.ts +11 -0
- package/dist/extraction/v1/schemas/Article.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Article.js +23 -0
- package/dist/extraction/v1/schemas/Article.js.map +1 -0
- package/dist/extraction/v1/schemas/CodeSnippet.d.ts +9 -0
- package/dist/extraction/v1/schemas/CodeSnippet.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/CodeSnippet.js +90 -0
- package/dist/extraction/v1/schemas/CodeSnippet.js.map +1 -0
- package/dist/extraction/v1/schemas/EventListing.d.ts +10 -0
- package/dist/extraction/v1/schemas/EventListing.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/EventListing.js +122 -0
- package/dist/extraction/v1/schemas/EventListing.js.map +1 -0
- package/dist/extraction/v1/schemas/Paper.d.ts +10 -0
- package/dist/extraction/v1/schemas/Paper.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Paper.js +156 -0
- package/dist/extraction/v1/schemas/Paper.js.map +1 -0
- package/dist/extraction/v1/schemas/Product.d.ts +17 -0
- package/dist/extraction/v1/schemas/Product.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Product.js +149 -0
- package/dist/extraction/v1/schemas/Product.js.map +1 -0
- package/dist/extraction/v1/schemas/Recipe.d.ts +14 -0
- package/dist/extraction/v1/schemas/Recipe.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Recipe.js +160 -0
- package/dist/extraction/v1/schemas/Recipe.js.map +1 -0
- package/dist/extraction/v1/schemas/index.d.ts +13 -0
- package/dist/extraction/v1/schemas/index.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/index.js +44 -0
- package/dist/extraction/v1/schemas/index.js.map +1 -0
- package/dist/extraction/v1/site-extractors.d.ts +5 -0
- package/dist/extraction/v1/site-extractors.d.ts.map +1 -0
- package/dist/extraction/v1/site-extractors.js +31 -0
- package/dist/extraction/v1/site-extractors.js.map +1 -0
- package/dist/fetch/action-executor.d.ts +28 -0
- package/dist/fetch/action-executor.d.ts.map +1 -0
- package/dist/fetch/action-executor.js +88 -0
- package/dist/fetch/action-executor.js.map +1 -0
- package/dist/fetch/auth.d.ts +2 -1
- package/dist/fetch/auth.d.ts.map +1 -1
- package/dist/fetch/auth.js +56 -26
- package/dist/fetch/auth.js.map +1 -1
- package/dist/fetch/browser-pool.d.ts +30 -11
- package/dist/fetch/browser-pool.d.ts.map +1 -1
- package/dist/fetch/browser-pool.js +303 -127
- package/dist/fetch/browser-pool.js.map +1 -1
- package/dist/fetch/browser-selector.d.ts +17 -0
- package/dist/fetch/browser-selector.d.ts.map +1 -0
- package/dist/fetch/browser-selector.js +72 -0
- package/dist/fetch/browser-selector.js.map +1 -0
- package/dist/fetch/browser-types.d.ts +3 -0
- package/dist/fetch/browser-types.d.ts.map +1 -0
- package/dist/fetch/browser-types.js +45 -0
- package/dist/fetch/browser-types.js.map +1 -0
- package/dist/fetch/cdp-client.d.ts +9 -0
- package/dist/fetch/cdp-client.d.ts.map +1 -0
- package/dist/fetch/cdp-client.js +89 -0
- package/dist/fetch/cdp-client.js.map +1 -0
- package/dist/fetch/content-check.js +39 -46
- package/dist/fetch/content-check.js.map +1 -1
- package/dist/fetch/error-describe.d.ts +7 -0
- package/dist/fetch/error-describe.d.ts.map +1 -0
- package/dist/fetch/error-describe.js +37 -0
- package/dist/fetch/error-describe.js.map +1 -0
- package/dist/fetch/http-client.d.ts +4 -0
- package/dist/fetch/http-client.d.ts.map +1 -1
- package/dist/fetch/http-client.js +147 -128
- package/dist/fetch/http-client.js.map +1 -1
- package/dist/fetch/lightpanda.d.ts +28 -0
- package/dist/fetch/lightpanda.d.ts.map +1 -0
- package/dist/fetch/lightpanda.js +174 -0
- package/dist/fetch/lightpanda.js.map +1 -0
- package/dist/fetch/playwright-tier.d.ts +19 -0
- package/dist/fetch/playwright-tier.d.ts.map +1 -0
- package/dist/fetch/playwright-tier.js +76 -0
- package/dist/fetch/playwright-tier.js.map +1 -0
- package/dist/fetch/router.d.ts +49 -3
- package/dist/fetch/router.d.ts.map +1 -1
- package/dist/fetch/router.js +187 -81
- package/dist/fetch/router.js.map +1 -1
- package/dist/index.js +102 -17
- package/dist/index.js.map +1 -1
- package/dist/instructions.d.ts +31 -0
- package/dist/instructions.d.ts.map +1 -0
- package/dist/instructions.js +245 -0
- package/dist/instructions.js.map +1 -0
- package/dist/integrations/cloud/llm/anthropic.d.ts +3 -0
- package/dist/integrations/cloud/llm/anthropic.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/anthropic.js +41 -0
- package/dist/integrations/cloud/llm/anthropic.js.map +1 -0
- package/dist/integrations/cloud/llm/cache.d.ts +5 -0
- package/dist/integrations/cloud/llm/cache.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/cache.js +49 -0
- package/dist/integrations/cloud/llm/cache.js.map +1 -0
- package/dist/integrations/cloud/llm/gemini.d.ts +3 -0
- package/dist/integrations/cloud/llm/gemini.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/gemini.js +37 -0
- package/dist/integrations/cloud/llm/gemini.js.map +1 -0
- package/dist/integrations/cloud/llm/groq.d.ts +3 -0
- package/dist/integrations/cloud/llm/groq.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/groq.js +74 -0
- package/dist/integrations/cloud/llm/groq.js.map +1 -0
- package/dist/integrations/cloud/llm/hash.d.ts +3 -0
- package/dist/integrations/cloud/llm/hash.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/hash.js +26 -0
- package/dist/integrations/cloud/llm/hash.js.map +1 -0
- package/dist/integrations/cloud/llm/model-select.d.ts +5 -0
- package/dist/integrations/cloud/llm/model-select.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/model-select.js +32 -0
- package/dist/integrations/cloud/llm/model-select.js.map +1 -0
- package/dist/integrations/cloud/llm/openai.d.ts +3 -0
- package/dist/integrations/cloud/llm/openai.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/openai.js +43 -0
- package/dist/integrations/cloud/llm/openai.js.map +1 -0
- package/dist/integrations/cloud/llm/run.d.ts +27 -0
- package/dist/integrations/cloud/llm/run.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/run.js +99 -0
- package/dist/integrations/cloud/llm/run.js.map +1 -0
- package/dist/integrations/cloud/llm/select.d.ts +5 -0
- package/dist/integrations/cloud/llm/select.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/select.js +30 -0
- package/dist/integrations/cloud/llm/select.js.map +1 -0
- package/dist/integrations/cloud/llm/text-adapters.d.ts +19 -0
- package/dist/integrations/cloud/llm/text-adapters.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/text-adapters.js +103 -0
- package/dist/integrations/cloud/llm/text-adapters.js.map +1 -0
- package/dist/integrations/cloud/llm/types.d.ts +24 -0
- package/dist/integrations/cloud/llm/types.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/types.js +1 -0
- package/dist/integrations/cloud/llm/types.js.map +1 -0
- package/dist/integrations/cloud/llm/validate.d.ts +6 -0
- package/dist/integrations/cloud/llm/validate.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/validate.js +63 -0
- package/dist/integrations/cloud/llm/validate.js.map +1 -0
- package/dist/logger.d.ts +4 -1
- package/dist/logger.d.ts.map +1 -1
- package/dist/logger.js +71 -30
- package/dist/logger.js.map +1 -1
- package/dist/pdf-parse.d.js +1 -0
- package/dist/pdf-parse.d.js.map +1 -0
- package/dist/plugins/loader.d.ts +20 -0
- package/dist/plugins/loader.d.ts.map +1 -0
- package/dist/plugins/loader.js +157 -0
- package/dist/plugins/loader.js.map +1 -0
- package/dist/plugins/registry.d.ts +26 -0
- package/dist/plugins/registry.d.ts.map +1 -0
- package/dist/plugins/registry.js +71 -0
- package/dist/plugins/registry.js.map +1 -0
- package/dist/plugins/validate.d.ts +9 -0
- package/dist/plugins/validate.d.ts.map +1 -0
- package/dist/plugins/validate.js +79 -0
- package/dist/plugins/validate.js.map +1 -0
- package/dist/providers/embed-provider.d.ts +11 -0
- package/dist/providers/embed-provider.d.ts.map +1 -0
- package/dist/providers/embed-provider.js +24 -0
- package/dist/providers/embed-provider.js.map +1 -0
- package/dist/providers/extract-provider.d.ts +23 -0
- package/dist/providers/extract-provider.d.ts.map +1 -0
- package/dist/providers/extract-provider.js +25 -0
- package/dist/providers/extract-provider.js.map +1 -0
- package/dist/providers/rerank-provider.d.ts +17 -0
- package/dist/providers/rerank-provider.d.ts.map +1 -0
- package/dist/providers/rerank-provider.js +41 -0
- package/dist/providers/rerank-provider.js.map +1 -0
- package/dist/providers/search-provider.d.ts +25 -0
- package/dist/providers/search-provider.d.ts.map +1 -0
- package/dist/providers/search-provider.js +44 -0
- package/dist/providers/search-provider.js.map +1 -0
- package/dist/providers/vector-store.d.ts +27 -0
- package/dist/providers/vector-store.d.ts.map +1 -0
- package/dist/providers/vector-store.js +27 -0
- package/dist/providers/vector-store.js.map +1 -0
- package/dist/python-env.d.ts +9 -0
- package/dist/python-env.d.ts.map +1 -0
- package/dist/python-env.js +13 -0
- package/dist/python-env.js.map +1 -0
- package/dist/repl/commands/agent.d.ts +5 -0
- package/dist/repl/commands/agent.d.ts.map +1 -0
- package/dist/repl/commands/agent.js +62 -0
- package/dist/repl/commands/agent.js.map +1 -0
- package/dist/repl/commands/cache.d.ts +4 -0
- package/dist/repl/commands/cache.d.ts.map +1 -0
- package/dist/repl/commands/cache.js +43 -0
- package/dist/repl/commands/cache.js.map +1 -0
- package/dist/repl/commands/crawl.d.ts +7 -0
- package/dist/repl/commands/crawl.d.ts.map +1 -0
- package/dist/repl/commands/crawl.js +44 -0
- package/dist/repl/commands/crawl.js.map +1 -0
- package/dist/repl/commands/extract.d.ts +5 -0
- package/dist/repl/commands/extract.d.ts.map +1 -0
- package/dist/repl/commands/extract.js +47 -0
- package/dist/repl/commands/extract.js.map +1 -0
- package/dist/repl/commands/fetch.d.ts +5 -0
- package/dist/repl/commands/fetch.d.ts.map +1 -0
- package/dist/repl/commands/fetch.js +67 -0
- package/dist/repl/commands/fetch.js.map +1 -0
- package/dist/repl/commands/find-similar.d.ts +5 -0
- package/dist/repl/commands/find-similar.d.ts.map +1 -0
- package/dist/repl/commands/find-similar.js +74 -0
- package/dist/repl/commands/find-similar.js.map +1 -0
- package/dist/repl/commands/research.d.ts +5 -0
- package/dist/repl/commands/research.d.ts.map +1 -0
- package/dist/repl/commands/research.js +65 -0
- package/dist/repl/commands/research.js.map +1 -0
- package/dist/repl/commands/search.d.ts +5 -0
- package/dist/repl/commands/search.d.ts.map +1 -0
- package/dist/repl/commands/search.js +74 -0
- package/dist/repl/commands/search.js.map +1 -0
- package/dist/repl/commands/types.d.ts +9 -0
- package/dist/repl/commands/types.d.ts.map +1 -0
- package/dist/repl/commands/types.js +1 -0
- package/dist/repl/commands/types.js.map +1 -0
- package/dist/repl/formatters.d.ts +13 -0
- package/dist/repl/formatters.d.ts.map +1 -0
- package/dist/repl/formatters.js +283 -0
- package/dist/repl/formatters.js.map +1 -0
- package/dist/repl/parser.d.ts +9 -0
- package/dist/repl/parser.d.ts.map +1 -0
- package/dist/repl/parser.js +86 -0
- package/dist/repl/parser.js.map +1 -0
- package/dist/repl/shell.d.ts +8 -0
- package/dist/repl/shell.d.ts.map +1 -0
- package/dist/repl/shell.js +184 -0
- package/dist/repl/shell.js.map +1 -0
- package/dist/research/branch-exploration.d.ts +14 -0
- package/dist/research/branch-exploration.d.ts.map +1 -0
- package/dist/research/branch-exploration.js +100 -0
- package/dist/research/branch-exploration.js.map +1 -0
- package/dist/research/brief.d.ts +6 -0
- package/dist/research/brief.d.ts.map +1 -0
- package/dist/research/brief.js +246 -0
- package/dist/research/brief.js.map +1 -0
- package/dist/research/citation-graph.d.ts +9 -0
- package/dist/research/citation-graph.d.ts.map +1 -0
- package/dist/research/citation-graph.js +114 -0
- package/dist/research/citation-graph.js.map +1 -0
- package/dist/research/decompose.d.ts +14 -0
- package/dist/research/decompose.d.ts.map +1 -0
- package/dist/research/decompose.js +439 -0
- package/dist/research/decompose.js.map +1 -0
- package/dist/research/pipeline.d.ts +5 -0
- package/dist/research/pipeline.d.ts.map +1 -0
- package/dist/research/pipeline.js +269 -0
- package/dist/research/pipeline.js.map +1 -0
- package/dist/research/synthesis-local.d.ts +19 -0
- package/dist/research/synthesis-local.d.ts.map +1 -0
- package/dist/research/synthesis-local.js +62 -0
- package/dist/research/synthesis-local.js.map +1 -0
- package/dist/research/synthesize.d.ts +10 -0
- package/dist/research/synthesize.d.ts.map +1 -0
- package/dist/research/synthesize.js +137 -0
- package/dist/research/synthesize.js.map +1 -0
- package/dist/search/answer-synthesis.d.ts +33 -0
- package/dist/search/answer-synthesis.d.ts.map +1 -0
- package/dist/search/answer-synthesis.js +244 -0
- package/dist/search/answer-synthesis.js.map +1 -0
- package/dist/search/context-formatter.d.ts +3 -0
- package/dist/search/context-formatter.d.ts.map +1 -0
- package/dist/search/context-formatter.js +56 -0
- package/dist/search/context-formatter.js.map +1 -0
- package/dist/search/dedup.d.ts +1 -0
- package/dist/search/dedup.d.ts.map +1 -1
- package/dist/search/dedup.js +40 -32
- package/dist/search/dedup.js.map +1 -1
- package/dist/search/engines/arxiv.d.ts +7 -0
- package/dist/search/engines/arxiv.d.ts.map +1 -0
- package/dist/search/engines/arxiv.js +70 -0
- package/dist/search/engines/arxiv.js.map +1 -0
- package/dist/search/engines/bing-news.d.ts +7 -0
- package/dist/search/engines/bing-news.d.ts.map +1 -0
- package/dist/search/engines/bing-news.js +97 -0
- package/dist/search/engines/bing-news.js.map +1 -0
- package/dist/search/engines/bing.d.ts +1 -0
- package/dist/search/engines/bing.d.ts.map +1 -1
- package/dist/search/engines/bing.js +100 -44
- package/dist/search/engines/bing.js.map +1 -1
- package/dist/search/engines/devdocs.d.ts +6 -0
- package/dist/search/engines/devdocs.d.ts.map +1 -0
- package/dist/search/engines/devdocs.js +56 -0
- package/dist/search/engines/devdocs.js.map +1 -0
- package/dist/search/engines/duckduckgo.d.ts.map +1 -1
- package/dist/search/engines/duckduckgo.js +56 -44
- package/dist/search/engines/duckduckgo.js.map +1 -1
- package/dist/search/engines/github-code.d.ts +7 -0
- package/dist/search/engines/github-code.d.ts.map +1 -0
- package/dist/search/engines/github-code.js +55 -0
- package/dist/search/engines/github-code.js.map +1 -0
- package/dist/search/engines/hn-algolia.d.ts +7 -0
- package/dist/search/engines/hn-algolia.d.ts.map +1 -0
- package/dist/search/engines/hn-algolia.js +76 -0
- package/dist/search/engines/hn-algolia.js.map +1 -0
- package/dist/search/engines/lobsters.d.ts +7 -0
- package/dist/search/engines/lobsters.d.ts.map +1 -0
- package/dist/search/engines/lobsters.js +83 -0
- package/dist/search/engines/lobsters.js.map +1 -0
- package/dist/search/engines/mdn.d.ts +7 -0
- package/dist/search/engines/mdn.d.ts.map +1 -0
- package/dist/search/engines/mdn.js +48 -0
- package/dist/search/engines/mdn.js.map +1 -0
- package/dist/search/engines/semantic-scholar.d.ts +7 -0
- package/dist/search/engines/semantic-scholar.d.ts.map +1 -0
- package/dist/search/engines/semantic-scholar.js +69 -0
- package/dist/search/engines/semantic-scholar.js.map +1 -0
- package/dist/search/engines/stackoverflow.d.ts +7 -0
- package/dist/search/engines/stackoverflow.d.ts.map +1 -0
- package/dist/search/engines/stackoverflow.js +73 -0
- package/dist/search/engines/stackoverflow.js.map +1 -0
- package/dist/search/engines/startpage.d.ts.map +1 -1
- package/dist/search/engines/startpage.js +65 -46
- package/dist/search/engines/startpage.js.map +1 -1
- package/dist/search/evidence.d.ts +25 -0
- package/dist/search/evidence.d.ts.map +1 -0
- package/dist/search/evidence.js +220 -0
- package/dist/search/evidence.js.map +1 -0
- package/dist/search/filters.d.ts.map +1 -1
- package/dist/search/filters.js +58 -54
- package/dist/search/filters.js.map +1 -1
- package/dist/search/find-similar/crawl-rank.d.ts +9 -0
- package/dist/search/find-similar/crawl-rank.d.ts.map +1 -0
- package/dist/search/find-similar/crawl-rank.js +272 -0
- package/dist/search/find-similar/crawl-rank.js.map +1 -0
- package/dist/search/find-similar/mode.d.ts +4 -0
- package/dist/search/find-similar/mode.d.ts.map +1 -0
- package/dist/search/find-similar/mode.js +12 -0
- package/dist/search/find-similar/mode.js.map +1 -0
- package/dist/search/find-similar.d.ts +5 -0
- package/dist/search/find-similar.d.ts.map +1 -0
- package/dist/search/find-similar.js +509 -0
- package/dist/search/find-similar.js.map +1 -0
- package/dist/search/highlights.d.ts +19 -0
- package/dist/search/highlights.d.ts.map +1 -0
- package/dist/search/highlights.js +167 -0
- package/dist/search/highlights.js.map +1 -0
- package/dist/search/language-filter.d.ts +29 -0
- package/dist/search/language-filter.d.ts.map +1 -0
- package/dist/search/language-filter.js +126 -0
- package/dist/search/language-filter.js.map +1 -0
- package/dist/search/legacy/searxng-orchestrator.d.ts +4 -0
- package/dist/search/legacy/searxng-orchestrator.d.ts.map +1 -0
- package/dist/search/legacy/searxng-orchestrator.js +501 -0
- package/dist/search/legacy/searxng-orchestrator.js.map +1 -0
- package/dist/search/legacy/searxng-provider.d.ts +7 -0
- package/dist/search/legacy/searxng-provider.d.ts.map +1 -0
- package/dist/search/legacy/searxng-provider.js +11 -0
- package/dist/search/legacy/searxng-provider.js.map +1 -0
- package/dist/search/multi-query.d.ts +25 -0
- package/dist/search/multi-query.d.ts.map +1 -0
- package/dist/search/multi-query.js +228 -0
- package/dist/search/multi-query.js.map +1 -0
- package/dist/search/query.js +32 -34
- package/dist/search/query.js.map +1 -1
- package/dist/search/rerank.d.ts +3 -1
- package/dist/search/rerank.d.ts.map +1 -1
- package/dist/search/rerank.js +44 -35
- package/dist/search/rerank.js.map +1 -1
- package/dist/search/reranker/authority-boost.d.ts +3 -0
- package/dist/search/reranker/authority-boost.d.ts.map +1 -0
- package/dist/search/reranker/authority-boost.js +179 -0
- package/dist/search/reranker/authority-boost.js.map +1 -0
- package/dist/search/reranker/consensus-boost.d.ts +3 -0
- package/dist/search/reranker/consensus-boost.d.ts.map +1 -0
- package/dist/search/reranker/consensus-boost.js +27 -0
- package/dist/search/reranker/consensus-boost.js.map +1 -0
- package/dist/search/reranker/recency-boost.d.ts +3 -0
- package/dist/search/reranker/recency-boost.d.ts.map +1 -0
- package/dist/search/reranker/recency-boost.js +13 -0
- package/dist/search/reranker/recency-boost.js.map +1 -0
- package/dist/search/reranker/recency.d.ts +3 -0
- package/dist/search/reranker/recency.d.ts.map +1 -0
- package/dist/search/reranker/recency.js +23 -0
- package/dist/search/reranker/recency.js.map +1 -0
- package/dist/search/reranker/transformers-rerank-provider.d.ts +13 -0
- package/dist/search/reranker/transformers-rerank-provider.d.ts.map +1 -0
- package/dist/search/reranker/transformers-rerank-provider.js +94 -0
- package/dist/search/reranker/transformers-rerank-provider.js.map +1 -0
- package/dist/search/rrf.d.ts +17 -0
- package/dist/search/rrf.d.ts.map +1 -0
- package/dist/search/rrf.js +39 -0
- package/dist/search/rrf.js.map +1 -0
- package/dist/search/sampling.d.ts +25 -0
- package/dist/search/sampling.d.ts.map +1 -0
- package/dist/search/sampling.js +52 -0
- package/dist/search/sampling.js.map +1 -0
- package/dist/search/searxng.d.ts.map +1 -1
- package/dist/search/searxng.js +69 -79
- package/dist/search/searxng.js.map +1 -1
- package/dist/search/tokens.d.ts +3 -0
- package/dist/search/tokens.d.ts.map +1 -0
- package/dist/search/tokens.js +39 -0
- package/dist/search/tokens.js.map +1 -0
- package/dist/search/truncate.d.ts +6 -0
- package/dist/search/truncate.d.ts.map +1 -0
- package/dist/search/truncate.js +26 -0
- package/dist/search/truncate.js.map +1 -0
- package/dist/search/url-unwrap.d.ts +3 -0
- package/dist/search/url-unwrap.d.ts.map +1 -0
- package/dist/search/url-unwrap.js +43 -0
- package/dist/search/url-unwrap.js.map +1 -0
- package/dist/search/v1/context-rank.d.ts +13 -0
- package/dist/search/v1/context-rank.d.ts.map +1 -0
- package/dist/search/v1/context-rank.js +74 -0
- package/dist/search/v1/context-rank.js.map +1 -0
- package/dist/search/v1/engine-base.d.ts +27 -0
- package/dist/search/v1/engine-base.d.ts.map +1 -0
- package/dist/search/v1/engine-base.js +110 -0
- package/dist/search/v1/engine-base.js.map +1 -0
- package/dist/search/v1/intent-router.d.ts +22 -0
- package/dist/search/v1/intent-router.d.ts.map +1 -0
- package/dist/search/v1/intent-router.js +138 -0
- package/dist/search/v1/intent-router.js.map +1 -0
- package/dist/search/v1/orchestrator.d.ts +24 -0
- package/dist/search/v1/orchestrator.d.ts.map +1 -0
- package/dist/search/v1/orchestrator.js +163 -0
- package/dist/search/v1/orchestrator.js.map +1 -0
- package/dist/search/v1/recency-boost.d.ts +9 -0
- package/dist/search/v1/recency-boost.d.ts.map +1 -0
- package/dist/search/v1/recency-boost.js +37 -0
- package/dist/search/v1/recency-boost.js.map +1 -0
- package/dist/search/v1/recent-cache-dedup.d.ts +6 -0
- package/dist/search/v1/recent-cache-dedup.d.ts.map +1 -0
- package/dist/search/v1/recent-cache-dedup.js +85 -0
- package/dist/search/v1/recent-cache-dedup.js.map +1 -0
- package/dist/search/v1/rss/feed-config.d.ts +21 -0
- package/dist/search/v1/rss/feed-config.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-config.js +90 -0
- package/dist/search/v1/rss/feed-config.js.map +1 -0
- package/dist/search/v1/rss/feed-parser.d.ts +14 -0
- package/dist/search/v1/rss/feed-parser.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-parser.js +104 -0
- package/dist/search/v1/rss/feed-parser.js.map +1 -0
- package/dist/search/v1/rss/feed-poller.d.ts +22 -0
- package/dist/search/v1/rss/feed-poller.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-poller.js +102 -0
- package/dist/search/v1/rss/feed-poller.js.map +1 -0
- package/dist/search/v1/rss/feed-store.d.ts +30 -0
- package/dist/search/v1/rss/feed-store.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-store.js +134 -0
- package/dist/search/v1/rss/feed-store.js.map +1 -0
- package/dist/search/v1/rss/rss-engine.d.ts +6 -0
- package/dist/search/v1/rss/rss-engine.d.ts.map +1 -0
- package/dist/search/v1/rss/rss-engine.js +28 -0
- package/dist/search/v1/rss/rss-engine.js.map +1 -0
- package/dist/search/v1/v1-provider.d.ts +7 -0
- package/dist/search/v1/v1-provider.d.ts.map +1 -0
- package/dist/search/v1/v1-provider.js +68 -0
- package/dist/search/v1/v1-provider.js.map +1 -0
- package/dist/search/v1/verticals/code.d.ts +4 -0
- package/dist/search/v1/verticals/code.d.ts.map +1 -0
- package/dist/search/v1/verticals/code.js +20 -0
- package/dist/search/v1/verticals/code.js.map +1 -0
- package/dist/search/v1/verticals/docs.d.ts +4 -0
- package/dist/search/v1/verticals/docs.d.ts.map +1 -0
- package/dist/search/v1/verticals/docs.js +20 -0
- package/dist/search/v1/verticals/docs.js.map +1 -0
- package/dist/search/v1/verticals/general.d.ts +4 -0
- package/dist/search/v1/verticals/general.d.ts.map +1 -0
- package/dist/search/v1/verticals/general.js +22 -0
- package/dist/search/v1/verticals/general.js.map +1 -0
- package/dist/search/v1/verticals/news.d.ts +10 -0
- package/dist/search/v1/verticals/news.d.ts.map +1 -0
- package/dist/search/v1/verticals/news.js +52 -0
- package/dist/search/v1/verticals/news.js.map +1 -0
- package/dist/search/v1/verticals/papers.d.ts +4 -0
- package/dist/search/v1/verticals/papers.d.ts.map +1 -0
- package/dist/search/v1/verticals/papers.js +23 -0
- package/dist/search/v1/verticals/papers.js.map +1 -0
- package/dist/search/validator.js +31 -31
- package/dist/search/validator.js.map +1 -1
- package/dist/searxng/bootstrap.d.ts +30 -0
- package/dist/searxng/bootstrap.d.ts.map +1 -1
- package/dist/searxng/bootstrap.js +223 -85
- package/dist/searxng/bootstrap.js.map +1 -1
- package/dist/searxng/docker.d.ts.map +1 -1
- package/dist/searxng/docker.js +69 -60
- package/dist/searxng/docker.js.map +1 -1
- package/dist/searxng/process.d.ts +13 -1
- package/dist/searxng/process.d.ts.map +1 -1
- package/dist/searxng/process.js +231 -164
- package/dist/searxng/process.js.map +1 -1
- package/dist/server/backend-status.d.ts +13 -0
- package/dist/server/backend-status.d.ts.map +1 -0
- package/dist/server/backend-status.js +40 -0
- package/dist/server/backend-status.js.map +1 -0
- package/dist/server/tool-schemas.d.ts +549 -0
- package/dist/server/tool-schemas.d.ts.map +1 -0
- package/dist/server/tool-schemas.js +464 -0
- package/dist/server/tool-schemas.js.map +1 -0
- package/dist/server/warmup-on-start.d.ts +9 -0
- package/dist/server/warmup-on-start.d.ts.map +1 -0
- package/dist/server/warmup-on-start.js +55 -0
- package/dist/server/warmup-on-start.js.map +1 -0
- package/dist/server.d.ts +17 -0
- package/dist/server.d.ts.map +1 -1
- package/dist/server.js +454 -297
- package/dist/server.js.map +1 -1
- package/dist/tools/agent.d.ts +5 -0
- package/dist/tools/agent.d.ts.map +1 -0
- package/dist/tools/agent.js +128 -0
- package/dist/tools/agent.js.map +1 -0
- package/dist/tools/cache.d.ts +2 -1
- package/dist/tools/cache.d.ts.map +1 -1
- package/dist/tools/cache.js +177 -44
- package/dist/tools/cache.js.map +1 -1
- package/dist/tools/crawl.d.ts.map +1 -1
- package/dist/tools/crawl.js +171 -88
- package/dist/tools/crawl.js.map +1 -1
- package/dist/tools/extract.d.ts +2 -2
- package/dist/tools/extract.d.ts.map +1 -1
- package/dist/tools/extract.js +175 -59
- package/dist/tools/extract.js.map +1 -1
- package/dist/tools/fetch.d.ts +2 -2
- package/dist/tools/fetch.d.ts.map +1 -1
- package/dist/tools/fetch.js +174 -68
- package/dist/tools/fetch.js.map +1 -1
- package/dist/tools/find-similar.d.ts +5 -0
- package/dist/tools/find-similar.d.ts.map +1 -0
- package/dist/tools/find-similar.js +127 -0
- package/dist/tools/find-similar.js.map +1 -0
- package/dist/tools/research.d.ts +5 -0
- package/dist/tools/research.d.ts.map +1 -0
- package/dist/tools/research.js +107 -0
- package/dist/tools/research.js.map +1 -0
- package/dist/tools/search.d.ts +10 -2
- package/dist/tools/search.d.ts.map +1 -1
- package/dist/tools/search.js +13 -158
- package/dist/tools/search.js.map +1 -1
- package/dist/types.d.ts +350 -7
- package/dist/types.d.ts.map +1 -1
- package/dist/types.js +6 -1
- package/dist/types.js.map +1 -1
- package/dist/util/mode.d.ts +4 -0
- package/dist/util/mode.d.ts.map +1 -0
- package/dist/util/mode.js +34 -0
- package/dist/util/mode.js.map +1 -0
- package/package.json +78 -8
- package/dist/extraction/trafilatura.d.ts +0 -6
- package/dist/extraction/trafilatura.d.ts.map +0 -1
- package/dist/extraction/trafilatura.js +0 -105
- package/dist/extraction/trafilatura.js.map +0 -1
- package/dist/search/flashrank.d.ts +0 -12
- package/dist/search/flashrank.d.ts.map +0 -1
- package/dist/search/flashrank.js +0 -63
- package/dist/search/flashrank.js.map +0 -1
|
@@ -0,0 +1,271 @@
|
|
|
1
|
+
import { createLogger } from "../logger.js";
|
|
2
|
+
import {
|
|
3
|
+
requestSampling,
|
|
4
|
+
checkSamplingSupport
|
|
5
|
+
} from "../search/sampling.js";
|
|
6
|
+
import { preFilterCandidates } from "./relevance.js";
|
|
7
|
+
const log = createLogger("agent"); // module-scoped logger tagged "agent"
|
|
8
|
+
const MAX_SEARCH_QUERIES = 5; // upper bound on the number of search queries a plan may carry
|
|
9
|
+
const MAX_QUERY_LENGTH = 250; // upper bound, in characters, on a generated search query
|
|
10
|
+
/**
 * Passes candidate URLs through `preFilterCandidates` and reshapes the result
 * into plain URL strings (kept) and `{ url, reason }` records (excluded).
 *
 * @param {string[]} urls - Candidate URLs to screen.
 * @returns {{ kept: string[], excluded: { url: string, reason: string }[] }}
 *   The URLs that passed, and the rejected URLs with the filter's reason.
 */
function applyUrlFilter(urls) {
  const candidates = urls.map((url) => ({ url }));
  const { kept: accepted, excluded: rejected } = preFilterCandidates(candidates);

  const kept = accepted.map((candidate) => candidate.url);
  const excluded = rejected.map((rejection) => {
    return { url: rejection.item.url, reason: rejection.reason };
  });

  // Stay quiet unless the filter actually dropped something.
  if (excluded.length !== 0) {
    log.info("agent pre-filter", { kept: kept.length, excluded: excluded.length });
  }

  return { kept, excluded };
}
|
|
19
|
+
/**
 * Builds the agent's execution plan: which search queries to run and which
 * URLs to visit.
 *
 * Strategy, in order:
 *   1. Blank (or non-string) prompt: no searches, only the caller's URLs.
 *   2. `server` given and `planWithSampling` returns a plan: use that plan.
 *   3. Otherwise: keyword-based plan from `planWithFallback`.
 *
 * In every branch the planner's URLs are merged with the caller-supplied
 * `urls`, de-duplicated by `mergeUrls`, and screened by `applyUrlFilter`.
 *
 * @param {string} prompt - The user's request. A missing or non-string value
 *   is treated as an empty prompt instead of throwing.
 * @param {string[]} [urls] - URLs the caller explicitly wants included.
 * @param {object} [server] - Server handle forwarded to `planWithSampling`;
 *   when omitted, sampling is skipped.
 * @returns {Promise<{
 *   searches: string[],
 *   urls: string[],
 *   notes: string,
 *   samplingUsed: boolean,
 *   excluded_urls: { url: string, reason: string }[]
 * }>} The plan; `excluded_urls` lists URLs rejected by the pre-filter.
 */
async function planExecution(prompt, urls, server) {
  const explicitUrls = urls ?? [];

  // Single place where a plan is assembled, so every branch merges,
  // de-duplicates and filters URLs the same way and emits the same key order.
  const buildPlan = (searches, plannedUrls, notes, samplingUsed) => {
    const { kept, excluded } = applyUrlFilter(mergeUrls(plannedUrls, explicitUrls));
    return {
      searches,
      urls: kept,
      notes,
      samplingUsed,
      excluded_urls: excluded
    };
  };

  const trimmedPrompt = typeof prompt === "string" ? prompt.trim() : "";
  if (!trimmedPrompt) {
    return buildPlan([], [], "Empty prompt provided", false);
  }

  if (server) {
    try {
      const samplingResult = await planWithSampling(trimmedPrompt, server);
      if (samplingResult) {
        return buildPlan(
          samplingResult.searches,
          samplingResult.urls,
          samplingResult.notes,
          true
        );
      }
    } catch (err) {
      // Any failure on the sampling path degrades to the keyword fallback.
      log.warn("sampling planning failed, using fallback", {
        error: err instanceof Error ? err.message : String(err)
      });
    }
  }

  const fallback = planWithFallback(trimmedPrompt);
  return buildPlan(fallback.searches, fallback.urls, fallback.notes, false);
}
|
|
62
|
+
/**
 * Asks the connected client (via `requestSampling`) to draft a plan for the
 * prompt and validates the JSON it returns.
 *
 * The reply is parsed as JSON; if that fails, the outermost `{...}` span in
 * the text is tried instead. Search strings are trimmed, capped at
 * MAX_QUERY_LENGTH (the same limit the keyword fallback applies),
 * de-duplicated and limited to MAX_SEARCH_QUERIES. URLs are kept only when
 * `isValidUrl` accepts them.
 *
 * Never throws: every failure is logged at debug level and reported as `null`
 * so the caller can fall back.
 *
 * @param {string} prompt - Already-trimmed user prompt.
 * @param {object} server - Server handle passed to `checkSamplingSupport` and
 *   `requestSampling`.
 * @returns {Promise<{ searches: string[], urls: string[], notes: string } | null>}
 *   A validated plan, or `null` when sampling is unsupported, fails, or
 *   yields neither searches nor URLs.
 */
async function planWithSampling(prompt, server) {
  try {
    if (!checkSamplingSupport(server)) {
      log.debug("client does not support sampling for planning");
      return null;
    }

    const samplingPrompt = `You are a data gathering assistant. Given the user's prompt, create an execution plan.

Return a JSON object with:
- "searches": array of 1-5 search engine queries to find the needed data
- "urls": array of specific URLs to visit (if any are obvious from the prompt)
- "notes": brief string with any relevant observations

Prompt: ${prompt}

Respond with ONLY valid JSON: {"searches": [...], "urls": [...], "notes": "..."}`;

    // NOTE(review): 500 is presumably the response token budget; confirm
    // against requestSampling's signature.
    const response = await requestSampling(
      server,
      [{ role: "user", content: { type: "text", text: samplingPrompt } }],
      500
    );
    if (!response?.content?.text) {
      log.debug("sampling returned empty response for planning");
      return null;
    }

    const text = response.content.text.trim();
    let parsed;
    try {
      parsed = JSON.parse(text);
    } catch {
      // The reply may wrap the JSON in prose or a code fence; retry on the
      // outermost brace-delimited span.
      const jsonMatch = text.match(/\{[\s\S]*\}/);
      if (!jsonMatch) {
        log.debug("could not extract JSON from sampling plan response");
        return null;
      }
      try {
        parsed = JSON.parse(jsonMatch[0]);
      } catch {
        log.debug("could not extract JSON from sampling plan response");
        return null;
      }
    }

    if (typeof parsed !== "object" || parsed === null) return null;
    const obj = parsed;

    // Model output is untrusted: normalise, bound and de-duplicate queries.
    const searches = Array.isArray(obj.searches)
      ? [
          ...new Set(
            obj.searches
              .filter((s) => typeof s === "string" && s.trim().length > 0)
              .map((s) => s.trim().slice(0, MAX_QUERY_LENGTH).trimEnd())
          )
        ]
      : [];
    const extractedUrls = Array.isArray(obj.urls)
      ? obj.urls.filter((u) => typeof u === "string" && isValidUrl(u))
      : [];
    const notes = typeof obj.notes === "string" ? obj.notes : "";

    if (searches.length === 0 && extractedUrls.length === 0) {
      log.debug("sampling plan had no searches or URLs");
      return null;
    }

    return { searches: searches.slice(0, MAX_SEARCH_QUERIES), urls: extractedUrls, notes };
  } catch (err) {
    log.debug("sampling planning request failed", {
      error: err instanceof Error ? err.message : String(err)
    });
    return null;
  }
}
|
|
121
|
+
/**
 * Produces a plan without any model assistance: URLs are pulled straight out
 * of the prompt text and search queries are derived from its keywords.
 *
 * @param {string} prompt - Trimmed user prompt.
 * @returns {{ searches: string[], urls: string[], notes: string }}
 */
function planWithFallback(prompt) {
  const urls = extractUrlsFromText(prompt);
  return {
    searches: generateSearchQueries(prompt),
    urls,
    notes: "Fallback plan from keyword extraction"
  };
}
|
|
130
|
+
/**
 * Collects the distinct http(s) URLs that appear in free text.
 *
 * A match stops at whitespace or at any of `, ; " ' ) ]`; trailing sentence
 * punctuation is then stripped. Results keep first-seen order and only
 * include strings that `isValidUrl` accepts.
 *
 * @param {string} text - Text to scan.
 * @returns {string[]} Unique URLs in order of first appearance.
 */
function extractUrlsFromText(text) {
  const found = text.match(/https?:\/\/[^\s,;"')\]]+/gi) ?? [];
  const distinct = new Set();
  for (const raw of found) {
    distinct.add(raw.replace(/[.,;:!?)]+$/, ""));
  }
  return Array.from(distinct).filter((candidate) => isValidUrl(candidate));
}
|
|
136
|
+
/**
 * Reports whether a string is an absolute http(s) URL.
 *
 * Parsing alone is not enough: `new URL()` also accepts schemes such as
 * `javascript:`, `file:` and `mailto:`. This predicate screens URLs suggested
 * by a model, so anything that is not plain web traffic is rejected.
 *
 * @param {string} url - Candidate URL string.
 * @returns {boolean} `true` only for parseable URLs whose scheme is http or https.
 */
function isValidUrl(url) {
  let parsed;
  try {
    parsed = new URL(url);
  } catch {
    return false;
  }
  // URL normalises the scheme to lower case, so a direct comparison suffices.
  return parsed.protocol === "http:" || parsed.protocol === "https:";
}
|
|
144
|
+
/**
 * Derives up to MAX_SEARCH_QUERIES search-engine queries from a free-text
 * prompt using keyword heuristics only.
 *
 * Steps:
 *   1. Remove URLs (case-insensitively, matching how URLs are extracted
 *      elsewhere in this module) and punctuation, then drop stop words and
 *      one-character tokens.
 *   2. Emit, in this order: all content words; the first and second half of
 *      the words (4+ words); the first three adjacent word pairs joined
 *      together (3+ words); up to five "key terms" (2+ such terms).
 *   3. Clamp every query to MAX_QUERY_LENGTH, then de-duplicate. Clamping
 *      comes first so two over-long queries that share a prefix cannot both
 *      survive as identical strings.
 *
 * @param {string} prompt - User prompt, possibly containing URLs.
 * @returns {string[]} Distinct queries, each at most MAX_QUERY_LENGTH
 *   characters; empty when no content words remain.
 */
function generateSearchQueries(prompt) {
  const stopWords = /* @__PURE__ */ new Set([
    "the", "a", "an", "is", "are", "was", "were", "be", "been", "being",
    "have", "has", "had", "do", "does", "did", "will", "would", "could",
    "should", "may", "might", "can", "shall", "to", "of", "in", "for",
    "on", "with", "at", "by", "from", "as", "into", "through", "and",
    "but", "or", "not", "so", "yet", "find", "get", "search", "look",
    "show", "me", "i", "we", "you", "they", "it", "this", "that",
    "my", "your", "our", "their", "all", "each", "every", "some",
    "any", "also", "about", "up", "out", "if", "then", "than",
    "too", "very", "just", "please", "need", "want"
  ]);

  // Shortens a query to the length limit, backing up to the previous word
  // boundary so the last term is never a partial token.
  const clampQuery = (query) => {
    if (query.length <= MAX_QUERY_LENGTH) return query;
    const head = query.slice(0, MAX_QUERY_LENGTH);
    if (query[MAX_QUERY_LENGTH] === " ") return head; // cut fell exactly between words
    const lastSpace = head.lastIndexOf(" ");
    return lastSpace > 0 ? head.slice(0, lastSpace) : head;
  };

  const urlFree = prompt.replace(/https?:\/\/[^\s]+/gi, "").trim();
  if (!urlFree) return [];

  const words = urlFree
    .replace(/[?!.,;:'"()\[\]{}]/g, " ")
    .split(/\s+/)
    .filter(Boolean);
  const contentWords = words.filter((w) => w.length > 1 && !stopWords.has(w.toLowerCase()));
  if (contentWords.length === 0) return [];

  const queries = [contentWords.join(" ")];

  if (contentWords.length >= 4) {
    const half = Math.ceil(contentWords.length / 2);
    queries.push(contentWords.slice(0, half).join(" "));
    queries.push(contentWords.slice(half).join(" "));
  }

  if (contentWords.length >= 3) {
    const bigrams = [];
    for (let i = 0; i < contentWords.length - 1 && bigrams.length < 3; i++) {
      bigrams.push(`${contentWords[i]} ${contentWords[i + 1]}`);
    }
    if (bigrams.length > 0) {
      queries.push(bigrams.join(" "));
    }
  }

  // Key terms: longer words, or words whose first character is unchanged by
  // upper-casing (capitalised words, but also digits and symbols).
  const keyTerms = contentWords.filter(
    (w) => w.length > 4 || w[0] === w[0].toUpperCase()
  );
  if (keyTerms.length >= 2) {
    queries.push(keyTerms.slice(0, 5).join(" "));
  }

  const unique = [...new Set(queries.map(clampQuery))];
  return unique.slice(0, MAX_SEARCH_QUERIES);
}
|
|
264
|
+
/**
 * Concatenates two URL lists and removes exact-string duplicates, keeping the
 * first occurrence of each (planner-provided URLs come before explicit ones).
 *
 * @param {string[]} samplingUrls - URLs produced by the planner.
 * @param {string[]} explicitUrls - URLs supplied by the caller.
 * @returns {string[]} De-duplicated URLs in first-seen order.
 */
function mergeUrls(samplingUrls, explicitUrls) {
  const seen = new Set();
  for (const url of samplingUrls) {
    seen.add(url);
  }
  for (const url of explicitUrls) {
    seen.add(url);
  }
  return Array.from(seen);
}
|
|
268
|
+
export {
|
|
269
|
+
planExecution
|
|
270
|
+
};
|
|
271
|
+
//# sourceMappingURL=planner.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../src/agent/planner.ts"],"sourcesContent":["import { createLogger } from '../logger.js';\nimport {\n type SamplingCapableServer,\n requestSampling,\n checkSamplingSupport,\n} from '../search/sampling.js';\nimport { preFilterCandidates } from './relevance.js';\n\nconst log = createLogger('agent');\n\nconst MAX_SEARCH_QUERIES = 5;\nconst MAX_QUERY_LENGTH = 250;\n\nexport interface AgentPlan {\n searches: string[];\n urls: string[];\n notes: string;\n samplingUsed: boolean;\n excluded_urls?: { url: string; reason: 'invalid_url' | 'blocklisted_domain' }[];\n}\n\nfunction applyUrlFilter(urls: string[]): {\n kept: string[];\n excluded: { url: string; reason: 'invalid_url' | 'blocklisted_domain' }[];\n} {\n const filtered = preFilterCandidates(urls.map((url) => ({ url })));\n const kept = filtered.kept.map((k) => k.url);\n const excluded = filtered.excluded.map((e) => ({ url: e.item.url, reason: e.reason }));\n if (excluded.length > 0) {\n log.info('agent pre-filter', { kept: kept.length, excluded: excluded.length });\n }\n return { kept, excluded };\n}\n\nexport async function planExecution(\n prompt: string,\n urls?: string[],\n server?: SamplingCapableServer,\n): Promise<AgentPlan> {\n const trimmedPrompt = prompt.trim();\n\n if (!trimmedPrompt) {\n const { kept, excluded } = applyUrlFilter(urls ?? []);\n return {\n searches: [],\n urls: kept,\n notes: 'Empty prompt provided',\n samplingUsed: false,\n excluded_urls: excluded,\n };\n }\n\n if (server) {\n try {\n const samplingResult = await planWithSampling(trimmedPrompt, server);\n if (samplingResult) {\n const mergedUrls = mergeUrls(samplingResult.urls, urls ?? []);\n const { kept, excluded } = applyUrlFilter(mergedUrls);\n return {\n searches: samplingResult.searches,\n urls: kept,\n notes: samplingResult.notes,\n samplingUsed: true,\n excluded_urls: excluded,\n };\n }\n } catch (err) {\n log.warn('sampling planning failed, using fallback', {\n error: err instanceof Error ? 
err.message : String(err),\n });\n }\n }\n\n const fallback = planWithFallback(trimmedPrompt);\n const mergedUrls = mergeUrls(fallback.urls, urls ?? []);\n const { kept, excluded } = applyUrlFilter(mergedUrls);\n\n return {\n searches: fallback.searches,\n urls: kept,\n notes: fallback.notes,\n samplingUsed: false,\n excluded_urls: excluded,\n };\n}\n\nasync function planWithSampling(\n prompt: string,\n server: SamplingCapableServer,\n): Promise<{ searches: string[]; urls: string[]; notes: string } | null> {\n try {\n if (!checkSamplingSupport(server)) {\n log.debug('client does not support sampling for planning');\n return null;\n }\n\n const samplingPrompt = `You are a data gathering assistant. Given the user's prompt, create an execution plan.\n\nReturn a JSON object with:\n- \"searches\": array of 1-5 search engine queries to find the needed data\n- \"urls\": array of specific URLs to visit (if any are obvious from the prompt)\n- \"notes\": brief string with any relevant observations\n\nPrompt: ${prompt}\n\nRespond with ONLY valid JSON: {\"searches\": [...], \"urls\": [...], \"notes\": \"...\"}`;\n\n const response = await requestSampling(\n server,\n [{ role: 'user', content: { type: 'text', text: samplingPrompt } }],\n 500,\n );\n\n if (!response?.content?.text) {\n log.debug('sampling returned empty response for planning');\n return null;\n }\n\n const text = response.content.text.trim();\n let parsed: unknown;\n try {\n parsed = JSON.parse(text);\n } catch {\n const jsonMatch = text.match(/\\{[\\s\\S]*\\}/);\n if (jsonMatch) {\n try {\n parsed = JSON.parse(jsonMatch[0]);\n } catch {\n log.debug('could not extract JSON from sampling plan response');\n return null;\n }\n } else {\n return null;\n }\n }\n\n if (typeof parsed !== 'object' || parsed === null) return null;\n\n const obj = parsed as Record<string, unknown>;\n const searches = Array.isArray(obj.searches)\n ? 
obj.searches.filter((s): s is string => typeof s === 'string' && s.trim().length > 0).map((s) => s.trim())\n : [];\n const extractedUrls = Array.isArray(obj.urls)\n ? obj.urls.filter((u): u is string => typeof u === 'string' && isValidUrl(u))\n : [];\n const notes = typeof obj.notes === 'string' ? obj.notes : '';\n\n if (searches.length === 0 && extractedUrls.length === 0) {\n log.debug('sampling plan had no searches or URLs');\n return null;\n }\n\n return { searches: searches.slice(0, MAX_SEARCH_QUERIES), urls: extractedUrls, notes };\n } catch (err) {\n log.debug('sampling planning request failed', {\n error: err instanceof Error ? err.message : String(err),\n });\n return null;\n }\n}\n\nfunction planWithFallback(prompt: string): { searches: string[]; urls: string[]; notes: string } {\n const extractedUrls = extractUrlsFromText(prompt);\n const searches = generateSearchQueries(prompt);\n\n return {\n searches,\n urls: extractedUrls,\n notes: 'Fallback plan from keyword extraction',\n };\n}\n\nfunction extractUrlsFromText(text: string): string[] {\n const urlRegex = /https?:\\/\\/[^\\s,;\"')\\]]+/gi;\n const matches = text.match(urlRegex) ?? 
[];\n const cleaned = matches.map((url) => url.replace(/[.,;:!?)]+$/, ''));\n return [...new Set(cleaned)].filter(isValidUrl);\n}\n\nfunction isValidUrl(url: string): boolean {\n try {\n new URL(url);\n return true;\n } catch {\n return false;\n }\n}\n\nfunction generateSearchQueries(prompt: string): string[] {\n const stopWords = new Set([\n 'the', 'a', 'an', 'is', 'are', 'was', 'were', 'be', 'been', 'being',\n 'have', 'has', 'had', 'do', 'does', 'did', 'will', 'would', 'could',\n 'should', 'may', 'might', 'can', 'shall', 'to', 'of', 'in', 'for',\n 'on', 'with', 'at', 'by', 'from', 'as', 'into', 'through', 'and',\n 'but', 'or', 'not', 'so', 'yet', 'find', 'get', 'search', 'look',\n 'show', 'me', 'i', 'we', 'you', 'they', 'it', 'this', 'that',\n 'my', 'your', 'our', 'their', 'all', 'each', 'every', 'some',\n 'any', 'also', 'about', 'up', 'out', 'if', 'then', 'than',\n 'too', 'very', 'just', 'please', 'need', 'want',\n ]);\n\n const urlFree = prompt.replace(/https?:\\/\\/[^\\s]+/g, '').trim();\n if (!urlFree) return [];\n\n const words = urlFree\n .replace(/[?!.,;:'\"()\\[\\]{}]/g, ' ')\n .split(/\\s+/)\n .filter(Boolean);\n\n const contentWords = words.filter((w) => !stopWords.has(w.toLowerCase()) && w.length > 1);\n\n if (contentWords.length === 0) return [];\n\n const queries: string[] = [];\n\n const fullQuery = contentWords.join(' ');\n if (fullQuery.length <= MAX_QUERY_LENGTH) {\n queries.push(fullQuery);\n } else {\n queries.push(fullQuery.slice(0, MAX_QUERY_LENGTH));\n }\n\n if (contentWords.length >= 4) {\n const half = Math.ceil(contentWords.length / 2);\n queries.push(contentWords.slice(0, half).join(' '));\n }\n\n if (contentWords.length >= 4) {\n const half = Math.ceil(contentWords.length / 2);\n queries.push(contentWords.slice(half).join(' '));\n }\n\n if (contentWords.length >= 3) {\n const bigrams: string[] = [];\n for (let i = 0; i < contentWords.length - 1 && bigrams.length < 3; i++) {\n bigrams.push(`${contentWords[i]} ${contentWords[i + 1]}`);\n 
}\n if (bigrams.length > 0) {\n queries.push(bigrams.join(' '));\n }\n }\n\n const keyTerms = contentWords.filter(\n (w) => w.length > 4 || w[0] === w[0].toUpperCase(),\n );\n if (keyTerms.length >= 2) {\n queries.push(keyTerms.slice(0, 5).join(' '));\n }\n\n const unique = [...new Set(queries)].map((q) =>\n q.length > MAX_QUERY_LENGTH ? q.slice(0, MAX_QUERY_LENGTH) : q,\n );\n return unique.slice(0, MAX_SEARCH_QUERIES);\n}\n\nfunction mergeUrls(samplingUrls: string[], explicitUrls: string[]): string[] {\n const all = [...samplingUrls, ...explicitUrls];\n return [...new Set(all)];\n}\n"],"mappings":"AAAA,SAAS,oBAAoB;AAC7B;AAAA,EAEE;AAAA,EACA;AAAA,OACK;AACP,SAAS,2BAA2B;AAEpC,MAAM,MAAM,aAAa,OAAO;AAEhC,MAAM,qBAAqB;AAC3B,MAAM,mBAAmB;AAUzB,SAAS,eAAe,MAGtB;AACA,QAAM,WAAW,oBAAoB,KAAK,IAAI,CAAC,SAAS,EAAE,IAAI,EAAE,CAAC;AACjE,QAAM,OAAO,SAAS,KAAK,IAAI,CAAC,MAAM,EAAE,GAAG;AAC3C,QAAM,WAAW,SAAS,SAAS,IAAI,CAAC,OAAO,EAAE,KAAK,EAAE,KAAK,KAAK,QAAQ,EAAE,OAAO,EAAE;AACrF,MAAI,SAAS,SAAS,GAAG;AACvB,QAAI,KAAK,oBAAoB,EAAE,MAAM,KAAK,QAAQ,UAAU,SAAS,OAAO,CAAC;AAAA,EAC/E;AACA,SAAO,EAAE,MAAM,SAAS;AAC1B;AAEA,eAAsB,cACpB,QACA,MACA,QACoB;AACpB,QAAM,gBAAgB,OAAO,KAAK;AAElC,MAAI,CAAC,eAAe;AAClB,UAAM,EAAE,MAAAA,OAAM,UAAAC,UAAS,IAAI,eAAe,QAAQ,CAAC,CAAC;AACpD,WAAO;AAAA,MACL,UAAU,CAAC;AAAA,MACX,MAAMD;AAAA,MACN,OAAO;AAAA,MACP,cAAc;AAAA,MACd,eAAeC;AAAA,IACjB;AAAA,EACF;AAEA,MAAI,QAAQ;AACV,QAAI;AACF,YAAM,iBAAiB,MAAM,iBAAiB,eAAe,MAAM;AACnE,UAAI,gBAAgB;AAClB,cAAMC,cAAa,UAAU,eAAe,MAAM,QAAQ,CAAC,CAAC;AAC5D,cAAM,EAAE,MAAAF,OAAM,UAAAC,UAAS,IAAI,eAAeC,WAAU;AACpD,eAAO;AAAA,UACL,UAAU,eAAe;AAAA,UACzB,MAAMF;AAAA,UACN,OAAO,eAAe;AAAA,UACtB,cAAc;AAAA,UACd,eAAeC;AAAA,QACjB;AAAA,MACF;AAAA,IACF,SAAS,KAAK;AACZ,UAAI,KAAK,4CAA4C;AAAA,QACnD,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,MACxD,CAAC;AAAA,IACH;AAAA,EACF;AAEA,QAAM,WAAW,iBAAiB,aAAa;AAC/C,QAAM,aAAa,UAAU,SAAS,MAAM,QAAQ,CAAC,CAAC;AACtD,QAAM,EAAE,MAAM,SAAS,IAAI,eAAe,UAAU;AAEpD,SAAO;AAAA,IACL,UAAU,SAAS;AAAA,IACnB,MAAM;AAAA,IACN,OAAO,SAAS;AAAA,IAChB,cAAc;AAAA,IACd,eAAe;AAAA,EACjB
;AACF;AAEA,eAAe,iBACb,QACA,QACuE;AACvE,MAAI;AACF,QAAI,CAAC,qBAAqB,MAAM,GAAG;AACjC,UAAI,MAAM,+CAA+C;AACzD,aAAO;AAAA,IACT;AAEA,UAAM,iBAAiB;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA,UAOjB,MAAM;AAAA;AAAA;AAIZ,UAAM,WAAW,MAAM;AAAA,MACrB;AAAA,MACA,CAAC,EAAE,MAAM,QAAQ,SAAS,EAAE,MAAM,QAAQ,MAAM,eAAe,EAAE,CAAC;AAAA,MAClE;AAAA,IACF;AAEA,QAAI,CAAC,UAAU,SAAS,MAAM;AAC5B,UAAI,MAAM,+CAA+C;AACzD,aAAO;AAAA,IACT;AAEA,UAAM,OAAO,SAAS,QAAQ,KAAK,KAAK;AACxC,QAAI;AACJ,QAAI;AACF,eAAS,KAAK,MAAM,IAAI;AAAA,IAC1B,QAAQ;AACN,YAAM,YAAY,KAAK,MAAM,aAAa;AAC1C,UAAI,WAAW;AACb,YAAI;AACF,mBAAS,KAAK,MAAM,UAAU,CAAC,CAAC;AAAA,QAClC,QAAQ;AACN,cAAI,MAAM,oDAAoD;AAC9D,iBAAO;AAAA,QACT;AAAA,MACF,OAAO;AACL,eAAO;AAAA,MACT;AAAA,IACF;AAEA,QAAI,OAAO,WAAW,YAAY,WAAW,KAAM,QAAO;AAE1D,UAAM,MAAM;AACZ,UAAM,WAAW,MAAM,QAAQ,IAAI,QAAQ,IACvC,IAAI,SAAS,OAAO,CAAC,MAAmB,OAAO,MAAM,YAAY,EAAE,KAAK,EAAE,SAAS,CAAC,EAAE,IAAI,CAAC,MAAM,EAAE,KAAK,CAAC,IACzG,CAAC;AACL,UAAM,gBAAgB,MAAM,QAAQ,IAAI,IAAI,IACxC,IAAI,KAAK,OAAO,CAAC,MAAmB,OAAO,MAAM,YAAY,WAAW,CAAC,CAAC,IAC1E,CAAC;AACL,UAAM,QAAQ,OAAO,IAAI,UAAU,WAAW,IAAI,QAAQ;AAE1D,QAAI,SAAS,WAAW,KAAK,cAAc,WAAW,GAAG;AACvD,UAAI,MAAM,uCAAuC;AACjD,aAAO;AAAA,IACT;AAEA,WAAO,EAAE,UAAU,SAAS,MAAM,GAAG,kBAAkB,GAAG,MAAM,eAAe,MAAM;AAAA,EACvF,SAAS,KAAK;AACZ,QAAI,MAAM,oCAAoC;AAAA,MAC5C,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,IACxD,CAAC;AACD,WAAO;AAAA,EACT;AACF;AAEA,SAAS,iBAAiB,QAAuE;AAC/F,QAAM,gBAAgB,oBAAoB,MAAM;AAChD,QAAM,WAAW,sBAAsB,MAAM;AAE7C,SAAO;AAAA,IACL;AAAA,IACA,MAAM;AAAA,IACN,OAAO;AAAA,EACT;AACF;AAEA,SAAS,oBAAoB,MAAwB;AACnD,QAAM,WAAW;AACjB,QAAM,UAAU,KAAK,MAAM,QAAQ,KAAK,CAAC;AACzC,QAAM,UAAU,QAAQ,IAAI,CAAC,QAAQ,IAAI,QAAQ,eAAe,EAAE,CAAC;AACnE,SAAO,CAAC,GAAG,IAAI,IAAI,OAAO,CAAC,EAAE,OAAO,UAAU;AAChD;AAEA,SAAS,WAAW,KAAsB;AACxC,MAAI;AACF,QAAI,IAAI,GAAG;AACX,WAAO;AAAA,EACT,QAAQ;AACN,WAAO;AAAA,EACT;AACF;AAEA,SAAS,sBAAsB,QAA0B;AACvD,QAAM,YAAY,oBAAI,IAAI;AAAA,IACxB;AAAA,IAAO;AAAA,IAAK;AAAA,IAAM;AAAA,IAAM;AAAA,IAAO;AAAA,IAAO;AAAA,IAAQ;AAAA,IAAM;AAAA,IAAQ;AAAA,IAC5D;AAAA,IAAQ;AAAA,IAAO;AAAA,IAAO;AAAA,IAAM;AAAA,IAAQ;AAAA,IAAO;AA
AA,IAAQ;AAAA,IAAS;AAAA,IAC5D;AAAA,IAAU;AAAA,IAAO;AAAA,IAAS;AAAA,IAAO;AAAA,IAAS;AAAA,IAAM;AAAA,IAAM;AAAA,IAAM;AAAA,IAC5D;AAAA,IAAM;AAAA,IAAQ;AAAA,IAAM;AAAA,IAAM;AAAA,IAAQ;AAAA,IAAM;AAAA,IAAQ;AAAA,IAAW;AAAA,IAC3D;AAAA,IAAO;AAAA,IAAM;AAAA,IAAO;AAAA,IAAM;AAAA,IAAO;AAAA,IAAQ;AAAA,IAAO;AAAA,IAAU;AAAA,IAC1D;AAAA,IAAQ;AAAA,IAAM;AAAA,IAAK;AAAA,IAAM;AAAA,IAAO;AAAA,IAAQ;AAAA,IAAM;AAAA,IAAQ;AAAA,IACtD;AAAA,IAAM;AAAA,IAAQ;AAAA,IAAO;AAAA,IAAS;AAAA,IAAO;AAAA,IAAQ;AAAA,IAAS;AAAA,IACtD;AAAA,IAAO;AAAA,IAAQ;AAAA,IAAS;AAAA,IAAM;AAAA,IAAO;AAAA,IAAM;AAAA,IAAQ;AAAA,IACnD;AAAA,IAAO;AAAA,IAAQ;AAAA,IAAQ;AAAA,IAAU;AAAA,IAAQ;AAAA,EAC3C,CAAC;AAED,QAAM,UAAU,OAAO,QAAQ,sBAAsB,EAAE,EAAE,KAAK;AAC9D,MAAI,CAAC,QAAS,QAAO,CAAC;AAEtB,QAAM,QAAQ,QACX,QAAQ,uBAAuB,GAAG,EAClC,MAAM,KAAK,EACX,OAAO,OAAO;AAEjB,QAAM,eAAe,MAAM,OAAO,CAAC,MAAM,CAAC,UAAU,IAAI,EAAE,YAAY,CAAC,KAAK,EAAE,SAAS,CAAC;AAExF,MAAI,aAAa,WAAW,EAAG,QAAO,CAAC;AAEvC,QAAM,UAAoB,CAAC;AAE3B,QAAM,YAAY,aAAa,KAAK,GAAG;AACvC,MAAI,UAAU,UAAU,kBAAkB;AACxC,YAAQ,KAAK,SAAS;AAAA,EACxB,OAAO;AACL,YAAQ,KAAK,UAAU,MAAM,GAAG,gBAAgB,CAAC;AAAA,EACnD;AAEA,MAAI,aAAa,UAAU,GAAG;AAC5B,UAAM,OAAO,KAAK,KAAK,aAAa,SAAS,CAAC;AAC9C,YAAQ,KAAK,aAAa,MAAM,GAAG,IAAI,EAAE,KAAK,GAAG,CAAC;AAAA,EACpD;AAEA,MAAI,aAAa,UAAU,GAAG;AAC5B,UAAM,OAAO,KAAK,KAAK,aAAa,SAAS,CAAC;AAC9C,YAAQ,KAAK,aAAa,MAAM,IAAI,EAAE,KAAK,GAAG,CAAC;AAAA,EACjD;AAEA,MAAI,aAAa,UAAU,GAAG;AAC5B,UAAM,UAAoB,CAAC;AAC3B,aAAS,IAAI,GAAG,IAAI,aAAa,SAAS,KAAK,QAAQ,SAAS,GAAG,KAAK;AACtE,cAAQ,KAAK,GAAG,aAAa,CAAC,CAAC,IAAI,aAAa,IAAI,CAAC,CAAC,EAAE;AAAA,IAC1D;AACA,QAAI,QAAQ,SAAS,GAAG;AACtB,cAAQ,KAAK,QAAQ,KAAK,GAAG,CAAC;AAAA,IAChC;AAAA,EACF;AAEA,QAAM,WAAW,aAAa;AAAA,IAC5B,CAAC,MAAM,EAAE,SAAS,KAAK,EAAE,CAAC,MAAM,EAAE,CAAC,EAAE,YAAY;AAAA,EACnD;AACA,MAAI,SAAS,UAAU,GAAG;AACxB,YAAQ,KAAK,SAAS,MAAM,GAAG,CAAC,EAAE,KAAK,GAAG,CAAC;AAAA,EAC7C;AAEA,QAAM,SAAS,CAAC,GAAG,IAAI,IAAI,OAAO,CAAC,EAAE;AAAA,IAAI,CAAC,MACxC,EAAE,SAAS,mBAAmB,EAAE,MAAM,GAAG,gBAAgB,IAAI;AAAA,EAC/D;AACA,SAAO,OAAO,MAAM,GAAG,kBAAkB;AAC3C;AAEA,SAAS,UAAU,cAAwB,cAAkC;AAC3E,QAAM,MAAM,CAAC,GAAG,
cAAc,GAAG,YAAY;AAC7C,SAAO,CAAC,GAAG,IAAI,IAAI,GAAG,CAAC;AACzB;","names":["kept","excluded","mergedUrls"]}
|
|
@@ -0,0 +1,15 @@
|
|
|
1
|
+
/**
 * Returns true when `u` parses as an `http:` or `https:` URL that is not
 * one of the rejected redirect forms: a `duckduckgo.com` path starting with
 * `/l/`, or any URL on `r.jina.ai`. Input that cannot be parsed yields false.
 */
export declare function isValidCandidateUrl(u: string): boolean;
|
|
2
|
+
/**
 * Returns true when the host of `u` is a blocklisted domain or a subdomain of
 * one. Input that cannot be parsed as a URL is also reported as blocklisted.
 */
export declare function isBlocklistedDomain(u: string): boolean;
|
|
3
|
+
/**
 * Outcome of preFilterCandidates: the items that passed (`kept`) and, for
 * every rejected item, the item itself paired with the reason it was dropped.
 */
export interface PreFilterResult<T extends {
|
|
4
|
+
url: string;
|
|
5
|
+
}> {
|
|
6
|
+
kept: T[];
|
|
7
|
+
excluded: {
|
|
8
|
+
item: T;
|
|
9
|
+
reason: 'invalid_url' | 'blocklisted_domain';
|
|
10
|
+
}[];
|
|
11
|
+
}
|
|
12
|
+
/**
 * Partitions `items` by their `url`: items failing isValidCandidateUrl are
 * excluded as 'invalid_url', items matching isBlocklistedDomain are excluded
 * as 'blocklisted_domain', and the rest are kept in input order. The validity
 * check runs first, so an item failing both is tagged 'invalid_url'.
 */
export declare function preFilterCandidates<T extends {
|
|
13
|
+
url: string;
|
|
14
|
+
}>(items: T[]): PreFilterResult<T>;
|
|
15
|
+
//# sourceMappingURL=relevance.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"relevance.d.ts","sourceRoot":"","sources":["../../src/agent/relevance.ts"],"names":[],"mappings":"AAeA,wBAAgB,mBAAmB,CAAC,CAAC,EAAE,MAAM,GAAG,OAAO,CAYtD;AAED,wBAAgB,mBAAmB,CAAC,CAAC,EAAE,MAAM,GAAG,OAAO,CAWtD;AAED,MAAM,WAAW,eAAe,CAAC,CAAC,SAAS;IAAE,GAAG,EAAE,MAAM,CAAA;CAAE;IACxD,IAAI,EAAE,CAAC,EAAE,CAAC;IACV,QAAQ,EAAE;QAAE,IAAI,EAAE,CAAC,CAAC;QAAC,MAAM,EAAE,aAAa,GAAG,oBAAoB,CAAA;KAAE,EAAE,CAAC;CACvE;AAED,wBAAgB,mBAAmB,CAAC,CAAC,SAAS;IAAE,GAAG,EAAE,MAAM,CAAA;CAAE,EAAE,KAAK,EAAE,CAAC,EAAE,GAAG,eAAe,CAAC,CAAC,CAAC,CAe7F"}
|
|
@@ -0,0 +1,60 @@
|
|
|
1
|
+
/**
 * Domains whose pages are never kept as candidates. Subdomains are matched by
 * suffix in isBlocklistedDomain, so "baidu.com" already covers the explicit
 * *.baidu.com entries; they are retained unchanged.
 */
const BLOCKLIST = /* @__PURE__ */ new Set([
  "elitepvpers.com",
  "zhihu.com",
  "baidu.com",
  "zhidao.baidu.com",
  "jingyan.baidu.com",
  "wenku.baidu.com",
  "tieba.baidu.com"
]);

/** Hosts that receive the extra redirect checks in isValidCandidateUrl. */
const REDIRECT_HOSTS = /* @__PURE__ */ new Set([
  "duckduckgo.com",
  "r.jina.ai"
]);

/**
 * Canonical host of a parsed URL for set lookups: lower-cased, with a single
 * trailing root dot removed. The URL parser keeps that dot ("baidu.com."),
 * which would otherwise let a fully-qualified host slip past both filters.
 */
function canonicalHost(parsed) {
  return parsed.hostname.toLowerCase().replace(/\.$/, "");
}

/**
 * Decides whether `u` is usable as a candidate URL.
 *
 * @param u Raw URL string.
 * @returns false when `u` does not parse, is not http(s), is a
 *   `duckduckgo.com` path under `/l/`, or is hosted on `r.jina.ai`;
 *   true otherwise.
 */
function isValidCandidateUrl(u) {
  let parsed;
  try {
    parsed = new URL(u);
  } catch {
    return false;
  }
  if (parsed.protocol !== "http:" && parsed.protocol !== "https:") return false;

  const host = canonicalHost(parsed);
  if (!REDIRECT_HOSTS.has(host)) return true;
  if (host === "r.jina.ai") return false;
  // duckduckgo.com itself is acceptable; only its /l/ paths are rejected.
  return !(host === "duckduckgo.com" && parsed.pathname.startsWith("/l/"));
}

/**
 * Reports whether the host of `u` is a blocklisted domain or a subdomain of
 * one.
 *
 * @param u Raw URL string.
 * @returns true for blocklisted hosts and for input that cannot be parsed
 *   (unparseable input is treated as blocked); false otherwise.
 */
function isBlocklistedDomain(u) {
  let host;
  try {
    host = canonicalHost(new URL(u));
  } catch {
    return true;
  }
  if (BLOCKLIST.has(host)) return true;
  for (const dom of BLOCKLIST) {
    // The leading dot keeps "notbaidu.com" from matching "baidu.com".
    if (host.endsWith(`.${dom}`)) return true;
  }
  return false;
}

/**
 * Partitions `items` by their `url` into kept and excluded entries.
 *
 * @param items Objects carrying a `url` string.
 * @returns `{ kept, excluded }`; each excluded entry is
 *   `{ item, reason }` with reason "invalid_url" or "blocklisted_domain".
 *   Validity is checked first, so it wins when both would apply.
 */
function preFilterCandidates(items) {
  const kept = [];
  const excluded = [];
  for (const it of items) {
    if (!isValidCandidateUrl(it.url)) {
      excluded.push({ item: it, reason: "invalid_url" });
    } else if (isBlocklistedDomain(it.url)) {
      excluded.push({ item: it, reason: "blocklisted_domain" });
    } else {
      kept.push(it);
    }
  }
  return { kept, excluded };
}
|
|
55
|
+
export {
|
|
56
|
+
isBlocklistedDomain,
|
|
57
|
+
isValidCandidateUrl,
|
|
58
|
+
preFilterCandidates
|
|
59
|
+
};
|
|
60
|
+
//# sourceMappingURL=relevance.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../src/agent/relevance.ts"],"sourcesContent":["const BLOCKLIST: ReadonlySet<string> = new Set([\n 'elitepvpers.com',\n 'zhihu.com',\n 'baidu.com',\n 'zhidao.baidu.com',\n 'jingyan.baidu.com',\n 'wenku.baidu.com',\n 'tieba.baidu.com',\n]);\n\nconst REDIRECT_HOSTS: ReadonlySet<string> = new Set([\n 'duckduckgo.com',\n 'r.jina.ai',\n]);\n\nexport function isValidCandidateUrl(u: string): boolean {\n try {\n const parsed = new URL(u);\n if (!['http:', 'https:'].includes(parsed.protocol)) return false;\n if (REDIRECT_HOSTS.has(parsed.hostname)) {\n if (parsed.hostname === 'duckduckgo.com' && parsed.pathname.startsWith('/l/')) return false;\n if (parsed.hostname === 'r.jina.ai') return false;\n }\n return true;\n } catch {\n return false;\n }\n}\n\nexport function isBlocklistedDomain(u: string): boolean {\n try {\n const host = new URL(u).hostname.toLowerCase();\n if (BLOCKLIST.has(host)) return true;\n for (const dom of BLOCKLIST) {\n if (host.endsWith(`.${dom}`)) return true;\n }\n return false;\n } catch {\n return true;\n }\n}\n\nexport interface PreFilterResult<T extends { url: string }> {\n kept: T[];\n excluded: { item: T; reason: 'invalid_url' | 'blocklisted_domain' }[];\n}\n\nexport function preFilterCandidates<T extends { url: string }>(items: T[]): PreFilterResult<T> {\n const kept: T[] = [];\n const excluded: PreFilterResult<T>['excluded'] = [];\n for (const it of items) {\n if (!isValidCandidateUrl(it.url)) {\n excluded.push({ item: it, reason: 'invalid_url' });\n continue;\n }\n if (isBlocklistedDomain(it.url)) {\n excluded.push({ item: it, reason: 'blocklisted_domain' });\n continue;\n }\n kept.push(it);\n }\n return { kept, excluded 
};\n}\n"],"mappings":"AAAA,MAAM,YAAiC,oBAAI,IAAI;AAAA,EAC7C;AAAA,EACA;AAAA,EACA;AAAA,EACA;AAAA,EACA;AAAA,EACA;AAAA,EACA;AACF,CAAC;AAED,MAAM,iBAAsC,oBAAI,IAAI;AAAA,EAClD;AAAA,EACA;AACF,CAAC;AAEM,SAAS,oBAAoB,GAAoB;AACtD,MAAI;AACF,UAAM,SAAS,IAAI,IAAI,CAAC;AACxB,QAAI,CAAC,CAAC,SAAS,QAAQ,EAAE,SAAS,OAAO,QAAQ,EAAG,QAAO;AAC3D,QAAI,eAAe,IAAI,OAAO,QAAQ,GAAG;AACvC,UAAI,OAAO,aAAa,oBAAoB,OAAO,SAAS,WAAW,KAAK,EAAG,QAAO;AACtF,UAAI,OAAO,aAAa,YAAa,QAAO;AAAA,IAC9C;AACA,WAAO;AAAA,EACT,QAAQ;AACN,WAAO;AAAA,EACT;AACF;AAEO,SAAS,oBAAoB,GAAoB;AACtD,MAAI;AACF,UAAM,OAAO,IAAI,IAAI,CAAC,EAAE,SAAS,YAAY;AAC7C,QAAI,UAAU,IAAI,IAAI,EAAG,QAAO;AAChC,eAAW,OAAO,WAAW;AAC3B,UAAI,KAAK,SAAS,IAAI,GAAG,EAAE,EAAG,QAAO;AAAA,IACvC;AACA,WAAO;AAAA,EACT,QAAQ;AACN,WAAO;AAAA,EACT;AACF;AAOO,SAAS,oBAA+C,OAAgC;AAC7F,QAAM,OAAY,CAAC;AACnB,QAAM,WAA2C,CAAC;AAClD,aAAW,MAAM,OAAO;AACtB,QAAI,CAAC,oBAAoB,GAAG,GAAG,GAAG;AAChC,eAAS,KAAK,EAAE,MAAM,IAAI,QAAQ,cAAc,CAAC;AACjD;AAAA,IACF;AACA,QAAI,oBAAoB,GAAG,GAAG,GAAG;AAC/B,eAAS,KAAK,EAAE,MAAM,IAAI,QAAQ,qBAAqB,CAAC;AACxD;AAAA,IACF;AACA,SAAK,KAAK,EAAE;AAAA,EACd;AACA,SAAO,EAAE,MAAM,SAAS;AAC1B;","names":[]}
|
|
@@ -0,0 +1,23 @@
|
|
|
1
|
+
/**
 * Options for backfillEmbeddings.
 * - dataDir: directory that contains the `wigolo.db` database file.
 * - limit: when a positive number, at most this many pending rows are processed.
 * - batchSize: rows passed to the embed provider per call (defaults to 32).
 * - dryRun: when true, embeddings are computed but nothing is upserted
 *   (defaults to false).
 * - onProgress: invoked after each batch with the number of rows processed so
 *   far and the total number of rows selected.
 */
export interface BackfillOptions {
|
|
2
|
+
dataDir: string;
|
|
3
|
+
limit?: number;
|
|
4
|
+
batchSize?: number;
|
|
5
|
+
dryRun?: boolean;
|
|
6
|
+
onProgress?: (done: number, total: number) => void;
|
|
7
|
+
}
|
|
8
|
+
/**
 * Counters reported by backfillEmbeddings.
 * - scanned: pending rows selected (after `limit` is applied).
 * - embedded: rows whose batch completed without throwing (dry runs included).
 * - skipped: rows with neither a non-blank title nor non-blank markdown.
 * - errors: rows belonging to batches that threw.
 * - modelId: the embed provider's model id, or '' when the run was skipped.
 * - reason: present only when the run was skipped, explaining why.
 */
export interface BackfillResult {
|
|
9
|
+
scanned: number;
|
|
10
|
+
embedded: number;
|
|
11
|
+
skipped: number;
|
|
12
|
+
errors: number;
|
|
13
|
+
modelId: string;
|
|
14
|
+
reason?: string;
|
|
15
|
+
}
|
|
16
|
+
/**
|
|
17
|
+
* Walk url_cache rows that have no corresponding vec_id_map entry, embed
|
|
18
|
+
* title + a snippet of markdown, and upsert into the vector store. Used to
|
|
19
|
+
* recover pages cached before the sqlite-vec switch — find_similar's
|
|
20
|
+
* embedding path skips them otherwise.
*
* If the sqlite-vec extension is not loaded, or the embed provider / vector
* store cannot be obtained, resolves with zeroed counters and `reason` set.
* With `dryRun`, embeddings are still computed but nothing is upserted.
|
|
21
|
+
*/
|
|
22
|
+
export declare function backfillEmbeddings(opts: BackfillOptions): Promise<BackfillResult>;
|
|
23
|
+
//# sourceMappingURL=backfill-embeddings.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"backfill-embeddings.d.ts","sourceRoot":"","sources":["../../src/cache/backfill-embeddings.ts"],"names":[],"mappings":"AAQA,MAAM,WAAW,eAAe;IAC9B,OAAO,EAAE,MAAM,CAAC;IAChB,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,MAAM,CAAC,EAAE,OAAO,CAAC;IACjB,UAAU,CAAC,EAAE,CAAC,IAAI,EAAE,MAAM,EAAE,KAAK,EAAE,MAAM,KAAK,IAAI,CAAC;CACpD;AAED,MAAM,WAAW,cAAc;IAC7B,OAAO,EAAE,MAAM,CAAC;IAChB,QAAQ,EAAE,MAAM,CAAC;IACjB,OAAO,EAAE,MAAM,CAAC;IAChB,MAAM,EAAE,MAAM,CAAC;IACf,OAAO,EAAE,MAAM,CAAC;IAChB,MAAM,CAAC,EAAE,MAAM,CAAC;CACjB;AAkBD;;;;;GAKG;AACH,wBAAsB,kBAAkB,CAAC,IAAI,EAAE,eAAe,GAAG,OAAO,CAAC,cAAc,CAAC,CA8FvF"}
|
|
@@ -0,0 +1,105 @@
|
|
|
1
|
+
import { join } from "node:path";
|
|
2
|
+
import { createLogger } from "../logger.js";
|
|
3
|
+
import { initDatabase, closeDatabase, isVecExtensionLoaded } from "./db.js";
|
|
4
|
+
import { getEmbedProvider } from "../providers/embed-provider.js";
|
|
5
|
+
import { getVectorStore } from "../providers/vector-store.js";
|
|
6
|
+
const log = createLogger("cache");
|
|
7
|
+
// Selects the url_cache rows whose url has no matching vec_id_map.external_id,
// in ascending url_cache.id order. Only the columns used for embedding
// (url, title, markdown, content_hash) are returned.
const SELECT_PENDING_SQL = `
|
|
8
|
+
SELECT url, title, markdown, content_hash
|
|
9
|
+
FROM url_cache uc
|
|
10
|
+
WHERE NOT EXISTS (
|
|
11
|
+
SELECT 1 FROM vec_id_map vm WHERE vm.external_id = uc.url
|
|
12
|
+
)
|
|
13
|
+
ORDER BY uc.id ASC
|
|
14
|
+
`;
|
|
15
|
+
/** Builds the result returned when the backfill cannot run at all. */
function skippedBackfill(reason) {
  return {
    scanned: 0,
    embedded: 0,
    skipped: 0,
    errors: 0,
    modelId: "",
    reason
  };
}

/**
 * Embeds url_cache rows that have no vec_id_map entry and upserts the
 * resulting vectors into the vector store.
 *
 * @param opts Backfill options: `dataDir` (directory holding `wigolo.db`),
 *   optional `limit` (positive number caps the rows processed), `batchSize`
 *   (default 32), `dryRun` (default false; embeddings are computed but not
 *   upserted) and `onProgress(done, total)` called after every batch.
 * @returns Counters for scanned / embedded / skipped / errored rows plus the
 *   provider's model id. When the sqlite-vec extension is not loaded or the
 *   provider / store cannot be obtained, all counters are zero and `reason`
 *   explains why.
 */
async function backfillEmbeddings(opts) {
  const { dataDir, limit, batchSize = 32, dryRun = false, onProgress } = opts;
  // The batch loop advances by this step; 0, a negative number or NaN would
  // keep it from ever finishing, so fall back to the default in those cases.
  const step = typeof batchSize === "number" && batchSize >= 1 ? Math.floor(batchSize) : 32;

  const db = initDatabase(join(dataDir, "wigolo.db"));
  try {
    if (!isVecExtensionLoaded()) {
      return skippedBackfill("sqlite-vec extension not loaded \u2014 backfill skipped");
    }

    let provider;
    let store;
    try {
      provider = await getEmbedProvider();
      store = await getVectorStore();
    } catch (err) {
      return skippedBackfill(
        `embedding pipeline unavailable: ${err instanceof Error ? err.message : String(err)} \u2014 run \`wigolo warmup --embeddings\` first`
      );
    }

    let rows = db.prepare(SELECT_PENDING_SQL).all();
    if (typeof limit === "number" && limit > 0) {
      rows = rows.slice(0, limit);
    }

    const result = {
      scanned: rows.length,
      embedded: 0,
      skipped: 0,
      errors: 0,
      modelId: provider.modelId
    };

    for (let i = 0; i < rows.length; i += step) {
      const batch = rows.slice(i, i + step);
      // A row is embeddable when it has a non-blank title or non-blank markdown.
      const usable = batch.filter(
        (r) => r.title && r.title.trim().length > 0 || r.markdown && r.markdown.trim().length > 0
      );
      result.skipped += batch.length - usable.length;
      if (usable.length === 0) {
        onProgress?.(i + batch.length, rows.length);
        continue;
      }

      // Embedding input: title, newline, first 500 characters of markdown.
      const texts = usable.map((r) => {
        const title = (r.title ?? "").trim();
        const body = (r.markdown ?? "").slice(0, 500).trim();
        return `${title}\n${body}`.trim();
      });

      try {
        const vectors = await provider.embed(texts);
        if (!dryRun) {
          await store.upsert(
            usable.map((r, idx) => ({
              id: r.url,
              vector: vectors[idx],
              metadata: {
                url: r.url,
                contentHash: r.content_hash ?? "",
                modelId: provider.modelId
              }
            }))
          );
        }
        result.embedded += usable.length;
      } catch (err) {
        // A failed batch is logged and counted; later batches still run.
        log.warn("backfill batch failed", {
          batchStart: i,
          batchSize: usable.length,
          error: err instanceof Error ? err.message : String(err)
        });
        result.errors += usable.length;
      }

      onProgress?.(i + batch.length, rows.length);
    }

    return result;
  } finally {
    closeDatabase();
  }
}
|
|
102
|
+
export {
|
|
103
|
+
backfillEmbeddings
|
|
104
|
+
};
|
|
105
|
+
//# sourceMappingURL=backfill-embeddings.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../src/cache/backfill-embeddings.ts"],"sourcesContent":["import { join } from 'node:path';\nimport { createLogger } from '../logger.js';\nimport { initDatabase, closeDatabase, isVecExtensionLoaded } from './db.js';\nimport { getEmbedProvider } from '../providers/embed-provider.js';\nimport { getVectorStore } from '../providers/vector-store.js';\n\nconst log = createLogger('cache');\n\nexport interface BackfillOptions {\n dataDir: string;\n limit?: number;\n batchSize?: number;\n dryRun?: boolean;\n onProgress?: (done: number, total: number) => void;\n}\n\nexport interface BackfillResult {\n scanned: number;\n embedded: number;\n skipped: number;\n errors: number;\n modelId: string;\n reason?: string;\n}\n\ninterface CacheRow {\n url: string;\n title: string | null;\n markdown: string | null;\n content_hash: string | null;\n}\n\nconst SELECT_PENDING_SQL = `\n SELECT url, title, markdown, content_hash\n FROM url_cache uc\n WHERE NOT EXISTS (\n SELECT 1 FROM vec_id_map vm WHERE vm.external_id = uc.url\n )\n ORDER BY uc.id ASC\n`;\n\n/**\n * Walk url_cache rows that have no corresponding vec_id_map entry, embed\n * title + a snippet of markdown, and upsert into the vector store. 
Used to\n * recover pages cached before the sqlite-vec switch — find_similar's\n * embedding path skips them otherwise.\n */\nexport async function backfillEmbeddings(opts: BackfillOptions): Promise<BackfillResult> {\n const { dataDir, limit, batchSize = 32, dryRun = false, onProgress } = opts;\n\n const db = initDatabase(join(dataDir, 'wigolo.db'));\n try {\n if (!isVecExtensionLoaded()) {\n return {\n scanned: 0,\n embedded: 0,\n skipped: 0,\n errors: 0,\n modelId: '',\n reason: 'sqlite-vec extension not loaded — backfill skipped',\n };\n }\n\n let provider: Awaited<ReturnType<typeof getEmbedProvider>>;\n let store: Awaited<ReturnType<typeof getVectorStore>>;\n try {\n provider = await getEmbedProvider();\n store = await getVectorStore();\n } catch (err) {\n return {\n scanned: 0,\n embedded: 0,\n skipped: 0,\n errors: 0,\n modelId: '',\n reason: `embedding pipeline unavailable: ${err instanceof Error ? err.message : String(err)} — run \\`wigolo warmup --embeddings\\` first`,\n };\n }\n\n let rows = db.prepare(SELECT_PENDING_SQL).all() as CacheRow[];\n if (typeof limit === 'number' && limit > 0) {\n rows = rows.slice(0, limit);\n }\n\n const result: BackfillResult = {\n scanned: rows.length,\n embedded: 0,\n skipped: 0,\n errors: 0,\n modelId: provider.modelId,\n };\n\n for (let i = 0; i < rows.length; i += batchSize) {\n const batch = rows.slice(i, i + batchSize);\n const usable = batch.filter(\n (r) => (r.title && r.title.trim().length > 0) || (r.markdown && r.markdown.trim().length > 0),\n );\n result.skipped += batch.length - usable.length;\n if (usable.length === 0) {\n onProgress?.(i + batch.length, rows.length);\n continue;\n }\n\n const texts = usable.map((r) => {\n const title = (r.title ?? '').trim();\n const body = (r.markdown ?? 
'').slice(0, 500).trim();\n return `${title}\\n${body}`.trim();\n });\n\n try {\n const vectors = await provider.embed(texts);\n if (!dryRun) {\n await store.upsert(\n usable.map((r, idx) => ({\n id: r.url,\n vector: vectors[idx],\n metadata: {\n url: r.url,\n contentHash: r.content_hash ?? '',\n modelId: provider.modelId,\n },\n })),\n );\n }\n result.embedded += usable.length;\n } catch (err) {\n log.warn('backfill batch failed', {\n batchStart: i,\n batchSize: usable.length,\n error: err instanceof Error ? err.message : String(err),\n });\n result.errors += usable.length;\n }\n\n onProgress?.(i + batch.length, rows.length);\n }\n\n return result;\n } finally {\n closeDatabase();\n }\n}\n"],"mappings":"AAAA,SAAS,YAAY;AACrB,SAAS,oBAAoB;AAC7B,SAAS,cAAc,eAAe,4BAA4B;AAClE,SAAS,wBAAwB;AACjC,SAAS,sBAAsB;AAE/B,MAAM,MAAM,aAAa,OAAO;AA0BhC,MAAM,qBAAqB;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAe3B,eAAsB,mBAAmB,MAAgD;AACvF,QAAM,EAAE,SAAS,OAAO,YAAY,IAAI,SAAS,OAAO,WAAW,IAAI;AAEvE,QAAM,KAAK,aAAa,KAAK,SAAS,WAAW,CAAC;AAClD,MAAI;AACF,QAAI,CAAC,qBAAqB,GAAG;AAC3B,aAAO;AAAA,QACL,SAAS;AAAA,QACT,UAAU;AAAA,QACV,SAAS;AAAA,QACT,QAAQ;AAAA,QACR,SAAS;AAAA,QACT,QAAQ;AAAA,MACV;AAAA,IACF;AAEA,QAAI;AACJ,QAAI;AACJ,QAAI;AACF,iBAAW,MAAM,iBAAiB;AAClC,cAAQ,MAAM,eAAe;AAAA,IAC/B,SAAS,KAAK;AACZ,aAAO;AAAA,QACL,SAAS;AAAA,QACT,UAAU;AAAA,QACV,SAAS;AAAA,QACT,QAAQ;AAAA,QACR,SAAS;AAAA,QACT,QAAQ,mCAAmC,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG,CAAC;AAAA,MAC7F;AAAA,IACF;AAEA,QAAI,OAAO,GAAG,QAAQ,kBAAkB,EAAE,IAAI;AAC9C,QAAI,OAAO,UAAU,YAAY,QAAQ,GAAG;AAC1C,aAAO,KAAK,MAAM,GAAG,KAAK;AAAA,IAC5B;AAEA,UAAM,SAAyB;AAAA,MAC7B,SAAS,KAAK;AAAA,MACd,UAAU;AAAA,MACV,SAAS;AAAA,MACT,QAAQ;AAAA,MACR,SAAS,SAAS;AAAA,IACpB;AAEA,aAAS,IAAI,GAAG,IAAI,KAAK,QAAQ,KAAK,WAAW;AAC/C,YAAM,QAAQ,KAAK,MAAM,GAAG,IAAI,SAAS;AACzC,YAAM,SAAS,MAAM;AAAA,QACnB,CAAC,MAAO,EAAE,SAAS,EAAE,MAAM,KAAK,EAAE,SAAS,KAAO,EAAE,YAAY,EAAE,SAAS,KAAK,EAAE,SAAS;AAAA,MAC7F;AACA,aAAO,WAAW,MAAM,SAAS,OAAO;AACxC,UAAI,OAAO,WAAW,GAAG;AACvB,qBAAa,IAAI,MAAM,QAAQ,KAAK,MAAM;AAC1C;AAAA,MACF;AAEA,YAAM,QAAQ
,OAAO,IAAI,CAAC,MAAM;AAC9B,cAAM,SAAS,EAAE,SAAS,IAAI,KAAK;AACnC,cAAM,QAAQ,EAAE,YAAY,IAAI,MAAM,GAAG,GAAG,EAAE,KAAK;AACnD,eAAO,GAAG,KAAK;AAAA,EAAK,IAAI,GAAG,KAAK;AAAA,MAClC,CAAC;AAED,UAAI;AACF,cAAM,UAAU,MAAM,SAAS,MAAM,KAAK;AAC1C,YAAI,CAAC,QAAQ;AACX,gBAAM,MAAM;AAAA,YACV,OAAO,IAAI,CAAC,GAAG,SAAS;AAAA,cACtB,IAAI,EAAE;AAAA,cACN,QAAQ,QAAQ,GAAG;AAAA,cACnB,UAAU;AAAA,gBACR,KAAK,EAAE;AAAA,gBACP,aAAa,EAAE,gBAAgB;AAAA,gBAC/B,SAAS,SAAS;AAAA,cACpB;AAAA,YACF,EAAE;AAAA,UACJ;AAAA,QACF;AACA,eAAO,YAAY,OAAO;AAAA,MAC5B,SAAS,KAAK;AACZ,YAAI,KAAK,yBAAyB;AAAA,UAChC,YAAY;AAAA,UACZ,WAAW,OAAO;AAAA,UAClB,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,QACxD,CAAC;AACD,eAAO,UAAU,OAAO;AAAA,MAC1B;AAEA,mBAAa,IAAI,MAAM,QAAQ,KAAK,MAAM;AAAA,IAC5C;AAEA,WAAO;AAAA,EACT,UAAE;AACA,kBAAc;AAAA,EAChB;AACF;","names":[]}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"change-detector.d.ts","sourceRoot":"","sources":["../../src/cache/change-detector.ts"],"names":[],"mappings":"AAOA,MAAM,WAAW,YAAY;IAC3B,OAAO,EAAE,OAAO,CAAC;IACjB,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB,WAAW,CAAC,EAAE,MAAM,CAAC;CACtB;AAED,wBAAgB,YAAY,CAAC,GAAG,EAAE,MAAM,EAAE,WAAW,EAAE,MAAM,GAAG,YAAY,CAyC3E"}
|
|
@@ -0,0 +1,43 @@
|
|
|
1
|
+
import { createHash } from "node:crypto";
|
|
2
|
+
import { createLogger } from "../logger.js";
|
|
3
|
+
import { normalizeUrl, getHashForNormalizedUrl, getMarkdownForNormalizedUrl } from "./store.js";
|
|
4
|
+
import { computeDiffSummary } from "./diff-summary.js";
|
|
5
|
+
const log = createLogger("cache");
|
|
6
|
+
/**
 * Compares freshly fetched markdown for `url` with the cached copy.
 *
 * The URL is normalized, the stored hash is looked up, and the SHA-256 hex
 * digest of `newMarkdown` is compared against it. When they differ, the cached
 * markdown (if any) is used to compute a diff summary.
 *
 * @param url URL of the page being checked.
 * @param newMarkdown Newly extracted markdown for that page.
 * @returns `{ changed: false }` when there is no cached hash, the hashes
 *   match, or anything throws; otherwise `{ changed: true, previousHash,
 *   diffSummary }`, where `diffSummary` is undefined if no cached markdown
 *   was found.
 */
function detectChange(url, newMarkdown) {
  try {
    const key = normalizeUrl(url);
    const cachedHash = getHashForNormalizedUrl(key);
    if (cachedHash === null) {
      log.debug("no cached entry for change detection", { url: key });
      return { changed: false };
    }

    const freshHash = createHash("sha256").update(newMarkdown).digest("hex");
    if (freshHash === cachedHash) {
      log.debug("content unchanged", { url: key, hash: freshHash });
      return { changed: false };
    }

    const cachedMarkdown = getMarkdownForNormalizedUrl(key);
    let diffSummary;
    if (cachedMarkdown !== null) {
      diffSummary = computeDiffSummary(cachedMarkdown, newMarkdown);
    }

    log.info("content change detected", {
      url: key,
      previousHash: cachedHash,
      newHash: freshHash,
      diffSummary
    });
    return { changed: true, previousHash: cachedHash, diffSummary };
  } catch (err) {
    // Detection is best-effort: failures are logged and reported as "unchanged".
    const message = err instanceof Error ? err.message : String(err);
    log.error("change detection failed", { url, error: message });
    return { changed: false };
  }
}
|
|
40
|
+
export {
|
|
41
|
+
detectChange
|
|
42
|
+
};
|
|
43
|
+
//# sourceMappingURL=change-detector.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../src/cache/change-detector.ts"],"sourcesContent":["import { createHash } from 'node:crypto';\nimport { createLogger } from '../logger.js';\nimport { normalizeUrl, getHashForNormalizedUrl, getMarkdownForNormalizedUrl } from './store.js';\nimport { computeDiffSummary } from './diff-summary.js';\n\nconst log = createLogger('cache');\n\nexport interface ChangeResult {\n changed: boolean;\n previousHash?: string;\n diffSummary?: string;\n}\n\nexport function detectChange(url: string, newMarkdown: string): ChangeResult {\n try {\n const normalizedUrl = normalizeUrl(url);\n const previousHash = getHashForNormalizedUrl(normalizedUrl);\n\n if (previousHash === null) {\n log.debug('no cached entry for change detection', { url: normalizedUrl });\n return { changed: false };\n }\n\n const newHash = createHash('sha256').update(newMarkdown).digest('hex');\n\n if (newHash === previousHash) {\n log.debug('content unchanged', { url: normalizedUrl, hash: newHash });\n return { changed: false };\n }\n\n const previousMarkdown = getMarkdownForNormalizedUrl(normalizedUrl);\n const diffSummary = previousMarkdown !== null\n ? computeDiffSummary(previousMarkdown, newMarkdown)\n : undefined;\n\n log.info('content change detected', {\n url: normalizedUrl,\n previousHash,\n newHash,\n diffSummary,\n });\n\n return {\n changed: true,\n previousHash,\n diffSummary,\n };\n } catch (err) {\n log.error('change detection failed', {\n url,\n error: err instanceof Error ? 
err.message : String(err),\n });\n return { changed: false };\n }\n}\n"],"mappings":"AAAA,SAAS,kBAAkB;AAC3B,SAAS,oBAAoB;AAC7B,SAAS,cAAc,yBAAyB,mCAAmC;AACnF,SAAS,0BAA0B;AAEnC,MAAM,MAAM,aAAa,OAAO;AAQzB,SAAS,aAAa,KAAa,aAAmC;AAC3E,MAAI;AACF,UAAM,gBAAgB,aAAa,GAAG;AACtC,UAAM,eAAe,wBAAwB,aAAa;AAE1D,QAAI,iBAAiB,MAAM;AACzB,UAAI,MAAM,wCAAwC,EAAE,KAAK,cAAc,CAAC;AACxE,aAAO,EAAE,SAAS,MAAM;AAAA,IAC1B;AAEA,UAAM,UAAU,WAAW,QAAQ,EAAE,OAAO,WAAW,EAAE,OAAO,KAAK;AAErE,QAAI,YAAY,cAAc;AAC5B,UAAI,MAAM,qBAAqB,EAAE,KAAK,eAAe,MAAM,QAAQ,CAAC;AACpE,aAAO,EAAE,SAAS,MAAM;AAAA,IAC1B;AAEA,UAAM,mBAAmB,4BAA4B,aAAa;AAClE,UAAM,cAAc,qBAAqB,OACrC,mBAAmB,kBAAkB,WAAW,IAChD;AAEJ,QAAI,KAAK,2BAA2B;AAAA,MAClC,KAAK;AAAA,MACL;AAAA,MACA;AAAA,MACA;AAAA,IACF,CAAC;AAED,WAAO;AAAA,MACL,SAAS;AAAA,MACT;AAAA,MACA;AAAA,IACF;AAAA,EACF,SAAS,KAAK;AACZ,QAAI,MAAM,2BAA2B;AAAA,MACnC;AAAA,MACA,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,IACxD,CAAC;AACD,WAAO,EAAE,SAAS,MAAM;AAAA,EAC1B;AACF;","names":[]}
|
package/dist/cache/db.d.ts
CHANGED
|
@@ -1,4 +1,5 @@
|
|
|
1
1
|
import Database from 'better-sqlite3';
|
|
2
|
+
export declare function isVecExtensionLoaded(): boolean;
|
|
2
3
|
export declare function initDatabase(dbPath: string): Database.Database;
|
|
3
4
|
export declare function getDatabase(): Database.Database;
|
|
4
5
|
export declare function closeDatabase(): void;
|
package/dist/cache/db.d.ts.map
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"db.d.ts","sourceRoot":"","sources":["../../src/cache/db.ts"],"names":[],"mappings":"AAAA,OAAO,QAAQ,MAAM,gBAAgB,CAAC;
|
|
1
|
+
{"version":3,"file":"db.d.ts","sourceRoot":"","sources":["../../src/cache/db.ts"],"names":[],"mappings":"AAAA,OAAO,QAAQ,MAAM,gBAAgB,CAAC;AAWtC,wBAAgB,oBAAoB,IAAI,OAAO,CAE9C;AAkBD,wBAAgB,YAAY,CAAC,MAAM,EAAE,MAAM,GAAG,QAAQ,CAAC,QAAQ,CAkJ9D;AAED,wBAAgB,WAAW,IAAI,QAAQ,CAAC,QAAQ,CAK/C;AAED,wBAAgB,aAAa,IAAI,IAAI,CAMpC"}
|