@staticn0va/wigolo 0.1.0 → 0.1.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +1 -1
- package/README.md +146 -227
- package/SKILL.md +382 -0
- package/assets/blocks/claude-code/CLAUDE.md.block +20 -0
- package/assets/blocks/claude-code/wigolo-command.md +40 -0
- package/assets/blocks/cursor/wigolo.mdc +46 -0
- package/assets/blocks/gemini-cli/GEMINI.md.block +18 -0
- package/assets/blocks/vscode/copilot-instructions.md.block +18 -0
- package/assets/skills/wigolo/SKILL.md +50 -0
- package/assets/skills/wigolo/rules/cache-first.md +30 -0
- package/assets/skills/wigolo/rules/synthesis.md +43 -0
- package/assets/skills/wigolo-agent/SKILL.md +73 -0
- package/assets/skills/wigolo-crawl/SKILL.md +60 -0
- package/assets/skills/wigolo-extract/SKILL.md +59 -0
- package/assets/skills/wigolo-fetch/SKILL.md +65 -0
- package/assets/skills/wigolo-find-similar/SKILL.md +72 -0
- package/assets/skills/wigolo-research/SKILL.md +77 -0
- package/assets/skills/wigolo-search/SKILL.md +78 -0
- package/dist/agent/executor.d.ts +33 -0
- package/dist/agent/executor.d.ts.map +1 -0
- package/dist/agent/executor.js +233 -0
- package/dist/agent/executor.js.map +1 -0
- package/dist/agent/pipeline.d.ts +5 -0
- package/dist/agent/pipeline.d.ts.map +1 -0
- package/dist/agent/pipeline.js +238 -0
- package/dist/agent/pipeline.js.map +1 -0
- package/dist/agent/planner.d.ts +13 -0
- package/dist/agent/planner.d.ts.map +1 -0
- package/dist/agent/planner.js +271 -0
- package/dist/agent/planner.js.map +1 -0
- package/dist/agent/relevance.d.ts +15 -0
- package/dist/agent/relevance.d.ts.map +1 -0
- package/dist/agent/relevance.js +60 -0
- package/dist/agent/relevance.js.map +1 -0
- package/dist/cache/backfill-embeddings.d.ts +23 -0
- package/dist/cache/backfill-embeddings.d.ts.map +1 -0
- package/dist/cache/backfill-embeddings.js +105 -0
- package/dist/cache/backfill-embeddings.js.map +1 -0
- package/dist/cache/change-detector.d.ts +7 -0
- package/dist/cache/change-detector.d.ts.map +1 -0
- package/dist/cache/change-detector.js +43 -0
- package/dist/cache/change-detector.js.map +1 -0
- package/dist/cache/db.d.ts +1 -0
- package/dist/cache/db.d.ts.map +1 -1
- package/dist/cache/db.js +94 -22
- package/dist/cache/db.js.map +1 -1
- package/dist/cache/diff-summary.d.ts +2 -0
- package/dist/cache/diff-summary.d.ts.map +1 -0
- package/dist/cache/diff-summary.js +82 -0
- package/dist/cache/diff-summary.js.map +1 -0
- package/dist/cache/migrations/runner.d.ts +29 -0
- package/dist/cache/migrations/runner.d.ts.map +1 -0
- package/dist/cache/migrations/runner.js +147 -0
- package/dist/cache/migrations/runner.js.map +1 -0
- package/dist/cache/sqlite-vec-store.d.ts +42 -0
- package/dist/cache/sqlite-vec-store.d.ts.map +1 -0
- package/dist/cache/sqlite-vec-store.js +176 -0
- package/dist/cache/sqlite-vec-store.js.map +1 -0
- package/dist/cache/store.d.ts +47 -1
- package/dist/cache/store.d.ts.map +1 -1
- package/dist/cache/store.js +364 -168
- package/dist/cache/store.js.map +1 -1
- package/dist/cli/agents/antigravity.d.ts +20 -0
- package/dist/cli/agents/antigravity.d.ts.map +1 -0
- package/dist/cli/agents/antigravity.js +49 -0
- package/dist/cli/agents/antigravity.js.map +1 -0
- package/dist/cli/agents/claude-code.d.ts +25 -0
- package/dist/cli/agents/claude-code.d.ts.map +1 -0
- package/dist/cli/agents/claude-code.js +111 -0
- package/dist/cli/agents/claude-code.js.map +1 -0
- package/dist/cli/agents/cursor.d.ts +21 -0
- package/dist/cli/agents/cursor.d.ts.map +1 -0
- package/dist/cli/agents/cursor.js +58 -0
- package/dist/cli/agents/cursor.js.map +1 -0
- package/dist/cli/agents/gemini-cli.d.ts +21 -0
- package/dist/cli/agents/gemini-cli.d.ts.map +1 -0
- package/dist/cli/agents/gemini-cli.js +55 -0
- package/dist/cli/agents/gemini-cli.js.map +1 -0
- package/dist/cli/agents/registry.d.ts +21 -0
- package/dist/cli/agents/registry.d.ts.map +1 -0
- package/dist/cli/agents/registry.js +27 -0
- package/dist/cli/agents/registry.js.map +1 -0
- package/dist/cli/agents/utils.d.ts +26 -0
- package/dist/cli/agents/utils.d.ts.map +1 -0
- package/dist/cli/agents/utils.js +136 -0
- package/dist/cli/agents/utils.js.map +1 -0
- package/dist/cli/agents/vscode.d.ts +21 -0
- package/dist/cli/agents/vscode.d.ts.map +1 -0
- package/dist/cli/agents/vscode.js +62 -0
- package/dist/cli/agents/vscode.js.map +1 -0
- package/dist/cli/auth.d.ts +2 -0
- package/dist/cli/auth.d.ts.map +1 -0
- package/dist/cli/auth.js +94 -0
- package/dist/cli/auth.js.map +1 -0
- package/dist/cli/backfill.d.ts +2 -0
- package/dist/cli/backfill.d.ts.map +1 -0
- package/dist/cli/backfill.js +58 -0
- package/dist/cli/backfill.js.map +1 -0
- package/dist/cli/daemon.d.ts +6 -1
- package/dist/cli/daemon.d.ts.map +1 -1
- package/dist/cli/daemon.js +61 -3
- package/dist/cli/daemon.js.map +1 -1
- package/dist/cli/doctor.d.ts +8 -0
- package/dist/cli/doctor.d.ts.map +1 -0
- package/dist/cli/doctor.js +344 -0
- package/dist/cli/doctor.js.map +1 -0
- package/dist/cli/health.d.ts +1 -1
- package/dist/cli/health.d.ts.map +1 -1
- package/dist/cli/health.js +42 -3
- package/dist/cli/health.js.map +1 -1
- package/dist/cli/help.d.ts +6 -0
- package/dist/cli/help.d.ts.map +1 -0
- package/dist/cli/help.js +63 -0
- package/dist/cli/help.js.map +1 -0
- package/dist/cli/index.d.ts +1 -1
- package/dist/cli/index.d.ts.map +1 -1
- package/dist/cli/index.js +35 -7
- package/dist/cli/index.js.map +1 -1
- package/dist/cli/init.d.ts +2 -0
- package/dist/cli/init.d.ts.map +1 -0
- package/dist/cli/init.js +201 -0
- package/dist/cli/init.js.map +1 -0
- package/dist/cli/plugin.d.ts +5 -0
- package/dist/cli/plugin.d.ts.map +1 -0
- package/dist/cli/plugin.js +185 -0
- package/dist/cli/plugin.js.map +1 -0
- package/dist/cli/setup-mcp.d.ts +2 -0
- package/dist/cli/setup-mcp.d.ts.map +1 -0
- package/dist/cli/setup-mcp.js +114 -0
- package/dist/cli/setup-mcp.js.map +1 -0
- package/dist/cli/shell.d.ts +2 -0
- package/dist/cli/shell.d.ts.map +1 -0
- package/dist/cli/shell.js +86 -0
- package/dist/cli/shell.js.map +1 -0
- package/dist/cli/shutdown.d.ts +2 -0
- package/dist/cli/shutdown.d.ts.map +1 -0
- package/dist/cli/shutdown.js +26 -0
- package/dist/cli/shutdown.js.map +1 -0
- package/dist/cli/status.d.ts +2 -0
- package/dist/cli/status.d.ts.map +1 -0
- package/dist/cli/status.js +31 -0
- package/dist/cli/status.js.map +1 -0
- package/dist/cli/telemetry.d.ts +10 -0
- package/dist/cli/telemetry.d.ts.map +1 -0
- package/dist/cli/telemetry.js +56 -0
- package/dist/cli/telemetry.js.map +1 -0
- package/dist/cli/tui/agents-types.d.ts +28 -0
- package/dist/cli/tui/agents-types.d.ts.map +1 -0
- package/dist/cli/tui/agents-types.js +1 -0
- package/dist/cli/tui/agents-types.js.map +1 -0
- package/dist/cli/tui/agents.d.ts +11 -0
- package/dist/cli/tui/agents.d.ts.map +1 -0
- package/dist/cli/tui/agents.js +93 -0
- package/dist/cli/tui/agents.js.map +1 -0
- package/dist/cli/tui/banner.d.ts +3 -0
- package/dist/cli/tui/banner.d.ts.map +1 -0
- package/dist/cli/tui/banner.js +30 -0
- package/dist/cli/tui/banner.js.map +1 -0
- package/dist/cli/tui/components/AgentSelect.d.ts +13 -0
- package/dist/cli/tui/components/AgentSelect.d.ts.map +1 -0
- package/dist/cli/tui/components/AgentSelect.js +116 -0
- package/dist/cli/tui/components/AgentSelect.js.map +1 -0
- package/dist/cli/tui/components/Banner.d.ts +6 -0
- package/dist/cli/tui/components/Banner.d.ts.map +1 -0
- package/dist/cli/tui/components/Banner.js +25 -0
- package/dist/cli/tui/components/Banner.js.map +1 -0
- package/dist/cli/tui/components/BrowserSelect.d.ts +7 -0
- package/dist/cli/tui/components/BrowserSelect.d.ts.map +1 -0
- package/dist/cli/tui/components/BrowserSelect.js +19 -0
- package/dist/cli/tui/components/BrowserSelect.js.map +1 -0
- package/dist/cli/tui/components/InstallProgress.d.ts +9 -0
- package/dist/cli/tui/components/InstallProgress.d.ts.map +1 -0
- package/dist/cli/tui/components/InstallProgress.js +67 -0
- package/dist/cli/tui/components/InstallProgress.js.map +1 -0
- package/dist/cli/tui/components/SkillInstall.d.ts +14 -0
- package/dist/cli/tui/components/SkillInstall.d.ts.map +1 -0
- package/dist/cli/tui/components/SkillInstall.js +94 -0
- package/dist/cli/tui/components/SkillInstall.js.map +1 -0
- package/dist/cli/tui/components/Summary.d.ts +22 -0
- package/dist/cli/tui/components/Summary.d.ts.map +1 -0
- package/dist/cli/tui/components/Summary.js +135 -0
- package/dist/cli/tui/components/Summary.js.map +1 -0
- package/dist/cli/tui/components/SystemCheck.d.ts +8 -0
- package/dist/cli/tui/components/SystemCheck.d.ts.map +1 -0
- package/dist/cli/tui/components/SystemCheck.js +71 -0
- package/dist/cli/tui/components/SystemCheck.js.map +1 -0
- package/dist/cli/tui/components/Verification.d.ts +8 -0
- package/dist/cli/tui/components/Verification.d.ts.map +1 -0
- package/dist/cli/tui/components/Verification.js +63 -0
- package/dist/cli/tui/components/Verification.js.map +1 -0
- package/dist/cli/tui/config-writer-cli.d.ts +12 -0
- package/dist/cli/tui/config-writer-cli.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-cli.js +39 -0
- package/dist/cli/tui/config-writer-cli.js.map +1 -0
- package/dist/cli/tui/config-writer-json.d.ts +16 -0
- package/dist/cli/tui/config-writer-json.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-json.js +86 -0
- package/dist/cli/tui/config-writer-json.js.map +1 -0
- package/dist/cli/tui/config-writer-toml.d.ts +16 -0
- package/dist/cli/tui/config-writer-toml.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-toml.js +83 -0
- package/dist/cli/tui/config-writer-toml.js.map +1 -0
- package/dist/cli/tui/config-writer.d.ts +25 -0
- package/dist/cli/tui/config-writer.d.ts.map +1 -0
- package/dist/cli/tui/config-writer.js +101 -0
- package/dist/cli/tui/config-writer.js.map +1 -0
- package/dist/cli/tui/detect-helpers.d.ts +6 -0
- package/dist/cli/tui/detect-helpers.d.ts.map +1 -0
- package/dist/cli/tui/detect-helpers.js +45 -0
- package/dist/cli/tui/detect-helpers.js.map +1 -0
- package/dist/cli/tui/extras-prompt.d.ts +7 -0
- package/dist/cli/tui/extras-prompt.d.ts.map +1 -0
- package/dist/cli/tui/extras-prompt.js +42 -0
- package/dist/cli/tui/extras-prompt.js.map +1 -0
- package/dist/cli/tui/flags-types.d.ts +19 -0
- package/dist/cli/tui/flags-types.d.ts.map +1 -0
- package/dist/cli/tui/flags-types.js +23 -0
- package/dist/cli/tui/flags-types.js.map +1 -0
- package/dist/cli/tui/flags.d.ts +5 -0
- package/dist/cli/tui/flags.d.ts.map +1 -0
- package/dist/cli/tui/flags.js +132 -0
- package/dist/cli/tui/flags.js.map +1 -0
- package/dist/cli/tui/format.d.ts +14 -0
- package/dist/cli/tui/format.d.ts.map +1 -0
- package/dist/cli/tui/format.js +37 -0
- package/dist/cli/tui/format.js.map +1 -0
- package/dist/cli/tui/hooks/useAgentDetect.d.ts +6 -0
- package/dist/cli/tui/hooks/useAgentDetect.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useAgentDetect.js +19 -0
- package/dist/cli/tui/hooks/useAgentDetect.js.map +1 -0
- package/dist/cli/tui/hooks/useInstall.d.ts +14 -0
- package/dist/cli/tui/hooks/useInstall.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useInstall.js +90 -0
- package/dist/cli/tui/hooks/useInstall.js.map +1 -0
- package/dist/cli/tui/hooks/useSystemCheck.d.ts +13 -0
- package/dist/cli/tui/hooks/useSystemCheck.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useSystemCheck.js +95 -0
- package/dist/cli/tui/hooks/useSystemCheck.js.map +1 -0
- package/dist/cli/tui/hooks/useVerify.d.ts +14 -0
- package/dist/cli/tui/hooks/useVerify.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useVerify.js +71 -0
- package/dist/cli/tui/hooks/useVerify.js.map +1 -0
- package/dist/cli/tui/ink-init.d.ts +2 -0
- package/dist/cli/tui/ink-init.d.ts.map +1 -0
- package/dist/cli/tui/ink-init.js +198 -0
- package/dist/cli/tui/ink-init.js.map +1 -0
- package/dist/cli/tui/reporter-auto.d.ts +7 -0
- package/dist/cli/tui/reporter-auto.d.ts.map +1 -0
- package/dist/cli/tui/reporter-auto.js +15 -0
- package/dist/cli/tui/reporter-auto.js.map +1 -0
- package/dist/cli/tui/reporter.d.ts +26 -0
- package/dist/cli/tui/reporter.d.ts.map +1 -0
- package/dist/cli/tui/reporter.js +32 -0
- package/dist/cli/tui/reporter.js.map +1 -0
- package/dist/cli/tui/run-command.d.ts +14 -0
- package/dist/cli/tui/run-command.d.ts.map +1 -0
- package/dist/cli/tui/run-command.js +72 -0
- package/dist/cli/tui/run-command.js.map +1 -0
- package/dist/cli/tui/select-agents.d.ts +6 -0
- package/dist/cli/tui/select-agents.d.ts.map +1 -0
- package/dist/cli/tui/select-agents.js +32 -0
- package/dist/cli/tui/select-agents.js.map +1 -0
- package/dist/cli/tui/status-agents.d.ts +11 -0
- package/dist/cli/tui/status-agents.d.ts.map +1 -0
- package/dist/cli/tui/status-agents.js +53 -0
- package/dist/cli/tui/status-agents.js.map +1 -0
- package/dist/cli/tui/status-cache.d.ts +6 -0
- package/dist/cli/tui/status-cache.d.ts.map +1 -0
- package/dist/cli/tui/status-cache.js +39 -0
- package/dist/cli/tui/status-cache.js.map +1 -0
- package/dist/cli/tui/status-format.d.ts +14 -0
- package/dist/cli/tui/status-format.d.ts.map +1 -0
- package/dist/cli/tui/status-format.js +41 -0
- package/dist/cli/tui/status-format.js.map +1 -0
- package/dist/cli/tui/status-python.d.ts +6 -0
- package/dist/cli/tui/status-python.d.ts.map +1 -0
- package/dist/cli/tui/status-python.js +30 -0
- package/dist/cli/tui/status-python.js.map +1 -0
- package/dist/cli/tui/system-check.d.ts +24 -0
- package/dist/cli/tui/system-check.d.ts.map +1 -0
- package/dist/cli/tui/system-check.js +103 -0
- package/dist/cli/tui/system-check.js.map +1 -0
- package/dist/cli/tui/tui-reporter.d.ts +19 -0
- package/dist/cli/tui/tui-reporter.d.ts.map +1 -0
- package/dist/cli/tui/tui-reporter.js +95 -0
- package/dist/cli/tui/tui-reporter.js.map +1 -0
- package/dist/cli/tui/utils/config-writer.d.ts +3 -0
- package/dist/cli/tui/utils/config-writer.d.ts.map +1 -0
- package/dist/cli/tui/utils/config-writer.js +22 -0
- package/dist/cli/tui/utils/config-writer.js.map +1 -0
- package/dist/cli/tui/utils/suppress-logs.d.ts +3 -0
- package/dist/cli/tui/utils/suppress-logs.d.ts.map +1 -0
- package/dist/cli/tui/utils/suppress-logs.js +11 -0
- package/dist/cli/tui/utils/suppress-logs.js.map +1 -0
- package/dist/cli/tui/verify-suggestions.d.ts +5 -0
- package/dist/cli/tui/verify-suggestions.d.ts.map +1 -0
- package/dist/cli/tui/verify-suggestions.js +20 -0
- package/dist/cli/tui/verify-suggestions.js.map +1 -0
- package/dist/cli/tui/verify.d.ts +14 -0
- package/dist/cli/tui/verify.d.ts.map +1 -0
- package/dist/cli/tui/verify.js +101 -0
- package/dist/cli/tui/verify.js.map +1 -0
- package/dist/cli/tui/version.d.ts +2 -0
- package/dist/cli/tui/version.d.ts.map +1 -0
- package/dist/cli/tui/version.js +14 -0
- package/dist/cli/tui/version.js.map +1 -0
- package/dist/cli/uninstall.d.ts +2 -0
- package/dist/cli/uninstall.d.ts.map +1 -0
- package/dist/cli/uninstall.js +57 -0
- package/dist/cli/uninstall.js.map +1 -0
- package/dist/cli/warmup.d.ts +10 -2
- package/dist/cli/warmup.d.ts.map +1 -1
- package/dist/cli/warmup.js +226 -93
- package/dist/cli/warmup.js.map +1 -1
- package/dist/config.d.ts +28 -2
- package/dist/config.d.ts.map +1 -1
- package/dist/config.js +106 -56
- package/dist/config.js.map +1 -1
- package/dist/crawl/crawler.d.ts +6 -0
- package/dist/crawl/crawler.d.ts.map +1 -1
- package/dist/crawl/crawler.js +210 -209
- package/dist/crawl/crawler.js.map +1 -1
- package/dist/crawl/dedup.d.ts +1 -0
- package/dist/crawl/dedup.d.ts.map +1 -1
- package/dist/crawl/dedup.js +124 -81
- package/dist/crawl/dedup.js.map +1 -1
- package/dist/crawl/etag-incremental.d.ts +43 -0
- package/dist/crawl/etag-incremental.d.ts.map +1 -0
- package/dist/crawl/etag-incremental.js +94 -0
- package/dist/crawl/etag-incremental.js.map +1 -0
- package/dist/crawl/index-to-vec.d.ts +10 -0
- package/dist/crawl/index-to-vec.d.ts.map +1 -0
- package/dist/crawl/index-to-vec.js +44 -0
- package/dist/crawl/index-to-vec.js.map +1 -0
- package/dist/crawl/mapper.js +136 -164
- package/dist/crawl/mapper.js.map +1 -1
- package/dist/crawl/rate-limiter.js +63 -66
- package/dist/crawl/rate-limiter.js.map +1 -1
- package/dist/crawl/robots.js +58 -57
- package/dist/crawl/robots.js.map +1 -1
- package/dist/crawl/sitemap-first.d.ts +12 -0
- package/dist/crawl/sitemap-first.d.ts.map +1 -0
- package/dist/crawl/sitemap-first.js +47 -0
- package/dist/crawl/sitemap-first.js.map +1 -0
- package/dist/crawl/sitemap.js +33 -32
- package/dist/crawl/sitemap.js.map +1 -1
- package/dist/crawl/url-utils.d.ts +1 -0
- package/dist/crawl/url-utils.d.ts.map +1 -1
- package/dist/crawl/url-utils.js +49 -37
- package/dist/crawl/url-utils.js.map +1 -1
- package/dist/daemon/health-check.d.ts +16 -0
- package/dist/daemon/health-check.d.ts.map +1 -0
- package/dist/daemon/health-check.js +33 -0
- package/dist/daemon/health-check.js.map +1 -0
- package/dist/daemon/http-server.d.ts +26 -0
- package/dist/daemon/http-server.d.ts.map +1 -0
- package/dist/daemon/http-server.js +275 -0
- package/dist/daemon/http-server.js.map +1 -0
- package/dist/daemon/proxy.d.ts +10 -0
- package/dist/daemon/proxy.d.ts.map +1 -0
- package/dist/daemon/proxy.js +93 -0
- package/dist/daemon/proxy.js.map +1 -0
- package/dist/embedding/embed.d.ts +59 -0
- package/dist/embedding/embed.d.ts.map +1 -0
- package/dist/embedding/embed.js +233 -0
- package/dist/embedding/embed.js.map +1 -0
- package/dist/embedding/fastembed-provider.d.ts +19 -0
- package/dist/embedding/fastembed-provider.d.ts.map +1 -0
- package/dist/embedding/fastembed-provider.js +51 -0
- package/dist/embedding/fastembed-provider.js.map +1 -0
- package/dist/embedding/key-terms.d.ts +12 -0
- package/dist/embedding/key-terms.d.ts.map +1 -0
- package/dist/embedding/key-terms.js +234 -0
- package/dist/embedding/key-terms.js.map +1 -0
- package/dist/extraction/boilerplate.d.ts +15 -0
- package/dist/extraction/boilerplate.d.ts.map +1 -0
- package/dist/extraction/boilerplate.js +52 -0
- package/dist/extraction/boilerplate.js.map +1 -0
- package/dist/extraction/defuddle.d.ts.map +1 -1
- package/dist/extraction/defuddle.js +27 -23
- package/dist/extraction/defuddle.js.map +1 -1
- package/dist/extraction/extract.d.ts.map +1 -1
- package/dist/extraction/extract.js +76 -76
- package/dist/extraction/extract.js.map +1 -1
- package/dist/extraction/jsonld.js +50 -54
- package/dist/extraction/jsonld.js.map +1 -1
- package/dist/extraction/lang-hints.d.ts +2 -0
- package/dist/extraction/lang-hints.d.ts.map +1 -0
- package/dist/extraction/lang-hints.js +30 -0
- package/dist/extraction/lang-hints.js.map +1 -0
- package/dist/extraction/llm-fallback.d.ts +17 -0
- package/dist/extraction/llm-fallback.d.ts.map +1 -0
- package/dist/extraction/llm-fallback.js +130 -0
- package/dist/extraction/llm-fallback.js.map +1 -0
- package/dist/extraction/markdown-sanitize.d.ts +2 -0
- package/dist/extraction/markdown-sanitize.d.ts.map +1 -0
- package/dist/extraction/markdown-sanitize.js +151 -0
- package/dist/extraction/markdown-sanitize.js.map +1 -0
- package/dist/extraction/markdown.d.ts +11 -0
- package/dist/extraction/markdown.d.ts.map +1 -1
- package/dist/extraction/markdown.js +195 -91
- package/dist/extraction/markdown.js.map +1 -1
- package/dist/extraction/pipeline.d.ts +8 -0
- package/dist/extraction/pipeline.d.ts.map +1 -1
- package/dist/extraction/pipeline.js +57 -91
- package/dist/extraction/pipeline.js.map +1 -1
- package/dist/extraction/readability.d.ts +1 -1
- package/dist/extraction/readability.d.ts.map +1 -1
- package/dist/extraction/readability.js +28 -29
- package/dist/extraction/readability.js.map +1 -1
- package/dist/extraction/schema.d.ts +12 -0
- package/dist/extraction/schema.d.ts.map +1 -1
- package/dist/extraction/schema.js +135 -72
- package/dist/extraction/schema.js.map +1 -1
- package/dist/extraction/site-extractors/docs-generic.d.ts.map +1 -1
- package/dist/extraction/site-extractors/docs-generic.js +81 -91
- package/dist/extraction/site-extractors/docs-generic.js.map +1 -1
- package/dist/extraction/site-extractors/github.d.ts.map +1 -1
- package/dist/extraction/site-extractors/github.js +87 -95
- package/dist/extraction/site-extractors/github.js.map +1 -1
- package/dist/extraction/site-extractors/mdn.d.ts.map +1 -1
- package/dist/extraction/site-extractors/mdn.js +46 -54
- package/dist/extraction/site-extractors/mdn.js.map +1 -1
- package/dist/extraction/site-extractors/stackoverflow.d.ts.map +1 -1
- package/dist/extraction/site-extractors/stackoverflow.js +71 -80
- package/dist/extraction/site-extractors/stackoverflow.js.map +1 -1
- package/dist/extraction/structured-data.d.ts +4 -0
- package/dist/extraction/structured-data.d.ts.map +1 -0
- package/dist/extraction/structured-data.js +173 -0
- package/dist/extraction/structured-data.js.map +1 -0
- package/dist/extraction/structured.d.ts +4 -0
- package/dist/extraction/structured.d.ts.map +1 -0
- package/dist/extraction/structured.js +163 -0
- package/dist/extraction/structured.js.map +1 -0
- package/dist/extraction/v1/classifier.d.ts +3 -0
- package/dist/extraction/v1/classifier.d.ts.map +1 -0
- package/dist/extraction/v1/classifier.js +110 -0
- package/dist/extraction/v1/classifier.js.map +1 -0
- package/dist/extraction/v1/extract-provider.d.ts +16 -0
- package/dist/extraction/v1/extract-provider.d.ts.map +1 -0
- package/dist/extraction/v1/extract-provider.js +43 -0
- package/dist/extraction/v1/extract-provider.js.map +1 -0
- package/dist/extraction/v1/local-llm.d.ts +8 -0
- package/dist/extraction/v1/local-llm.d.ts.map +1 -0
- package/dist/extraction/v1/local-llm.js +34 -0
- package/dist/extraction/v1/local-llm.js.map +1 -0
- package/dist/extraction/v1/news.d.ts +3 -0
- package/dist/extraction/v1/news.d.ts.map +1 -0
- package/dist/extraction/v1/news.js +61 -0
- package/dist/extraction/v1/news.js.map +1 -0
- package/dist/extraction/v1/product.d.ts +3 -0
- package/dist/extraction/v1/product.d.ts.map +1 -0
- package/dist/extraction/v1/product.js +166 -0
- package/dist/extraction/v1/product.js.map +1 -0
- package/dist/extraction/v1/recipe.d.ts +3 -0
- package/dist/extraction/v1/recipe.d.ts.map +1 -0
- package/dist/extraction/v1/recipe.js +136 -0
- package/dist/extraction/v1/recipe.js.map +1 -0
- package/dist/extraction/v1/routed.d.ts +17 -0
- package/dist/extraction/v1/routed.d.ts.map +1 -0
- package/dist/extraction/v1/routed.js +68 -0
- package/dist/extraction/v1/routed.js.map +1 -0
- package/dist/extraction/v1/schemas/Article.d.ts +11 -0
- package/dist/extraction/v1/schemas/Article.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Article.js +23 -0
- package/dist/extraction/v1/schemas/Article.js.map +1 -0
- package/dist/extraction/v1/schemas/CodeSnippet.d.ts +9 -0
- package/dist/extraction/v1/schemas/CodeSnippet.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/CodeSnippet.js +90 -0
- package/dist/extraction/v1/schemas/CodeSnippet.js.map +1 -0
- package/dist/extraction/v1/schemas/EventListing.d.ts +10 -0
- package/dist/extraction/v1/schemas/EventListing.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/EventListing.js +122 -0
- package/dist/extraction/v1/schemas/EventListing.js.map +1 -0
- package/dist/extraction/v1/schemas/Paper.d.ts +10 -0
- package/dist/extraction/v1/schemas/Paper.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Paper.js +156 -0
- package/dist/extraction/v1/schemas/Paper.js.map +1 -0
- package/dist/extraction/v1/schemas/Product.d.ts +17 -0
- package/dist/extraction/v1/schemas/Product.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Product.js +149 -0
- package/dist/extraction/v1/schemas/Product.js.map +1 -0
- package/dist/extraction/v1/schemas/Recipe.d.ts +14 -0
- package/dist/extraction/v1/schemas/Recipe.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Recipe.js +160 -0
- package/dist/extraction/v1/schemas/Recipe.js.map +1 -0
- package/dist/extraction/v1/schemas/index.d.ts +13 -0
- package/dist/extraction/v1/schemas/index.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/index.js +44 -0
- package/dist/extraction/v1/schemas/index.js.map +1 -0
- package/dist/extraction/v1/site-extractors.d.ts +5 -0
- package/dist/extraction/v1/site-extractors.d.ts.map +1 -0
- package/dist/extraction/v1/site-extractors.js +31 -0
- package/dist/extraction/v1/site-extractors.js.map +1 -0
- package/dist/fetch/action-executor.d.ts +28 -0
- package/dist/fetch/action-executor.d.ts.map +1 -0
- package/dist/fetch/action-executor.js +88 -0
- package/dist/fetch/action-executor.js.map +1 -0
- package/dist/fetch/auth.d.ts +2 -1
- package/dist/fetch/auth.d.ts.map +1 -1
- package/dist/fetch/auth.js +56 -26
- package/dist/fetch/auth.js.map +1 -1
- package/dist/fetch/browser-pool.d.ts +30 -11
- package/dist/fetch/browser-pool.d.ts.map +1 -1
- package/dist/fetch/browser-pool.js +303 -127
- package/dist/fetch/browser-pool.js.map +1 -1
- package/dist/fetch/browser-selector.d.ts +17 -0
- package/dist/fetch/browser-selector.d.ts.map +1 -0
- package/dist/fetch/browser-selector.js +72 -0
- package/dist/fetch/browser-selector.js.map +1 -0
- package/dist/fetch/browser-types.d.ts +3 -0
- package/dist/fetch/browser-types.d.ts.map +1 -0
- package/dist/fetch/browser-types.js +45 -0
- package/dist/fetch/browser-types.js.map +1 -0
- package/dist/fetch/cdp-client.d.ts +9 -0
- package/dist/fetch/cdp-client.d.ts.map +1 -0
- package/dist/fetch/cdp-client.js +89 -0
- package/dist/fetch/cdp-client.js.map +1 -0
- package/dist/fetch/content-check.js +39 -46
- package/dist/fetch/content-check.js.map +1 -1
- package/dist/fetch/error-describe.d.ts +7 -0
- package/dist/fetch/error-describe.d.ts.map +1 -0
- package/dist/fetch/error-describe.js +37 -0
- package/dist/fetch/error-describe.js.map +1 -0
- package/dist/fetch/http-client.d.ts +4 -0
- package/dist/fetch/http-client.d.ts.map +1 -1
- package/dist/fetch/http-client.js +147 -128
- package/dist/fetch/http-client.js.map +1 -1
- package/dist/fetch/lightpanda.d.ts +28 -0
- package/dist/fetch/lightpanda.d.ts.map +1 -0
- package/dist/fetch/lightpanda.js +174 -0
- package/dist/fetch/lightpanda.js.map +1 -0
- package/dist/fetch/playwright-tier.d.ts +19 -0
- package/dist/fetch/playwright-tier.d.ts.map +1 -0
- package/dist/fetch/playwright-tier.js +76 -0
- package/dist/fetch/playwright-tier.js.map +1 -0
- package/dist/fetch/router.d.ts +49 -3
- package/dist/fetch/router.d.ts.map +1 -1
- package/dist/fetch/router.js +187 -81
- package/dist/fetch/router.js.map +1 -1
- package/dist/index.js +102 -17
- package/dist/index.js.map +1 -1
- package/dist/instructions.d.ts +31 -0
- package/dist/instructions.d.ts.map +1 -0
- package/dist/instructions.js +245 -0
- package/dist/instructions.js.map +1 -0
- package/dist/integrations/cloud/llm/anthropic.d.ts +3 -0
- package/dist/integrations/cloud/llm/anthropic.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/anthropic.js +41 -0
- package/dist/integrations/cloud/llm/anthropic.js.map +1 -0
- package/dist/integrations/cloud/llm/cache.d.ts +5 -0
- package/dist/integrations/cloud/llm/cache.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/cache.js +49 -0
- package/dist/integrations/cloud/llm/cache.js.map +1 -0
- package/dist/integrations/cloud/llm/gemini.d.ts +3 -0
- package/dist/integrations/cloud/llm/gemini.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/gemini.js +37 -0
- package/dist/integrations/cloud/llm/gemini.js.map +1 -0
- package/dist/integrations/cloud/llm/groq.d.ts +3 -0
- package/dist/integrations/cloud/llm/groq.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/groq.js +74 -0
- package/dist/integrations/cloud/llm/groq.js.map +1 -0
- package/dist/integrations/cloud/llm/hash.d.ts +3 -0
- package/dist/integrations/cloud/llm/hash.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/hash.js +26 -0
- package/dist/integrations/cloud/llm/hash.js.map +1 -0
- package/dist/integrations/cloud/llm/model-select.d.ts +5 -0
- package/dist/integrations/cloud/llm/model-select.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/model-select.js +32 -0
- package/dist/integrations/cloud/llm/model-select.js.map +1 -0
- package/dist/integrations/cloud/llm/openai.d.ts +3 -0
- package/dist/integrations/cloud/llm/openai.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/openai.js +43 -0
- package/dist/integrations/cloud/llm/openai.js.map +1 -0
- package/dist/integrations/cloud/llm/run.d.ts +27 -0
- package/dist/integrations/cloud/llm/run.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/run.js +99 -0
- package/dist/integrations/cloud/llm/run.js.map +1 -0
- package/dist/integrations/cloud/llm/select.d.ts +5 -0
- package/dist/integrations/cloud/llm/select.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/select.js +30 -0
- package/dist/integrations/cloud/llm/select.js.map +1 -0
- package/dist/integrations/cloud/llm/text-adapters.d.ts +19 -0
- package/dist/integrations/cloud/llm/text-adapters.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/text-adapters.js +103 -0
- package/dist/integrations/cloud/llm/text-adapters.js.map +1 -0
- package/dist/integrations/cloud/llm/types.d.ts +24 -0
- package/dist/integrations/cloud/llm/types.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/types.js +1 -0
- package/dist/integrations/cloud/llm/types.js.map +1 -0
- package/dist/integrations/cloud/llm/validate.d.ts +6 -0
- package/dist/integrations/cloud/llm/validate.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/validate.js +63 -0
- package/dist/integrations/cloud/llm/validate.js.map +1 -0
- package/dist/logger.d.ts +4 -1
- package/dist/logger.d.ts.map +1 -1
- package/dist/logger.js +71 -30
- package/dist/logger.js.map +1 -1
- package/dist/pdf-parse.d.js +1 -0
- package/dist/pdf-parse.d.js.map +1 -0
- package/dist/plugins/loader.d.ts +20 -0
- package/dist/plugins/loader.d.ts.map +1 -0
- package/dist/plugins/loader.js +157 -0
- package/dist/plugins/loader.js.map +1 -0
- package/dist/plugins/registry.d.ts +26 -0
- package/dist/plugins/registry.d.ts.map +1 -0
- package/dist/plugins/registry.js +71 -0
- package/dist/plugins/registry.js.map +1 -0
- package/dist/plugins/validate.d.ts +9 -0
- package/dist/plugins/validate.d.ts.map +1 -0
- package/dist/plugins/validate.js +79 -0
- package/dist/plugins/validate.js.map +1 -0
- package/dist/providers/embed-provider.d.ts +11 -0
- package/dist/providers/embed-provider.d.ts.map +1 -0
- package/dist/providers/embed-provider.js +24 -0
- package/dist/providers/embed-provider.js.map +1 -0
- package/dist/providers/extract-provider.d.ts +23 -0
- package/dist/providers/extract-provider.d.ts.map +1 -0
- package/dist/providers/extract-provider.js +25 -0
- package/dist/providers/extract-provider.js.map +1 -0
- package/dist/providers/rerank-provider.d.ts +17 -0
- package/dist/providers/rerank-provider.d.ts.map +1 -0
- package/dist/providers/rerank-provider.js +41 -0
- package/dist/providers/rerank-provider.js.map +1 -0
- package/dist/providers/search-provider.d.ts +25 -0
- package/dist/providers/search-provider.d.ts.map +1 -0
- package/dist/providers/search-provider.js +44 -0
- package/dist/providers/search-provider.js.map +1 -0
- package/dist/providers/vector-store.d.ts +27 -0
- package/dist/providers/vector-store.d.ts.map +1 -0
- package/dist/providers/vector-store.js +27 -0
- package/dist/providers/vector-store.js.map +1 -0
- package/dist/python-env.d.ts +9 -0
- package/dist/python-env.d.ts.map +1 -0
- package/dist/python-env.js +13 -0
- package/dist/python-env.js.map +1 -0
- package/dist/repl/commands/agent.d.ts +5 -0
- package/dist/repl/commands/agent.d.ts.map +1 -0
- package/dist/repl/commands/agent.js +62 -0
- package/dist/repl/commands/agent.js.map +1 -0
- package/dist/repl/commands/cache.d.ts +4 -0
- package/dist/repl/commands/cache.d.ts.map +1 -0
- package/dist/repl/commands/cache.js +43 -0
- package/dist/repl/commands/cache.js.map +1 -0
- package/dist/repl/commands/crawl.d.ts +7 -0
- package/dist/repl/commands/crawl.d.ts.map +1 -0
- package/dist/repl/commands/crawl.js +44 -0
- package/dist/repl/commands/crawl.js.map +1 -0
- package/dist/repl/commands/extract.d.ts +5 -0
- package/dist/repl/commands/extract.d.ts.map +1 -0
- package/dist/repl/commands/extract.js +47 -0
- package/dist/repl/commands/extract.js.map +1 -0
- package/dist/repl/commands/fetch.d.ts +5 -0
- package/dist/repl/commands/fetch.d.ts.map +1 -0
- package/dist/repl/commands/fetch.js +67 -0
- package/dist/repl/commands/fetch.js.map +1 -0
- package/dist/repl/commands/find-similar.d.ts +5 -0
- package/dist/repl/commands/find-similar.d.ts.map +1 -0
- package/dist/repl/commands/find-similar.js +74 -0
- package/dist/repl/commands/find-similar.js.map +1 -0
- package/dist/repl/commands/research.d.ts +5 -0
- package/dist/repl/commands/research.d.ts.map +1 -0
- package/dist/repl/commands/research.js +65 -0
- package/dist/repl/commands/research.js.map +1 -0
- package/dist/repl/commands/search.d.ts +5 -0
- package/dist/repl/commands/search.d.ts.map +1 -0
- package/dist/repl/commands/search.js +74 -0
- package/dist/repl/commands/search.js.map +1 -0
- package/dist/repl/commands/types.d.ts +9 -0
- package/dist/repl/commands/types.d.ts.map +1 -0
- package/dist/repl/commands/types.js +1 -0
- package/dist/repl/commands/types.js.map +1 -0
- package/dist/repl/formatters.d.ts +13 -0
- package/dist/repl/formatters.d.ts.map +1 -0
- package/dist/repl/formatters.js +283 -0
- package/dist/repl/formatters.js.map +1 -0
- package/dist/repl/parser.d.ts +9 -0
- package/dist/repl/parser.d.ts.map +1 -0
- package/dist/repl/parser.js +86 -0
- package/dist/repl/parser.js.map +1 -0
- package/dist/repl/shell.d.ts +8 -0
- package/dist/repl/shell.d.ts.map +1 -0
- package/dist/repl/shell.js +184 -0
- package/dist/repl/shell.js.map +1 -0
- package/dist/research/branch-exploration.d.ts +14 -0
- package/dist/research/branch-exploration.d.ts.map +1 -0
- package/dist/research/branch-exploration.js +100 -0
- package/dist/research/branch-exploration.js.map +1 -0
- package/dist/research/brief.d.ts +6 -0
- package/dist/research/brief.d.ts.map +1 -0
- package/dist/research/brief.js +246 -0
- package/dist/research/brief.js.map +1 -0
- package/dist/research/citation-graph.d.ts +9 -0
- package/dist/research/citation-graph.d.ts.map +1 -0
- package/dist/research/citation-graph.js +114 -0
- package/dist/research/citation-graph.js.map +1 -0
- package/dist/research/decompose.d.ts +14 -0
- package/dist/research/decompose.d.ts.map +1 -0
- package/dist/research/decompose.js +439 -0
- package/dist/research/decompose.js.map +1 -0
- package/dist/research/pipeline.d.ts +5 -0
- package/dist/research/pipeline.d.ts.map +1 -0
- package/dist/research/pipeline.js +269 -0
- package/dist/research/pipeline.js.map +1 -0
- package/dist/research/synthesis-local.d.ts +19 -0
- package/dist/research/synthesis-local.d.ts.map +1 -0
- package/dist/research/synthesis-local.js +62 -0
- package/dist/research/synthesis-local.js.map +1 -0
- package/dist/research/synthesize.d.ts +10 -0
- package/dist/research/synthesize.d.ts.map +1 -0
- package/dist/research/synthesize.js +137 -0
- package/dist/research/synthesize.js.map +1 -0
- package/dist/search/answer-synthesis.d.ts +33 -0
- package/dist/search/answer-synthesis.d.ts.map +1 -0
- package/dist/search/answer-synthesis.js +244 -0
- package/dist/search/answer-synthesis.js.map +1 -0
- package/dist/search/context-formatter.d.ts +3 -0
- package/dist/search/context-formatter.d.ts.map +1 -0
- package/dist/search/context-formatter.js +56 -0
- package/dist/search/context-formatter.js.map +1 -0
- package/dist/search/dedup.d.ts +1 -0
- package/dist/search/dedup.d.ts.map +1 -1
- package/dist/search/dedup.js +40 -32
- package/dist/search/dedup.js.map +1 -1
- package/dist/search/engines/arxiv.d.ts +7 -0
- package/dist/search/engines/arxiv.d.ts.map +1 -0
- package/dist/search/engines/arxiv.js +70 -0
- package/dist/search/engines/arxiv.js.map +1 -0
- package/dist/search/engines/bing-news.d.ts +7 -0
- package/dist/search/engines/bing-news.d.ts.map +1 -0
- package/dist/search/engines/bing-news.js +97 -0
- package/dist/search/engines/bing-news.js.map +1 -0
- package/dist/search/engines/bing.d.ts +1 -0
- package/dist/search/engines/bing.d.ts.map +1 -1
- package/dist/search/engines/bing.js +100 -44
- package/dist/search/engines/bing.js.map +1 -1
- package/dist/search/engines/devdocs.d.ts +6 -0
- package/dist/search/engines/devdocs.d.ts.map +1 -0
- package/dist/search/engines/devdocs.js +56 -0
- package/dist/search/engines/devdocs.js.map +1 -0
- package/dist/search/engines/duckduckgo.d.ts.map +1 -1
- package/dist/search/engines/duckduckgo.js +56 -44
- package/dist/search/engines/duckduckgo.js.map +1 -1
- package/dist/search/engines/github-code.d.ts +7 -0
- package/dist/search/engines/github-code.d.ts.map +1 -0
- package/dist/search/engines/github-code.js +55 -0
- package/dist/search/engines/github-code.js.map +1 -0
- package/dist/search/engines/hn-algolia.d.ts +7 -0
- package/dist/search/engines/hn-algolia.d.ts.map +1 -0
- package/dist/search/engines/hn-algolia.js +76 -0
- package/dist/search/engines/hn-algolia.js.map +1 -0
- package/dist/search/engines/lobsters.d.ts +7 -0
- package/dist/search/engines/lobsters.d.ts.map +1 -0
- package/dist/search/engines/lobsters.js +83 -0
- package/dist/search/engines/lobsters.js.map +1 -0
- package/dist/search/engines/mdn.d.ts +7 -0
- package/dist/search/engines/mdn.d.ts.map +1 -0
- package/dist/search/engines/mdn.js +48 -0
- package/dist/search/engines/mdn.js.map +1 -0
- package/dist/search/engines/semantic-scholar.d.ts +7 -0
- package/dist/search/engines/semantic-scholar.d.ts.map +1 -0
- package/dist/search/engines/semantic-scholar.js +69 -0
- package/dist/search/engines/semantic-scholar.js.map +1 -0
- package/dist/search/engines/stackoverflow.d.ts +7 -0
- package/dist/search/engines/stackoverflow.d.ts.map +1 -0
- package/dist/search/engines/stackoverflow.js +73 -0
- package/dist/search/engines/stackoverflow.js.map +1 -0
- package/dist/search/engines/startpage.d.ts.map +1 -1
- package/dist/search/engines/startpage.js +65 -46
- package/dist/search/engines/startpage.js.map +1 -1
- package/dist/search/evidence.d.ts +25 -0
- package/dist/search/evidence.d.ts.map +1 -0
- package/dist/search/evidence.js +220 -0
- package/dist/search/evidence.js.map +1 -0
- package/dist/search/filters.d.ts.map +1 -1
- package/dist/search/filters.js +58 -54
- package/dist/search/filters.js.map +1 -1
- package/dist/search/find-similar/crawl-rank.d.ts +9 -0
- package/dist/search/find-similar/crawl-rank.d.ts.map +1 -0
- package/dist/search/find-similar/crawl-rank.js +272 -0
- package/dist/search/find-similar/crawl-rank.js.map +1 -0
- package/dist/search/find-similar/mode.d.ts +4 -0
- package/dist/search/find-similar/mode.d.ts.map +1 -0
- package/dist/search/find-similar/mode.js +12 -0
- package/dist/search/find-similar/mode.js.map +1 -0
- package/dist/search/find-similar.d.ts +5 -0
- package/dist/search/find-similar.d.ts.map +1 -0
- package/dist/search/find-similar.js +509 -0
- package/dist/search/find-similar.js.map +1 -0
- package/dist/search/highlights.d.ts +19 -0
- package/dist/search/highlights.d.ts.map +1 -0
- package/dist/search/highlights.js +167 -0
- package/dist/search/highlights.js.map +1 -0
- package/dist/search/language-filter.d.ts +29 -0
- package/dist/search/language-filter.d.ts.map +1 -0
- package/dist/search/language-filter.js +126 -0
- package/dist/search/language-filter.js.map +1 -0
- package/dist/search/legacy/searxng-orchestrator.d.ts +4 -0
- package/dist/search/legacy/searxng-orchestrator.d.ts.map +1 -0
- package/dist/search/legacy/searxng-orchestrator.js +501 -0
- package/dist/search/legacy/searxng-orchestrator.js.map +1 -0
- package/dist/search/legacy/searxng-provider.d.ts +7 -0
- package/dist/search/legacy/searxng-provider.d.ts.map +1 -0
- package/dist/search/legacy/searxng-provider.js +11 -0
- package/dist/search/legacy/searxng-provider.js.map +1 -0
- package/dist/search/multi-query.d.ts +25 -0
- package/dist/search/multi-query.d.ts.map +1 -0
- package/dist/search/multi-query.js +228 -0
- package/dist/search/multi-query.js.map +1 -0
- package/dist/search/query.js +32 -34
- package/dist/search/query.js.map +1 -1
- package/dist/search/rerank.d.ts +3 -1
- package/dist/search/rerank.d.ts.map +1 -1
- package/dist/search/rerank.js +44 -35
- package/dist/search/rerank.js.map +1 -1
- package/dist/search/reranker/authority-boost.d.ts +3 -0
- package/dist/search/reranker/authority-boost.d.ts.map +1 -0
- package/dist/search/reranker/authority-boost.js +179 -0
- package/dist/search/reranker/authority-boost.js.map +1 -0
- package/dist/search/reranker/consensus-boost.d.ts +3 -0
- package/dist/search/reranker/consensus-boost.d.ts.map +1 -0
- package/dist/search/reranker/consensus-boost.js +27 -0
- package/dist/search/reranker/consensus-boost.js.map +1 -0
- package/dist/search/reranker/recency-boost.d.ts +3 -0
- package/dist/search/reranker/recency-boost.d.ts.map +1 -0
- package/dist/search/reranker/recency-boost.js +13 -0
- package/dist/search/reranker/recency-boost.js.map +1 -0
- package/dist/search/reranker/recency.d.ts +3 -0
- package/dist/search/reranker/recency.d.ts.map +1 -0
- package/dist/search/reranker/recency.js +23 -0
- package/dist/search/reranker/recency.js.map +1 -0
- package/dist/search/reranker/transformers-rerank-provider.d.ts +13 -0
- package/dist/search/reranker/transformers-rerank-provider.d.ts.map +1 -0
- package/dist/search/reranker/transformers-rerank-provider.js +94 -0
- package/dist/search/reranker/transformers-rerank-provider.js.map +1 -0
- package/dist/search/rrf.d.ts +17 -0
- package/dist/search/rrf.d.ts.map +1 -0
- package/dist/search/rrf.js +39 -0
- package/dist/search/rrf.js.map +1 -0
- package/dist/search/sampling.d.ts +25 -0
- package/dist/search/sampling.d.ts.map +1 -0
- package/dist/search/sampling.js +52 -0
- package/dist/search/sampling.js.map +1 -0
- package/dist/search/searxng.d.ts.map +1 -1
- package/dist/search/searxng.js +69 -79
- package/dist/search/searxng.js.map +1 -1
- package/dist/search/tokens.d.ts +3 -0
- package/dist/search/tokens.d.ts.map +1 -0
- package/dist/search/tokens.js +39 -0
- package/dist/search/tokens.js.map +1 -0
- package/dist/search/truncate.d.ts +6 -0
- package/dist/search/truncate.d.ts.map +1 -0
- package/dist/search/truncate.js +26 -0
- package/dist/search/truncate.js.map +1 -0
- package/dist/search/url-unwrap.d.ts +3 -0
- package/dist/search/url-unwrap.d.ts.map +1 -0
- package/dist/search/url-unwrap.js +43 -0
- package/dist/search/url-unwrap.js.map +1 -0
- package/dist/search/v1/context-rank.d.ts +13 -0
- package/dist/search/v1/context-rank.d.ts.map +1 -0
- package/dist/search/v1/context-rank.js +74 -0
- package/dist/search/v1/context-rank.js.map +1 -0
- package/dist/search/v1/engine-base.d.ts +27 -0
- package/dist/search/v1/engine-base.d.ts.map +1 -0
- package/dist/search/v1/engine-base.js +110 -0
- package/dist/search/v1/engine-base.js.map +1 -0
- package/dist/search/v1/intent-router.d.ts +22 -0
- package/dist/search/v1/intent-router.d.ts.map +1 -0
- package/dist/search/v1/intent-router.js +138 -0
- package/dist/search/v1/intent-router.js.map +1 -0
- package/dist/search/v1/orchestrator.d.ts +24 -0
- package/dist/search/v1/orchestrator.d.ts.map +1 -0
- package/dist/search/v1/orchestrator.js +163 -0
- package/dist/search/v1/orchestrator.js.map +1 -0
- package/dist/search/v1/recency-boost.d.ts +9 -0
- package/dist/search/v1/recency-boost.d.ts.map +1 -0
- package/dist/search/v1/recency-boost.js +37 -0
- package/dist/search/v1/recency-boost.js.map +1 -0
- package/dist/search/v1/recent-cache-dedup.d.ts +6 -0
- package/dist/search/v1/recent-cache-dedup.d.ts.map +1 -0
- package/dist/search/v1/recent-cache-dedup.js +85 -0
- package/dist/search/v1/recent-cache-dedup.js.map +1 -0
- package/dist/search/v1/rss/feed-config.d.ts +21 -0
- package/dist/search/v1/rss/feed-config.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-config.js +90 -0
- package/dist/search/v1/rss/feed-config.js.map +1 -0
- package/dist/search/v1/rss/feed-parser.d.ts +14 -0
- package/dist/search/v1/rss/feed-parser.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-parser.js +104 -0
- package/dist/search/v1/rss/feed-parser.js.map +1 -0
- package/dist/search/v1/rss/feed-poller.d.ts +22 -0
- package/dist/search/v1/rss/feed-poller.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-poller.js +102 -0
- package/dist/search/v1/rss/feed-poller.js.map +1 -0
- package/dist/search/v1/rss/feed-store.d.ts +30 -0
- package/dist/search/v1/rss/feed-store.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-store.js +134 -0
- package/dist/search/v1/rss/feed-store.js.map +1 -0
- package/dist/search/v1/rss/rss-engine.d.ts +6 -0
- package/dist/search/v1/rss/rss-engine.d.ts.map +1 -0
- package/dist/search/v1/rss/rss-engine.js +28 -0
- package/dist/search/v1/rss/rss-engine.js.map +1 -0
- package/dist/search/v1/v1-provider.d.ts +7 -0
- package/dist/search/v1/v1-provider.d.ts.map +1 -0
- package/dist/search/v1/v1-provider.js +68 -0
- package/dist/search/v1/v1-provider.js.map +1 -0
- package/dist/search/v1/verticals/code.d.ts +4 -0
- package/dist/search/v1/verticals/code.d.ts.map +1 -0
- package/dist/search/v1/verticals/code.js +20 -0
- package/dist/search/v1/verticals/code.js.map +1 -0
- package/dist/search/v1/verticals/docs.d.ts +4 -0
- package/dist/search/v1/verticals/docs.d.ts.map +1 -0
- package/dist/search/v1/verticals/docs.js +20 -0
- package/dist/search/v1/verticals/docs.js.map +1 -0
- package/dist/search/v1/verticals/general.d.ts +4 -0
- package/dist/search/v1/verticals/general.d.ts.map +1 -0
- package/dist/search/v1/verticals/general.js +22 -0
- package/dist/search/v1/verticals/general.js.map +1 -0
- package/dist/search/v1/verticals/news.d.ts +10 -0
- package/dist/search/v1/verticals/news.d.ts.map +1 -0
- package/dist/search/v1/verticals/news.js +52 -0
- package/dist/search/v1/verticals/news.js.map +1 -0
- package/dist/search/v1/verticals/papers.d.ts +4 -0
- package/dist/search/v1/verticals/papers.d.ts.map +1 -0
- package/dist/search/v1/verticals/papers.js +23 -0
- package/dist/search/v1/verticals/papers.js.map +1 -0
- package/dist/search/validator.js +31 -31
- package/dist/search/validator.js.map +1 -1
- package/dist/searxng/bootstrap.d.ts +30 -0
- package/dist/searxng/bootstrap.d.ts.map +1 -1
- package/dist/searxng/bootstrap.js +223 -85
- package/dist/searxng/bootstrap.js.map +1 -1
- package/dist/searxng/docker.d.ts.map +1 -1
- package/dist/searxng/docker.js +69 -60
- package/dist/searxng/docker.js.map +1 -1
- package/dist/searxng/process.d.ts +13 -1
- package/dist/searxng/process.d.ts.map +1 -1
- package/dist/searxng/process.js +231 -164
- package/dist/searxng/process.js.map +1 -1
- package/dist/server/backend-status.d.ts +13 -0
- package/dist/server/backend-status.d.ts.map +1 -0
- package/dist/server/backend-status.js +40 -0
- package/dist/server/backend-status.js.map +1 -0
- package/dist/server/tool-schemas.d.ts +549 -0
- package/dist/server/tool-schemas.d.ts.map +1 -0
- package/dist/server/tool-schemas.js +464 -0
- package/dist/server/tool-schemas.js.map +1 -0
- package/dist/server/warmup-on-start.d.ts +9 -0
- package/dist/server/warmup-on-start.d.ts.map +1 -0
- package/dist/server/warmup-on-start.js +55 -0
- package/dist/server/warmup-on-start.js.map +1 -0
- package/dist/server.d.ts +17 -0
- package/dist/server.d.ts.map +1 -1
- package/dist/server.js +454 -297
- package/dist/server.js.map +1 -1
- package/dist/tools/agent.d.ts +5 -0
- package/dist/tools/agent.d.ts.map +1 -0
- package/dist/tools/agent.js +128 -0
- package/dist/tools/agent.js.map +1 -0
- package/dist/tools/cache.d.ts +2 -1
- package/dist/tools/cache.d.ts.map +1 -1
- package/dist/tools/cache.js +177 -44
- package/dist/tools/cache.js.map +1 -1
- package/dist/tools/crawl.d.ts.map +1 -1
- package/dist/tools/crawl.js +171 -88
- package/dist/tools/crawl.js.map +1 -1
- package/dist/tools/extract.d.ts +2 -2
- package/dist/tools/extract.d.ts.map +1 -1
- package/dist/tools/extract.js +175 -59
- package/dist/tools/extract.js.map +1 -1
- package/dist/tools/fetch.d.ts +2 -2
- package/dist/tools/fetch.d.ts.map +1 -1
- package/dist/tools/fetch.js +174 -68
- package/dist/tools/fetch.js.map +1 -1
- package/dist/tools/find-similar.d.ts +5 -0
- package/dist/tools/find-similar.d.ts.map +1 -0
- package/dist/tools/find-similar.js +127 -0
- package/dist/tools/find-similar.js.map +1 -0
- package/dist/tools/research.d.ts +5 -0
- package/dist/tools/research.d.ts.map +1 -0
- package/dist/tools/research.js +107 -0
- package/dist/tools/research.js.map +1 -0
- package/dist/tools/search.d.ts +10 -2
- package/dist/tools/search.d.ts.map +1 -1
- package/dist/tools/search.js +13 -158
- package/dist/tools/search.js.map +1 -1
- package/dist/types.d.ts +350 -7
- package/dist/types.d.ts.map +1 -1
- package/dist/types.js +6 -1
- package/dist/types.js.map +1 -1
- package/dist/util/mode.d.ts +4 -0
- package/dist/util/mode.d.ts.map +1 -0
- package/dist/util/mode.js +34 -0
- package/dist/util/mode.js.map +1 -0
- package/package.json +78 -8
- package/dist/extraction/trafilatura.d.ts +0 -6
- package/dist/extraction/trafilatura.d.ts.map +0 -1
- package/dist/extraction/trafilatura.js +0 -105
- package/dist/extraction/trafilatura.js.map +0 -1
- package/dist/search/flashrank.d.ts +0 -12
- package/dist/search/flashrank.d.ts.map +0 -1
- package/dist/search/flashrank.js +0 -63
- package/dist/search/flashrank.js.map +0 -1
|
@@ -0,0 +1,269 @@
|
|
|
1
|
+
import { createLogger } from "../logger.js";
|
|
2
|
+
import { decomposeQuestion, extractComparisonEntities } from "./decompose.js";
|
|
3
|
+
import { synthesizeReport } from "./synthesize.js";
|
|
4
|
+
import { synthesizeLocal } from "./synthesis-local.js";
|
|
5
|
+
import { buildResearchBrief } from "./brief.js";
|
|
6
|
+
import { deduplicateResults } from "../search/dedup.js";
|
|
7
|
+
import { rerankResults } from "../search/rerank.js";
|
|
8
|
+
import { applyAllFilters } from "../search/filters.js";
|
|
9
|
+
import { exploreInParallel } from "./branch-exploration.js";
|
|
10
|
+
import { getExtractProvider } from "../providers/extract-provider.js";
|
|
11
|
+
import { truncateSmartly } from "../search/truncate.js";
|
|
12
|
+
import { cacheContent } from "../cache/store.js";
|
|
13
|
+
import { getEmbeddingService } from "../embedding/embed.js";
|
|
14
|
+
import { checkSamplingSupport } from "../search/sampling.js";
|
|
15
|
+
import { isLlmConfigured as isLocalLlmEnabled } from "../integrations/cloud/llm/run.js";
|
|
16
|
+
// Logger shared by every stage of the research pipeline.
const log = createLogger("research");

// Per-depth sizing: how many sub-queries to generate and the source-count
// bounds for that depth.
const DEPTH_CONFIG = {
  quick: {
    subQueries: 2,
    minSources: 5,
    maxSources: 8
  },
  standard: {
    subQueries: 4,
    minSources: 10,
    maxSources: 15
  },
  comprehensive: {
    subQueries: 7,
    minSources: 20,
    maxSources: 25
  }
};

// Per-depth wall-clock budget (milliseconds) for the whole sub-query fan-out.
const SEARCH_TOTAL_BUDGET_MS = {
  quick: 15_000,
  standard: 30_000,
  comprehensive: 60_000
};

// Per-depth wall-clock budget (milliseconds) for a single sub-query.
const SEARCH_PER_QUERY_BUDGET_MS = {
  quick: 8_000,
  standard: 10_000,
  comprehensive: 15_000
};

// Character caps applied to fetched source text: one source, and all sources combined.
const PER_SOURCE_CHAR_CAP = 3_000;
const TOTAL_SOURCES_CHAR_CAP = 40_000;
|
|
34
|
+
/**
 * Runs the research flow for one question: decompose it into sub-queries,
 * search each sub-query across the engines, dedupe/filter/rerank the hits,
 * fetch the top sources, and synthesize a report with citations.
 *
 * Errors thrown by any stage are caught, logged, and reported through the
 * `error` field of an otherwise empty result instead of being rethrown.
 *
 * @param input   Request object; reads `question`, `depth`, `max_sources`,
 *                `include_domains` and `exclude_domains`.
 * @param engines Search engines, each exposing `name` and `search(query, opts)`.
 * @param router  Fetch router handed to `fetchSources`.
 * @param server  Optional server handle forwarded to decomposition, synthesis
 *                and the sampling-support check.
 * @returns An object with `report`, `citations`, `sources`, `sub_queries`,
 *          `depth`, `total_time_ms`, `sampling_supported`, plus `brief` when
 *          one was built or `error` when the pipeline failed.
 */
async function runResearchPipeline(input, engines, router, server) {
  const start = Date.now();
  const depth = input.depth ?? "standard";
  const config = DEPTH_CONFIG[depth] ?? DEPTH_CONFIG.standard;
  const maxSources = input.max_sources ?? config.maxSources;

  const describeError = (err) => (err instanceof Error ? err.message : String(err));
  // Deliberately a thunk: the check is evaluated at each return site.
  const samplingSupported = () => !!server && checkSamplingSupport(server);

  try {
    log.info("research pipeline started", { question: input.question, depth });

    // Phase 1: split the question into sub-queries.
    const decomposition = await decomposeQuestion(input.question, depth, server);
    const { subQueries, queryType } = decomposition;
    log.info("decomposition complete", {
      subQueryCount: subQueries.length,
      samplingUsed: decomposition.samplingUsed,
      queryType
    });

    // Phase 2: fan the sub-queries out over the engines. With three or more
    // sub-queries only the first two engines are used.
    let activeEngines = engines;
    if (subQueries.length >= 3 && engines.length > 2) {
      activeEngines = engines.slice(0, 2);
    }
    const perEngineMaxResults = Math.ceil(maxSources / subQueries.length) * 2;

    const searchBranch = async (subQuery, signal) => {
      const hits = [];
      const respondedEngines = /* @__PURE__ */ new Set();
      const engineOpts = {
        maxResults: perEngineMaxResults,
        includeDomains: input.include_domains,
        excludeDomains: input.exclude_domains
      };
      const attempts = activeEngines.map(async (engine) => {
        if (signal.aborted) {
          return;
        }
        try {
          const found = await engine.search(subQuery, engineOpts);
          for (const hit of found) {
            hits.push(hit);
          }
          respondedEngines.add(engine.name);
        } catch (err) {
          // One failing engine must not sink the whole sub-query.
          log.warn("research engine search failed", {
            engine: engine.name,
            query: subQuery,
            error: describeError(err)
          });
        }
      });
      await Promise.allSettled(attempts);
      return { results: hits, enginesUsed: [...respondedEngines] };
    };

    const branchResults = await exploreInParallel(subQueries, searchBranch, {
      maxConcurrent: 3,
      totalBudgetMs: SEARCH_TOTAL_BUDGET_MS[depth] ?? SEARCH_TOTAL_BUDGET_MS.standard,
      perQueryBudgetMs: SEARCH_PER_QUERY_BUDGET_MS[depth] ?? SEARCH_PER_QUERY_BUDGET_MS.standard
    });

    // Collapse the per-branch outcomes into one hit list, one engine set and
    // a list of branch-level failures.
    const allRaw = [];
    const enginesUsed = /* @__PURE__ */ new Set();
    const searchErrors = [];
    for (const branch of branchResults) {
      if (branch.ok && branch.result) {
        allRaw.push(...branch.result.results);
        for (const engineName of branch.result.enginesUsed) {
          enginesUsed.add(engineName);
        }
      } else if (branch.error) {
        searchErrors.push(`${branch.query}: ${branch.error}`);
      }
    }
    if (searchErrors.length > 0) {
      log.warn("some search sub-queries failed", { errors: searchErrors });
    }
    log.info("search phase complete", { totalRaw: allRaw.length, engines: [...enginesUsed] });

    // Phase 3: dedupe, apply domain filters, rerank against the original
    // question, then keep the top `maxSources`.
    const deduped = deduplicateResults(allRaw);
    const filtered = applyAllFilters(deduped, {
      includeDomains: input.include_domains,
      excludeDomains: input.exclude_domains
    });
    const reranked = await rerankResults(input.question, filtered);
    const merged = reranked.slice(0, maxSources);

    if (merged.length === 0) {
      return {
        report: `## Research: ${input.question}\n\nNo sources could be found for this query.`,
        citations: [],
        sources: [],
        sub_queries: subQueries,
        depth,
        total_time_ms: Date.now() - start,
        sampling_supported: samplingSupported()
      };
    }

    // Phase 4: fetch the selected sources and enforce the character budget.
    const sources = await fetchSources(merged, router, maxSources);
    applySourceBudget(sources, PER_SOURCE_CHAR_CAP, TOTAL_SOURCES_CHAR_CAP);
    log.info("fetch phase complete", {
      fetched: sources.filter((s) => s.fetched).length,
      failed: sources.filter((s) => !s.fetched).length
    });

    // Phase 5: synthesize the report.
    const synthesisResult = await synthesizeReport(input.question, sources, depth, server);
    log.info("synthesis complete", {
      samplingUsed: synthesisResult.samplingUsed,
      reportLength: synthesisResult.report.length
    });

    let finalReport = synthesisResult.report;
    let finalCitations = synthesisResult.citations;
    let localSynthesisText;

    // When sampling was not used and an LLM is configured, try the local
    // synthesis path; on failure the report from synthesizeReport is kept.
    if (!synthesisResult.samplingUsed && isLocalLlmEnabled()) {
      try {
        const hasContent = (s) => s.fetched && s.markdown_content.length > 0;
        const toLocalSource = (s) => ({ url: s.url, title: s.title, markdown: s.markdown_content });
        const localSources = sources.filter(hasContent).map(toLocalSource);

        if (localSources.length > 0) {
          const local = await synthesizeLocal(input.question, localSources);
          finalReport = local.text;
          localSynthesisText = local.text;

          // Citation indices from local synthesis are zero-based positions in
          // `localSources`; out-of-range ones are dropped and the emitted
          // `index` is one-based.
          const inRange = (idx) => idx >= 0 && idx < localSources.length;
          const toCitation = (idx) => {
            const cited = localSources[idx];
            return {
              index: idx + 1,
              url: cited.url,
              title: cited.title,
              snippet: cited.markdown.slice(0, 200)
            };
          };
          finalCitations = local.citations.filter(inRange).map(toCitation);
          log.info("local synthesis succeeded", { reportLength: finalReport.length });
        }
      } catch (err) {
        log.warn("local LLM synthesis failed; using heuristic fallback", {
          error: describeError(err)
        });
      }
    }

    const comparisonEntities =
      queryType === "comparison" ? extractComparisonEntities(input.question).entities : [];

    // A brief is only built when sampling did not produce the report.
    let brief;
    if (!synthesisResult.samplingUsed) {
      brief = await buildResearchBrief(
        input.question,
        sources,
        subQueries,
        PER_SOURCE_CHAR_CAP,
        TOTAL_SOURCES_CHAR_CAP,
        queryType,
        comparisonEntities,
        localSynthesisText
      );
    }

    const output = {
      report: finalReport,
      citations: finalCitations,
      sources,
      sub_queries: subQueries,
      depth,
      total_time_ms: Date.now() - start,
      sampling_supported: samplingSupported()
    };
    if (brief) {
      output.brief = brief;
    }
    return output;
  } catch (err) {
    log.error("research pipeline failed", {
      question: input.question,
      error: describeError(err)
    });
    return {
      report: "",
      citations: [],
      sources: [],
      sub_queries: [],
      depth,
      total_time_ms: Date.now() - start,
      sampling_supported: samplingSupported(),
      error: describeError(err)
    };
  }
}
|
|
198
|
+
/**
 * Fetches one URL through the router, rejecting with "fetch timeout" if the
 * router has not settled within `timeoutMs`. The timer is always cleared once
 * the race settles, so no pending timer outlives the call.
 */
async function fetchWithTimeout(router, url, timeoutMs) {
  let timer;
  try {
    return await Promise.race([
      router.fetch(url, { renderJs: "auto" }),
      new Promise((_, reject) => {
        timer = setTimeout(() => reject(new Error("fetch timeout")), timeoutMs);
      })
    ]);
  } finally {
    // clearTimeout(undefined) is a no-op, so this is safe even if
    // router.fetch threw synchronously before the timer was armed.
    clearTimeout(timer);
  }
}

/**
 * Fetches and extracts the first `maxSources` search results in parallel.
 *
 * Each result yields exactly one source entry, in input order. A result whose
 * fetch or extraction fails is not dropped: it falls back to the search
 * snippet with `fetched: false` and the failure message in `fetch_error`.
 * Caching and embedding are best-effort side effects that never fail a source.
 *
 * @param merged     Ranked search results; reads `url`, `title`, `snippet`
 *                   and `relevance_score` from each.
 * @param router     Object exposing `fetch(url, opts)`; the resolved value is
 *                   read for `html`, `finalUrl` and `contentType`.
 * @param maxSources Maximum number of results to fetch.
 * @returns Promise of an array of `{ url, title, markdown_content,
 *          relevance_score, fetched, fetch_error? }`.
 */
async function fetchSources(merged, router, maxSources) {
  const fetchTimeoutMs = 15e3;
  const describeError = (err) => (err instanceof Error ? err.message : String(err));

  const fetchPromises = merged.slice(0, maxSources).map(async (result) => {
    try {
      const raw = await fetchWithTimeout(router, result.url, fetchTimeoutMs);
      const extractor = await getExtractProvider();
      const extraction = await extractor.extract(raw.html, raw.finalUrl, {
        maxChars: 3e4,
        contentType: raw.contentType
      });
      const truncated = truncateSmartly(extraction.markdown, PER_SOURCE_CHAR_CAP);

      // Best-effort: a cache write failure must not lose the fetched source.
      try {
        cacheContent(raw, extraction);
      } catch (err) {
        log.warn("failed to cache research source", { url: result.url, error: String(err) });
      }

      // Best-effort, fire-and-forget embedding of the full (untruncated)
      // markdown. If embedAsync returns a promise, its rejection is logged
      // here instead of surfacing as an unhandled rejection.
      try {
        const embeddingService = getEmbeddingService();
        if (embeddingService.isAvailable()) {
          Promise.resolve(embeddingService.embedAsync(raw.finalUrl, extraction.markdown)).catch((err) => {
            log.debug("embedding hook skipped for research source", { error: String(err) });
          });
        }
      } catch (err) {
        log.debug("embedding hook skipped for research source", { error: String(err) });
      }

      return {
        url: result.url,
        title: extraction.title || result.title,
        markdown_content: truncated,
        relevance_score: result.relevance_score,
        fetched: true
      };
    } catch (err) {
      log.debug("failed to fetch research source", {
        url: result.url,
        error: describeError(err)
      });
      // Degrade to the search snippet so the source still contributes.
      return {
        url: result.url,
        title: result.title,
        markdown_content: result.snippet,
        relevance_score: result.relevance_score,
        fetched: false,
        fetch_error: describeError(err)
      };
    }
  });
  return Promise.all(fetchPromises);
}
|
|
250
|
+
/**
 * Trims source text in place so that no source exceeds `perSourceCap`
 * characters and the running total stays within `totalCap`.
 *
 * Sources are processed in order. Once the total budget is spent, the text of
 * every remaining source is blanked. Sources with empty text are skipped.
 *
 * @param sources      Objects whose `markdown_content` is read and rewritten.
 * @param perSourceCap Maximum characters allowed for a single source.
 * @param totalCap     Maximum characters allowed across all sources.
 */
function applySourceBudget(sources, perSourceCap, totalCap) {
  let spent = 0;
  for (const source of sources) {
    const text = source.markdown_content;
    if (!text) {
      continue;
    }
    if (spent >= totalCap) {
      // Budget exhausted: later sources contribute no text at all.
      source.markdown_content = "";
      continue;
    }
    // A source gets its own cap or whatever is left of the total, whichever is smaller.
    const allowance = Math.min(perSourceCap, totalCap - spent);
    if (text.length > allowance) {
      source.markdown_content = truncateSmartly(text, allowance);
    }
    spent += source.markdown_content.length;
  }
}
|
|
266
|
+
export {
|
|
267
|
+
runResearchPipeline
|
|
268
|
+
};
|
|
269
|
+
//# sourceMappingURL=pipeline.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../src/research/pipeline.ts"],"sourcesContent":["import { createLogger } from '../logger.js';\nimport { decomposeQuestion, detectQueryType, extractComparisonEntities, type QueryType } from './decompose.js';\nimport { synthesizeReport } from './synthesize.js';\nimport { synthesizeLocal } from './synthesis-local.js';\nimport { buildResearchBrief } from './brief.js';\nimport { deduplicateResults } from '../search/dedup.js';\nimport { rerankResults } from '../search/rerank.js';\nimport { applyAllFilters } from '../search/filters.js';\nimport { exploreInParallel } from './branch-exploration.js';\nimport type { RawSearchResult, SearchEngineOptions } from '../types.js';\nimport { getExtractProvider } from '../providers/extract-provider.js';\nimport { truncateSmartly } from '../search/truncate.js';\nimport { cacheContent } from '../cache/store.js';\nimport { getEmbeddingService } from '../embedding/embed.js';\nimport { checkSamplingSupport, type SamplingCapableServer } from '../search/sampling.js';\nimport { isLlmConfigured as isLocalLlmEnabled } from '../integrations/cloud/llm/run.js';\nimport type {\n ResearchInput,\n ResearchOutput,\n ResearchSource,\n SearchEngine,\n Citation,\n} from '../types.js';\nimport type { SmartRouter } from '../fetch/router.js';\n\nconst log = createLogger('research');\n\nconst DEPTH_CONFIG: Record<string, { subQueries: number; minSources: number; maxSources: number }> = {\n quick: { subQueries: 2, minSources: 5, maxSources: 8 },\n standard: { subQueries: 4, minSources: 10, maxSources: 15 },\n comprehensive: { subQueries: 7, minSources: 20, maxSources: 25 },\n};\n\n// Per-depth budgets for the sub-query fan-out. 
exploreInParallel guarantees\n// a single slow sub-query can't burn the whole research budget — comprehensive\n// runs cap at ~60s total and 15s per sub-query.\nconst SEARCH_TOTAL_BUDGET_MS: Record<string, number> = {\n quick: 15_000,\n standard: 30_000,\n comprehensive: 60_000,\n};\nconst SEARCH_PER_QUERY_BUDGET_MS: Record<string, number> = {\n quick: 8_000,\n standard: 10_000,\n comprehensive: 15_000,\n};\n\nconst PER_SOURCE_CHAR_CAP = 3000;\nconst TOTAL_SOURCES_CHAR_CAP = 40000;\n\nexport async function runResearchPipeline(\n input: ResearchInput,\n engines: SearchEngine[],\n router: SmartRouter,\n server?: SamplingCapableServer,\n): Promise<ResearchOutput> {\n const start = Date.now();\n const depth = input.depth ?? 'standard';\n const config = DEPTH_CONFIG[depth] ?? DEPTH_CONFIG.standard;\n const maxSources = input.max_sources ?? config.maxSources;\n\n try {\n // Phase 1: Decompose question into sub-queries\n log.info('research pipeline started', { question: input.question, depth });\n const decomposeResult = await decomposeQuestion(\n input.question,\n depth as 'quick' | 'standard' | 'comprehensive',\n server,\n );\n const subQueries = decomposeResult.subQueries;\n const queryType = decomposeResult.queryType;\n log.info('decomposition complete', { subQueryCount: subQueries.length, samplingUsed: decomposeResult.samplingUsed, queryType });\n\n // Phase 2: Parallel search across sub-queries with per-query + total\n // budget enforcement via exploreInParallel. A single hung engine no\n // longer wedges the whole research call — the per-query timer aborts\n // it and the rest of the fan-out keeps going. Engine cap when\n // sub-queries are many preserves the multi-query.ts invariant.\n const effEngines = subQueries.length >= 3 && engines.length > 2 ? 
engines.slice(0, 2) : engines;\n const perEngineMaxResults = Math.ceil(maxSources / subQueries.length) * 2;\n\n const branchResults = await exploreInParallel(\n subQueries,\n async (subQuery, signal) => {\n const results: RawSearchResult[] = [];\n const usedHere = new Set<string>();\n const engineOpts: SearchEngineOptions = {\n maxResults: perEngineMaxResults,\n includeDomains: input.include_domains,\n excludeDomains: input.exclude_domains,\n };\n\n await Promise.allSettled(\n effEngines.map(async (engine) => {\n if (signal.aborted) return;\n try {\n const rs = await engine.search(subQuery, engineOpts);\n for (const r of rs) results.push(r);\n usedHere.add(engine.name);\n } catch (err) {\n log.warn('research engine search failed', {\n engine: engine.name,\n query: subQuery,\n error: err instanceof Error ? err.message : String(err),\n });\n }\n }),\n );\n\n return { results, enginesUsed: [...usedHere] };\n },\n {\n maxConcurrent: 3,\n totalBudgetMs: SEARCH_TOTAL_BUDGET_MS[depth] ?? SEARCH_TOTAL_BUDGET_MS.standard,\n perQueryBudgetMs: SEARCH_PER_QUERY_BUDGET_MS[depth] ?? 
SEARCH_PER_QUERY_BUDGET_MS.standard,\n },\n );\n\n const allRaw: RawSearchResult[] = [];\n const enginesUsed = new Set<string>();\n const searchErrors: string[] = [];\n for (const br of branchResults) {\n if (br.ok && br.result) {\n allRaw.push(...br.result.results);\n for (const e of br.result.enginesUsed) enginesUsed.add(e);\n } else if (br.error) {\n searchErrors.push(`${br.query}: ${br.error}`);\n }\n }\n if (searchErrors.length > 0) {\n log.warn('some search sub-queries failed', { errors: searchErrors });\n }\n\n log.info('search phase complete', { totalRaw: allRaw.length, engines: [...enginesUsed] });\n\n // Phase 3: Deduplicate, filter, rerank\n let merged = deduplicateResults(allRaw);\n\n merged = applyAllFilters(merged, {\n includeDomains: input.include_domains,\n excludeDomains: input.exclude_domains,\n });\n\n merged = await rerankResults(input.question, merged);\n merged = merged.slice(0, maxSources);\n\n if (merged.length === 0) {\n return {\n report: `## Research: ${input.question}\\n\\nNo sources could be found for this query.`,\n citations: [],\n sources: [],\n sub_queries: subQueries,\n depth,\n total_time_ms: Date.now() - start,\n sampling_supported: !!server && checkSamplingSupport(server),\n };\n }\n\n // Phase 4: Fetch top sources in parallel\n const sources: ResearchSource[] = await fetchSources(merged, router, maxSources);\n applySourceBudget(sources, PER_SOURCE_CHAR_CAP, TOTAL_SOURCES_CHAR_CAP);\n log.info('fetch phase complete', {\n fetched: sources.filter((s) => s.fetched).length,\n failed: sources.filter((s) => !s.fetched).length,\n });\n\n // Phase 5: Synthesize report\n const synthesisResult = await synthesizeReport(\n input.question,\n sources,\n depth as 'quick' | 'standard' | 'comprehensive',\n server,\n );\n log.info('synthesis complete', { samplingUsed: synthesisResult.samplingUsed, reportLength: synthesisResult.report.length });\n\n // Phase 5b: Local-LLM synthesis fallback — only when host LLM did not\n // produce output AND a 
local provider is configured. Failures fall through\n // to the existing heuristic report in synthesisResult.\n let finalReport = synthesisResult.report;\n let finalCitations: Citation[] = synthesisResult.citations;\n let localSynthesisText: string | undefined;\n if (!synthesisResult.samplingUsed && isLocalLlmEnabled()) {\n try {\n const localSources = sources\n .filter((s) => s.fetched && s.markdown_content.length > 0)\n .map((s) => ({ url: s.url, title: s.title, markdown: s.markdown_content }));\n if (localSources.length > 0) {\n const local = await synthesizeLocal(input.question, localSources);\n finalReport = local.text;\n localSynthesisText = local.text;\n finalCitations = local.citations\n .filter((idx) => idx >= 0 && idx < localSources.length)\n .map((idx) => {\n const s = localSources[idx];\n return {\n index: idx + 1,\n url: s.url,\n title: s.title,\n snippet: s.markdown.slice(0, 200),\n };\n });\n log.info('local synthesis succeeded', { reportLength: finalReport.length });\n }\n } catch (err) {\n log.warn('local LLM synthesis failed; using heuristic fallback', {\n error: err instanceof Error ? err.message : String(err),\n });\n }\n }\n\n // Phase 6: Structured brief — populated when internal sampling is\n // unavailable so the host LLM has well-shaped data to write the report\n // from without re-reading raw markdown.\n const comparisonEntities = queryType === 'comparison'\n ? extractComparisonEntities(input.question).entities\n : [];\n const brief = !synthesisResult.samplingUsed\n ? await buildResearchBrief(\n input.question,\n sources,\n subQueries,\n PER_SOURCE_CHAR_CAP,\n TOTAL_SOURCES_CHAR_CAP,\n queryType,\n comparisonEntities,\n localSynthesisText,\n )\n : undefined;\n\n return {\n report: finalReport,\n citations: finalCitations,\n sources,\n sub_queries: subQueries,\n depth,\n total_time_ms: Date.now() - start,\n sampling_supported: !!server && checkSamplingSupport(server),\n ...(brief ? 
{ brief } : {}),\n };\n } catch (err) {\n log.error('research pipeline failed', {\n question: input.question,\n error: err instanceof Error ? err.message : String(err),\n });\n return {\n report: '',\n citations: [],\n sources: [],\n sub_queries: [],\n depth,\n total_time_ms: Date.now() - start,\n sampling_supported: !!server && checkSamplingSupport(server),\n error: err instanceof Error ? err.message : String(err),\n };\n }\n}\n\ninterface MergedResult {\n title: string;\n url: string;\n snippet: string;\n relevance_score: number;\n engines: string[];\n}\n\nasync function fetchSources(\n merged: MergedResult[],\n router: SmartRouter,\n maxSources: number,\n): Promise<ResearchSource[]> {\n const fetchPromises = merged.slice(0, maxSources).map(async (result): Promise<ResearchSource> => {\n try {\n const raw = await Promise.race([\n router.fetch(result.url, { renderJs: 'auto' }),\n new Promise<never>((_, reject) =>\n setTimeout(() => reject(new Error('fetch timeout')), 15000),\n ),\n ]);\n\n const extractor = await getExtractProvider();\n const extraction = await extractor.extract(raw.html, raw.finalUrl, {\n maxChars: 30000,\n contentType: raw.contentType,\n });\n const truncated = truncateSmartly(extraction.markdown, PER_SOURCE_CHAR_CAP);\n\n try {\n cacheContent(raw, extraction);\n } catch (err) {\n log.warn('failed to cache research source', { url: result.url, error: String(err) });\n }\n\n try {\n const embeddingService = getEmbeddingService();\n if (embeddingService.isAvailable()) {\n embeddingService.embedAsync(raw.finalUrl, extraction.markdown);\n }\n } catch (err) {\n log.debug('embedding hook skipped for research source', { error: String(err) });\n }\n\n return {\n url: result.url,\n title: extraction.title || result.title,\n markdown_content: truncated,\n relevance_score: result.relevance_score,\n fetched: true,\n };\n } catch (err) {\n log.debug('failed to fetch research source', {\n url: result.url,\n error: err instanceof Error ? 
err.message : String(err),\n });\n return {\n url: result.url,\n title: result.title,\n markdown_content: result.snippet,\n relevance_score: result.relevance_score,\n fetched: false,\n fetch_error: err instanceof Error ? err.message : String(err),\n };\n }\n });\n\n return Promise.all(fetchPromises);\n}\n\n// Cap total returned markdown_content across sources in relevance order.\n// Later (lower-relevance) sources get trimmed further when budget runs low;\n// any source past the cap is set to empty content (caller still sees url/title).\nfunction applySourceBudget(\n sources: ResearchSource[],\n perSourceCap: number,\n totalCap: number,\n): void {\n let used = 0;\n for (const s of sources) {\n if (!s.markdown_content) continue;\n if (used >= totalCap) {\n s.markdown_content = '';\n continue;\n }\n const remaining = totalCap - used;\n const cap = Math.min(perSourceCap, remaining);\n if (s.markdown_content.length > cap) {\n s.markdown_content = truncateSmartly(s.markdown_content, cap);\n }\n used += s.markdown_content.length;\n 
}\n}\n"],"mappings":"AAAA,SAAS,oBAAoB;AAC7B,SAAS,mBAAoC,iCAAiD;AAC9F,SAAS,wBAAwB;AACjC,SAAS,uBAAuB;AAChC,SAAS,0BAA0B;AACnC,SAAS,0BAA0B;AACnC,SAAS,qBAAqB;AAC9B,SAAS,uBAAuB;AAChC,SAAS,yBAAyB;AAElC,SAAS,0BAA0B;AACnC,SAAS,uBAAuB;AAChC,SAAS,oBAAoB;AAC7B,SAAS,2BAA2B;AACpC,SAAS,4BAAwD;AACjE,SAAS,mBAAmB,yBAAyB;AAUrD,MAAM,MAAM,aAAa,UAAU;AAEnC,MAAM,eAA+F;AAAA,EACnG,OAAO,EAAE,YAAY,GAAG,YAAY,GAAG,YAAY,EAAE;AAAA,EACrD,UAAU,EAAE,YAAY,GAAG,YAAY,IAAI,YAAY,GAAG;AAAA,EAC1D,eAAe,EAAE,YAAY,GAAG,YAAY,IAAI,YAAY,GAAG;AACjE;AAKA,MAAM,yBAAiD;AAAA,EACrD,OAAO;AAAA,EACP,UAAU;AAAA,EACV,eAAe;AACjB;AACA,MAAM,6BAAqD;AAAA,EACzD,OAAO;AAAA,EACP,UAAU;AAAA,EACV,eAAe;AACjB;AAEA,MAAM,sBAAsB;AAC5B,MAAM,yBAAyB;AAE/B,eAAsB,oBACpB,OACA,SACA,QACA,QACyB;AACzB,QAAM,QAAQ,KAAK,IAAI;AACvB,QAAM,QAAQ,MAAM,SAAS;AAC7B,QAAM,SAAS,aAAa,KAAK,KAAK,aAAa;AACnD,QAAM,aAAa,MAAM,eAAe,OAAO;AAE/C,MAAI;AAEF,QAAI,KAAK,6BAA6B,EAAE,UAAU,MAAM,UAAU,MAAM,CAAC;AACzE,UAAM,kBAAkB,MAAM;AAAA,MAC5B,MAAM;AAAA,MACN;AAAA,MACA;AAAA,IACF;AACA,UAAM,aAAa,gBAAgB;AACnC,UAAM,YAAY,gBAAgB;AAClC,QAAI,KAAK,0BAA0B,EAAE,eAAe,WAAW,QAAQ,cAAc,gBAAgB,cAAc,UAAU,CAAC;AAO9H,UAAM,aAAa,WAAW,UAAU,KAAK,QAAQ,SAAS,IAAI,QAAQ,MAAM,GAAG,CAAC,IAAI;AACxF,UAAM,sBAAsB,KAAK,KAAK,aAAa,WAAW,MAAM,IAAI;AAExE,UAAM,gBAAgB,MAAM;AAAA,MAC1B;AAAA,MACA,OAAO,UAAU,WAAW;AAC1B,cAAM,UAA6B,CAAC;AACpC,cAAM,WAAW,oBAAI,IAAY;AACjC,cAAM,aAAkC;AAAA,UACtC,YAAY;AAAA,UACZ,gBAAgB,MAAM;AAAA,UACtB,gBAAgB,MAAM;AAAA,QACxB;AAEA,cAAM,QAAQ;AAAA,UACZ,WAAW,IAAI,OAAO,WAAW;AAC/B,gBAAI,OAAO,QAAS;AACpB,gBAAI;AACF,oBAAM,KAAK,MAAM,OAAO,OAAO,UAAU,UAAU;AACnD,yBAAW,KAAK,GAAI,SAAQ,KAAK,CAAC;AAClC,uBAAS,IAAI,OAAO,IAAI;AAAA,YAC1B,SAAS,KAAK;AACZ,kBAAI,KAAK,iCAAiC;AAAA,gBACxC,QAAQ,OAAO;AAAA,gBACf,OAAO;AAAA,gBACP,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,cACxD,CAAC;AAAA,YACH;AAAA,UACF,CAAC;AAAA,QACH;AAEA,eAAO,EAAE,SAAS,aAAa,CAAC,GAAG,QAAQ,EAAE;AAAA,MAC/C;AAAA,MACA;AAAA,QACE,eAAe;AAAA,QACf,eAAe,uBAAuB,KAAK,KAAK,uBAAuB;AAAA,QACvE,kBAAkB,2BAA2B,KAAK,KAAK,2BAA2B;AAAA,MACpF;AAAA,IACF;AAEA,UAAM,SAA4B,CAAC;AACnC,UAAM,cAAc,oBAAI,IAAY;AACpC
,UAAM,eAAyB,CAAC;AAChC,eAAW,MAAM,eAAe;AAC9B,UAAI,GAAG,MAAM,GAAG,QAAQ;AACtB,eAAO,KAAK,GAAG,GAAG,OAAO,OAAO;AAChC,mBAAW,KAAK,GAAG,OAAO,YAAa,aAAY,IAAI,CAAC;AAAA,MAC1D,WAAW,GAAG,OAAO;AACnB,qBAAa,KAAK,GAAG,GAAG,KAAK,KAAK,GAAG,KAAK,EAAE;AAAA,MAC9C;AAAA,IACF;AACA,QAAI,aAAa,SAAS,GAAG;AAC3B,UAAI,KAAK,kCAAkC,EAAE,QAAQ,aAAa,CAAC;AAAA,IACrE;AAEA,QAAI,KAAK,yBAAyB,EAAE,UAAU,OAAO,QAAQ,SAAS,CAAC,GAAG,WAAW,EAAE,CAAC;AAGxF,QAAI,SAAS,mBAAmB,MAAM;AAEtC,aAAS,gBAAgB,QAAQ;AAAA,MAC/B,gBAAgB,MAAM;AAAA,MACtB,gBAAgB,MAAM;AAAA,IACxB,CAAC;AAED,aAAS,MAAM,cAAc,MAAM,UAAU,MAAM;AACnD,aAAS,OAAO,MAAM,GAAG,UAAU;AAEnC,QAAI,OAAO,WAAW,GAAG;AACvB,aAAO;AAAA,QACL,QAAQ,gBAAgB,MAAM,QAAQ;AAAA;AAAA;AAAA,QACtC,WAAW,CAAC;AAAA,QACZ,SAAS,CAAC;AAAA,QACV,aAAa;AAAA,QACb;AAAA,QACA,eAAe,KAAK,IAAI,IAAI;AAAA,QAC5B,oBAAoB,CAAC,CAAC,UAAU,qBAAqB,MAAM;AAAA,MAC7D;AAAA,IACF;AAGA,UAAM,UAA4B,MAAM,aAAa,QAAQ,QAAQ,UAAU;AAC/E,sBAAkB,SAAS,qBAAqB,sBAAsB;AACtE,QAAI,KAAK,wBAAwB;AAAA,MAC/B,SAAS,QAAQ,OAAO,CAAC,MAAM,EAAE,OAAO,EAAE;AAAA,MAC1C,QAAQ,QAAQ,OAAO,CAAC,MAAM,CAAC,EAAE,OAAO,EAAE;AAAA,IAC5C,CAAC;AAGD,UAAM,kBAAkB,MAAM;AAAA,MAC5B,MAAM;AAAA,MACN;AAAA,MACA;AAAA,MACA;AAAA,IACF;AACA,QAAI,KAAK,sBAAsB,EAAE,cAAc,gBAAgB,cAAc,cAAc,gBAAgB,OAAO,OAAO,CAAC;AAK1H,QAAI,cAAc,gBAAgB;AAClC,QAAI,iBAA6B,gBAAgB;AACjD,QAAI;AACJ,QAAI,CAAC,gBAAgB,gBAAgB,kBAAkB,GAAG;AACxD,UAAI;AACF,cAAM,eAAe,QAClB,OAAO,CAAC,MAAM,EAAE,WAAW,EAAE,iBAAiB,SAAS,CAAC,EACxD,IAAI,CAAC,OAAO,EAAE,KAAK,EAAE,KAAK,OAAO,EAAE,OAAO,UAAU,EAAE,iBAAiB,EAAE;AAC5E,YAAI,aAAa,SAAS,GAAG;AAC3B,gBAAM,QAAQ,MAAM,gBAAgB,MAAM,UAAU,YAAY;AAChE,wBAAc,MAAM;AACpB,+BAAqB,MAAM;AAC3B,2BAAiB,MAAM,UACpB,OAAO,CAAC,QAAQ,OAAO,KAAK,MAAM,aAAa,MAAM,EACrD,IAAI,CAAC,QAAQ;AACZ,kBAAM,IAAI,aAAa,GAAG;AAC1B,mBAAO;AAAA,cACL,OAAO,MAAM;AAAA,cACb,KAAK,EAAE;AAAA,cACP,OAAO,EAAE;AAAA,cACT,SAAS,EAAE,SAAS,MAAM,GAAG,GAAG;AAAA,YAClC;AAAA,UACF,CAAC;AACH,cAAI,KAAK,6BAA6B,EAAE,cAAc,YAAY,OAAO,CAAC;AAAA,QAC5E;AAAA,MACF,SAAS,KAAK;AACZ,YAAI,KAAK,wDAAwD;AAAA,UAC/D,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,QACxD,CAAC;AAAA,MACH;AAAA,IACF;AAKA,UAAM,qBAAqB,
cAAc,eACrC,0BAA0B,MAAM,QAAQ,EAAE,WAC1C,CAAC;AACL,UAAM,QAAQ,CAAC,gBAAgB,eAC3B,MAAM;AAAA,MACJ,MAAM;AAAA,MACN;AAAA,MACA;AAAA,MACA;AAAA,MACA;AAAA,MACA;AAAA,MACA;AAAA,MACA;AAAA,IACF,IACA;AAEJ,WAAO;AAAA,MACL,QAAQ;AAAA,MACR,WAAW;AAAA,MACX;AAAA,MACA,aAAa;AAAA,MACb;AAAA,MACA,eAAe,KAAK,IAAI,IAAI;AAAA,MAC5B,oBAAoB,CAAC,CAAC,UAAU,qBAAqB,MAAM;AAAA,MAC3D,GAAI,QAAQ,EAAE,MAAM,IAAI,CAAC;AAAA,IAC3B;AAAA,EACF,SAAS,KAAK;AACZ,QAAI,MAAM,4BAA4B;AAAA,MACpC,UAAU,MAAM;AAAA,MAChB,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,IACxD,CAAC;AACD,WAAO;AAAA,MACL,QAAQ;AAAA,MACR,WAAW,CAAC;AAAA,MACZ,SAAS,CAAC;AAAA,MACV,aAAa,CAAC;AAAA,MACd;AAAA,MACA,eAAe,KAAK,IAAI,IAAI;AAAA,MAC5B,oBAAoB,CAAC,CAAC,UAAU,qBAAqB,MAAM;AAAA,MAC3D,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,IACxD;AAAA,EACF;AACF;AAUA,eAAe,aACb,QACA,QACA,YAC2B;AAC3B,QAAM,gBAAgB,OAAO,MAAM,GAAG,UAAU,EAAE,IAAI,OAAO,WAAoC;AAC/F,QAAI;AACF,YAAM,MAAM,MAAM,QAAQ,KAAK;AAAA,QAC7B,OAAO,MAAM,OAAO,KAAK,EAAE,UAAU,OAAO,CAAC;AAAA,QAC7C,IAAI;AAAA,UAAe,CAAC,GAAG,WACrB,WAAW,MAAM,OAAO,IAAI,MAAM,eAAe,CAAC,GAAG,IAAK;AAAA,QAC5D;AAAA,MACF,CAAC;AAED,YAAM,YAAY,MAAM,mBAAmB;AAC3C,YAAM,aAAa,MAAM,UAAU,QAAQ,IAAI,MAAM,IAAI,UAAU;AAAA,QACjE,UAAU;AAAA,QACV,aAAa,IAAI;AAAA,MACnB,CAAC;AACD,YAAM,YAAY,gBAAgB,WAAW,UAAU,mBAAmB;AAE1E,UAAI;AACF,qBAAa,KAAK,UAAU;AAAA,MAC9B,SAAS,KAAK;AACZ,YAAI,KAAK,mCAAmC,EAAE,KAAK,OAAO,KAAK,OAAO,OAAO,GAAG,EAAE,CAAC;AAAA,MACrF;AAEA,UAAI;AACF,cAAM,mBAAmB,oBAAoB;AAC7C,YAAI,iBAAiB,YAAY,GAAG;AAClC,2BAAiB,WAAW,IAAI,UAAU,WAAW,QAAQ;AAAA,QAC/D;AAAA,MACF,SAAS,KAAK;AACZ,YAAI,MAAM,8CAA8C,EAAE,OAAO,OAAO,GAAG,EAAE,CAAC;AAAA,MAChF;AAEA,aAAO;AAAA,QACL,KAAK,OAAO;AAAA,QACZ,OAAO,WAAW,SAAS,OAAO;AAAA,QAClC,kBAAkB;AAAA,QAClB,iBAAiB,OAAO;AAAA,QACxB,SAAS;AAAA,MACX;AAAA,IACF,SAAS,KAAK;AACZ,UAAI,MAAM,mCAAmC;AAAA,QAC3C,KAAK,OAAO;AAAA,QACZ,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,MACxD,CAAC;AACD,aAAO;AAAA,QACL,KAAK,OAAO;AAAA,QACZ,OAAO,OAAO;AAAA,QACd,kBAAkB,OAAO;AAAA,QACzB,iBAAiB,OAAO;AAAA,QACxB,SAAS;AAAA,QACT,aAAa,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,MAC9D;AAAA,IACF;AAAA,EACF,CAAC;AAED,SAAO,QAAQ,IA
AI,aAAa;AAClC;AAKA,SAAS,kBACP,SACA,cACA,UACM;AACN,MAAI,OAAO;AACX,aAAW,KAAK,SAAS;AACvB,QAAI,CAAC,EAAE,iBAAkB;AACzB,QAAI,QAAQ,UAAU;AACpB,QAAE,mBAAmB;AACrB;AAAA,IACF;AACA,UAAM,YAAY,WAAW;AAC7B,UAAM,MAAM,KAAK,IAAI,cAAc,SAAS;AAC5C,QAAI,EAAE,iBAAiB,SAAS,KAAK;AACnC,QAAE,mBAAmB,gBAAgB,EAAE,kBAAkB,GAAG;AAAA,IAC9D;AACA,YAAQ,EAAE,iBAAiB;AAAA,EAC7B;AACF;","names":[]}
|
|
@@ -0,0 +1,19 @@
|
|
|
1
|
+
/**
 * Optional tuning knobs accepted by `synthesizeLocal`.
 *
 * - `maxSources`: how many of the leading sources are placed in the prompt.
 * - `maxCharsPerSource`: per-source character limit applied to the markdown
 *   before it is placed in the prompt.
 * - `timeoutMs`: timeout handed to the LLM runner.
 * - `maxTokens`: token limit handed to the LLM runner.
 * - `modelOverride`: handed to the LLM runner unchanged.
 *
 * Every field may be omitted; `synthesizeLocal` then falls back to its own
 * defaults.
 */
export interface LocalSynthesisOptions {
|
|
2
|
+
maxSources?: number;
|
|
3
|
+
maxCharsPerSource?: number;
|
|
4
|
+
timeoutMs?: number;
|
|
5
|
+
maxTokens?: number;
|
|
6
|
+
modelOverride?: string;
|
|
7
|
+
}
|
|
8
|
+
/**
 * One source document offered to `synthesizeLocal`.
 *
 * `title` and `markdown` are what end up in the LLM prompt; `url` is carried
 * along so callers can map citations back to a location.
 */
export interface LocalSynthesisSource {
|
|
9
|
+
url: string;
|
|
10
|
+
title: string;
|
|
11
|
+
markdown: string;
|
|
12
|
+
}
|
|
13
|
+
/**
 * Outcome of `synthesizeLocal`.
 *
 * - `text`: the text returned by the LLM.
 * - `citations`: zero-based indices into the `sources` array, derived from
 *   the one-based `[N]` markers found in `text`.
 */
export interface LocalSynthesisResult {
|
|
14
|
+
text: string;
|
|
15
|
+
citations: number[];
|
|
16
|
+
}
|
|
17
|
+
/**
 * Ask the configured LLM to answer `question` using only the given sources,
 * citing them with `[N]` markers.
 *
 * @param question  The question to answer.
 * @param sources   Candidate sources; they are numbered from 1 in the prompt.
 * @param opts      Optional limits and runner settings.
 * @returns The LLM's text plus the zero-based source indices it cited.
 * @throws If no LLM is configured, or if the LLM request fails.
 */
export declare function synthesizeLocal(question: string, sources: LocalSynthesisSource[], opts?: LocalSynthesisOptions): Promise<LocalSynthesisResult>;
|
|
18
|
+
/**
 * Backwards-compatible gate for the local synthesis fallback.
 *
 * @returns Whether an LLM provider is currently configured.
 */
export declare function isLocalLlmEnabled(): boolean;
|
|
19
|
+
//# sourceMappingURL=synthesis-local.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"synthesis-local.d.ts","sourceRoot":"","sources":["../../src/research/synthesis-local.ts"],"names":[],"mappings":"AAUA,MAAM,WAAW,qBAAqB;IACpC,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,iBAAiB,CAAC,EAAE,MAAM,CAAC;IAC3B,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,aAAa,CAAC,EAAE,MAAM,CAAC;CACxB;AAED,MAAM,WAAW,oBAAoB;IACnC,GAAG,EAAE,MAAM,CAAC;IACZ,KAAK,EAAE,MAAM,CAAC;IACd,QAAQ,EAAE,MAAM,CAAC;CAClB;AAED,MAAM,WAAW,oBAAoB;IACnC,IAAI,EAAE,MAAM,CAAC;IACb,SAAS,EAAE,MAAM,EAAE,CAAC;CACrB;AAED,wBAAsB,eAAe,CACnC,QAAQ,EAAE,MAAM,EAChB,OAAO,EAAE,oBAAoB,EAAE,EAC/B,IAAI,GAAE,qBAA0B,GAC/B,OAAO,CAAC,oBAAoB,CAAC,CAkC/B;AAID,wBAAgB,iBAAiB,IAAI,OAAO,CAE3C"}
|
|
@@ -0,0 +1,62 @@
|
|
|
1
|
+
import { createLogger } from "../logger.js";
|
|
2
|
+
import { isLlmConfigured, runLlmText } from "../integrations/cloud/llm/run.js";
|
|
3
|
+
const log = createLogger("research");
|
|
4
|
+
// Defaults used by synthesizeLocal() when the caller omits the matching option.

/** Number of leading sources placed in the prompt. */
const DEFAULT_MAX_SOURCES = 8;

/** Characters of markdown kept per source in the prompt. */
const DEFAULT_MAX_CHARS_PER_SOURCE = 4000;

/** Timeout, in milliseconds, handed to the LLM runner. */
const DEFAULT_TIMEOUT_MS = 60000;

/** Token limit handed to the LLM runner. */
const DEFAULT_MAX_TOKENS = 3000;
|
|
8
|
+
/**
 * Answer `question` with the configured LLM, using only the supplied sources.
 *
 * At most `opts.maxSources` sources (default `DEFAULT_MAX_SOURCES`) are sent,
 * each cut to `opts.maxCharsPerSource` characters (default
 * `DEFAULT_MAX_CHARS_PER_SOURCE`). Sources are numbered from 1 in the prompt
 * and the model is instructed to cite them as `[N]`.
 *
 * @param question  The question to answer.
 * @param sources   Candidate sources (`{ url, title, markdown }`); only the
 *                  title and markdown are placed in the prompt.
 * @param opts      Optional overrides: `maxSources`, `maxCharsPerSource`,
 *                  `timeoutMs`, `maxTokens`, `modelOverride`.
 * @returns `{ text, citations }` where `citations` holds zero-based indices
 *          into `sources`, de-duplicated in order of first appearance and
 *          restricted to the sources that were actually sent to the model.
 * @throws Error when no LLM is configured; any error raised by the LLM call
 *         is logged and rethrown.
 */
async function synthesizeLocal(question, sources, opts = {}) {
  if (!isLlmConfigured()) {
    throw new Error("LLM not configured. Set WIGOLO_LLM_PROVIDER or a provider API key.");
  }
  const maxSources = opts.maxSources ?? DEFAULT_MAX_SOURCES;
  const maxCharsPerSource = opts.maxCharsPerSource ?? DEFAULT_MAX_CHARS_PER_SOURCE;
  const sliced = sources.slice(0, maxSources);
  const sourceBlocks = sliced.map((s, i) => {
    const body = s.markdown.length > maxCharsPerSource ? s.markdown.slice(0, maxCharsPerSource) : s.markdown;
    return `[${i + 1}] ${s.title}\n${body}`;
  });
  const prompt =
    "You answer questions using ONLY the provided sources. Cite each fact with [N] where N is the source number.\n\n" +
    `Question: ${question}\n\n` +
    `Sources:\n${sourceBlocks.join("\n\n")}`;
  try {
    const result = await runLlmText({
      prompt,
      maxTokens: opts.maxTokens ?? DEFAULT_MAX_TOKENS,
      modelOverride: opts.modelOverride,
      timeoutMs: opts.timeoutMs ?? DEFAULT_TIMEOUT_MS
    });
    log.info("local synthesis ok", { provider: result.provider, model: result.model, latencyMs: result.latencyMs });
    // The model only saw `sliced.length` sources. A marker such as [12] with
    // eight sources sent is a hallucinated reference; returning it would let
    // the caller attribute the claim to a source the model never read.
    const citations = extractCitations(result.text).filter((idx) => idx < sliced.length);
    return { text: result.text, citations };
  } catch (err) {
    log.error("local synthesis request failed", { error: err instanceof Error ? err.message : String(err) });
    throw err;
  }
}
|
|
40
|
+
/**
 * Backwards-compatible gate for the local synthesis fallback: simply reports
 * what `isLlmConfigured()` reports.
 *
 * @returns Whether an LLM provider is currently configured.
 */
function isLocalLlmEnabled() {
  const configured = isLlmConfigured();
  return configured;
}
|
|
43
|
+
/**
 * Collect the sources cited in `text` via `[N]` markers.
 *
 * Markers are one-based; the returned values are the matching zero-based
 * indices, de-duplicated and kept in order of first appearance. Markers whose
 * number is below 1 (or not finite) are ignored.
 *
 * @param text  LLM output to scan.
 * @returns Zero-based source indices; empty when no marker is present.
 */
function extractCitations(text) {
  // A Set keeps insertion order, which gives de-duplication and
  // first-appearance ordering in a single structure.
  const ordered = new Set();
  for (const marker of text.matchAll(/\[(\d+)\]/g)) {
    const position = Number(marker[1]);
    if (Number.isFinite(position) && position >= 1) {
      ordered.add(position - 1);
    }
  }
  return [...ordered];
}
|
|
58
|
+
export {
|
|
59
|
+
isLocalLlmEnabled,
|
|
60
|
+
synthesizeLocal
|
|
61
|
+
};
|
|
62
|
+
//# sourceMappingURL=synthesis-local.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../src/research/synthesis-local.ts"],"sourcesContent":["import { createLogger } from '../logger.js';\nimport { isLlmConfigured, runLlmText } from '../integrations/cloud/llm/run.js';\n\nconst log = createLogger('research');\n\nconst DEFAULT_MAX_SOURCES = 8;\nconst DEFAULT_MAX_CHARS_PER_SOURCE = 4000;\nconst DEFAULT_TIMEOUT_MS = 60_000;\nconst DEFAULT_MAX_TOKENS = 3000;\n\nexport interface LocalSynthesisOptions {\n maxSources?: number;\n maxCharsPerSource?: number;\n timeoutMs?: number;\n maxTokens?: number;\n modelOverride?: string;\n}\n\nexport interface LocalSynthesisSource {\n url: string;\n title: string;\n markdown: string;\n}\n\nexport interface LocalSynthesisResult {\n text: string;\n citations: number[];\n}\n\nexport async function synthesizeLocal(\n question: string,\n sources: LocalSynthesisSource[],\n opts: LocalSynthesisOptions = {},\n): Promise<LocalSynthesisResult> {\n if (!isLlmConfigured()) {\n throw new Error('LLM not configured. Set WIGOLO_LLM_PROVIDER or a provider API key.');\n }\n\n const maxSources = opts.maxSources ?? DEFAULT_MAX_SOURCES;\n const maxCharsPerSource = opts.maxCharsPerSource ?? DEFAULT_MAX_CHARS_PER_SOURCE;\n\n const sliced = sources.slice(0, maxSources);\n const sourceBlocks = sliced.map((s, i) => {\n const body = s.markdown.length > maxCharsPerSource\n ? s.markdown.slice(0, maxCharsPerSource)\n : s.markdown;\n return `[${i + 1}] ${s.title}\\n${body}`;\n });\n\n const prompt =\n 'You answer questions using ONLY the provided sources. Cite each fact with [N] where N is the source number.\\n\\n' +\n `Question: ${question}\\n\\n` +\n `Sources:\\n${sourceBlocks.join('\\n\\n')}`;\n\n try {\n const result = await runLlmText({\n prompt,\n maxTokens: opts.maxTokens ?? DEFAULT_MAX_TOKENS,\n modelOverride: opts.modelOverride,\n timeoutMs: opts.timeoutMs ?? 
DEFAULT_TIMEOUT_MS,\n });\n log.info('local synthesis ok', { provider: result.provider, model: result.model, latencyMs: result.latencyMs });\n return { text: result.text, citations: extractCitations(result.text) };\n } catch (err) {\n log.error('local synthesis request failed', { error: err instanceof Error ? err.message : String(err) });\n throw err;\n }\n}\n\n// Backwards-compat shim — callers (research/pipeline.ts) used isLocalLlmEnabled()\n// to gate this fallback. Keep the same gate name pointing at the unified runner.\nexport function isLocalLlmEnabled(): boolean {\n return isLlmConfigured();\n}\n\nfunction extractCitations(text: string): number[] {\n const matches = text.match(/\\[(\\d+)\\]/g);\n if (!matches) return [];\n const seen = new Set<number>();\n const out: number[] = [];\n for (const m of matches) {\n const n = Number(m.slice(1, -1));\n if (!Number.isFinite(n) || n < 1) continue;\n const idx = n - 1;\n if (seen.has(idx)) continue;\n seen.add(idx);\n out.push(idx);\n }\n return 
out;\n}\n"],"mappings":"AAAA,SAAS,oBAAoB;AAC7B,SAAS,iBAAiB,kBAAkB;AAE5C,MAAM,MAAM,aAAa,UAAU;AAEnC,MAAM,sBAAsB;AAC5B,MAAM,+BAA+B;AACrC,MAAM,qBAAqB;AAC3B,MAAM,qBAAqB;AAqB3B,eAAsB,gBACpB,UACA,SACA,OAA8B,CAAC,GACA;AAC/B,MAAI,CAAC,gBAAgB,GAAG;AACtB,UAAM,IAAI,MAAM,oEAAoE;AAAA,EACtF;AAEA,QAAM,aAAa,KAAK,cAAc;AACtC,QAAM,oBAAoB,KAAK,qBAAqB;AAEpD,QAAM,SAAS,QAAQ,MAAM,GAAG,UAAU;AAC1C,QAAM,eAAe,OAAO,IAAI,CAAC,GAAG,MAAM;AACxC,UAAM,OAAO,EAAE,SAAS,SAAS,oBAC7B,EAAE,SAAS,MAAM,GAAG,iBAAiB,IACrC,EAAE;AACN,WAAO,IAAI,IAAI,CAAC,KAAK,EAAE,KAAK;AAAA,EAAK,IAAI;AAAA,EACvC,CAAC;AAED,QAAM,SACJ;AAAA;AAAA,YACa,QAAQ;AAAA;AAAA;AAAA,EACR,aAAa,KAAK,MAAM,CAAC;AAExC,MAAI;AACF,UAAM,SAAS,MAAM,WAAW;AAAA,MAC9B;AAAA,MACA,WAAW,KAAK,aAAa;AAAA,MAC7B,eAAe,KAAK;AAAA,MACpB,WAAW,KAAK,aAAa;AAAA,IAC/B,CAAC;AACD,QAAI,KAAK,sBAAsB,EAAE,UAAU,OAAO,UAAU,OAAO,OAAO,OAAO,WAAW,OAAO,UAAU,CAAC;AAC9G,WAAO,EAAE,MAAM,OAAO,MAAM,WAAW,iBAAiB,OAAO,IAAI,EAAE;AAAA,EACvE,SAAS,KAAK;AACZ,QAAI,MAAM,kCAAkC,EAAE,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG,EAAE,CAAC;AACvG,UAAM;AAAA,EACR;AACF;AAIO,SAAS,oBAA6B;AAC3C,SAAO,gBAAgB;AACzB;AAEA,SAAS,iBAAiB,MAAwB;AAChD,QAAM,UAAU,KAAK,MAAM,YAAY;AACvC,MAAI,CAAC,QAAS,QAAO,CAAC;AACtB,QAAM,OAAO,oBAAI,IAAY;AAC7B,QAAM,MAAgB,CAAC;AACvB,aAAW,KAAK,SAAS;AACvB,UAAM,IAAI,OAAO,EAAE,MAAM,GAAG,EAAE,CAAC;AAC/B,QAAI,CAAC,OAAO,SAAS,CAAC,KAAK,IAAI,EAAG;AAClC,UAAM,MAAM,IAAI;AAChB,QAAI,KAAK,IAAI,GAAG,EAAG;AACnB,SAAK,IAAI,GAAG;AACZ,QAAI,KAAK,GAAG;AAAA,EACd;AACA,SAAO;AACT;","names":[]}
|
|
@@ -0,0 +1,10 @@
|
|
|
1
|
+
import { type SamplingCapableServer } from '../search/sampling.js';
|
|
2
|
+
import type { ResearchSource, Citation } from '../types.js';
|
|
3
|
+
/**
 * Outcome of `synthesizeReport`.
 *
 * - `report`: the markdown report text.
 * - `citations`: one entry per source that contributed content, numbered
 *   from 1.
 * - `samplingUsed`: true when the report text came from a sampling request
 *   to the host; false when the built-in fallback report was used instead.
 */
export interface SynthesisResult {
|
|
4
|
+
report: string;
|
|
5
|
+
citations: Citation[];
|
|
6
|
+
samplingUsed: boolean;
|
|
7
|
+
}
|
|
8
|
+
/**
 * Produce a research report for `question` from the fetched sources.
 *
 * When `server` is given, a sampling request is attempted first; if that
 * yields nothing, a report assembled directly from the source text is
 * returned instead.
 *
 * @param question  The research question.
 * @param sources   Sources gathered for the question; only those marked
 *                  `fetched` with non-empty content are used.
 * @param depth     Selects the size limits applied to the report and prompt.
 * @param server    Optional sampling-capable server.
 * @returns The report, its citations, and whether sampling produced it.
 */
export declare function synthesizeReport(question: string, sources: ResearchSource[], depth: 'quick' | 'standard' | 'comprehensive', server?: SamplingCapableServer): Promise<SynthesisResult>;
|
|
9
|
+
/**
 * Assemble a markdown report by concatenating excerpts of the sources,
 * without calling any LLM.
 *
 * @param question   The research question, used in the report heading.
 * @param sources    Sources to excerpt; entries with empty content are skipped.
 * @param maxLength  Character budget for the report.
 * @returns The report text, with trailing whitespace removed.
 */
export declare function buildFallbackReport(question: string, sources: ResearchSource[], maxLength: number): string;
|
|
10
|
+
//# sourceMappingURL=synthesize.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"synthesize.d.ts","sourceRoot":"","sources":["../../src/research/synthesize.ts"],"names":[],"mappings":"AACA,OAAO,EACL,KAAK,qBAAqB,EAG3B,MAAM,uBAAuB,CAAC;AAC/B,OAAO,KAAK,EAAE,cAAc,EAAE,QAAQ,EAAE,MAAM,aAAa,CAAC;AAU5D,MAAM,WAAW,eAAe;IAC9B,MAAM,EAAE,MAAM,CAAC;IACf,SAAS,EAAE,QAAQ,EAAE,CAAC;IACtB,YAAY,EAAE,OAAO,CAAC;CACvB;AAED,wBAAsB,gBAAgB,CACpC,QAAQ,EAAE,MAAM,EAChB,OAAO,EAAE,cAAc,EAAE,EACzB,KAAK,EAAE,OAAO,GAAG,UAAU,GAAG,eAAe,EAC7C,MAAM,CAAC,EAAE,qBAAqB,GAC7B,OAAO,CAAC,eAAe,CAAC,CAkC1B;AAkED,wBAAgB,mBAAmB,CACjC,QAAQ,EAAE,MAAM,EAChB,OAAO,EAAE,cAAc,EAAE,EACzB,SAAS,EAAE,MAAM,GAChB,MAAM,CAsCR"}
|
|
@@ -0,0 +1,137 @@
|
|
|
1
|
+
import { createLogger } from "../logger.js";
|
|
2
|
+
import {
|
|
3
|
+
requestSampling,
|
|
4
|
+
checkSamplingSupport
|
|
5
|
+
} from "../search/sampling.js";
|
|
6
|
+
const log = createLogger("research");
|
|
7
|
+
/**
 * Size limits per research depth. Despite the constant's name, every value
 * is a character count:
 *  - reportChars:      target/maximum length of the report
 *  - perSourceChars:   characters of each source placed in the sampling prompt
 *  - totalSourceChars: threshold after which no further sources are added
 */
const DEPTH_TOKEN_LIMITS = {
  quick: {
    reportChars: 2000,
    perSourceChars: 3000,
    totalSourceChars: 20000
  },
  standard: {
    reportChars: 4000,
    perSourceChars: 3000,
    totalSourceChars: 30000
  },
  comprehensive: {
    reportChars: 6000,
    perSourceChars: 3000,
    totalSourceChars: 40000
  }
};
|
|
12
|
+
/**
 * Produce a research report for `question` from the fetched sources.
 *
 * Only sources flagged `fetched` with non-empty `markdown_content` are used.
 * With none available, a fixed "no sources" report is returned. Otherwise a
 * sampling request is attempted when `server` is provided, and the locally
 * assembled fallback report is used if sampling yields nothing or throws.
 *
 * @param question  The research question.
 * @param sources   Sources gathered for the question.
 * @param depth     Key into DEPTH_TOKEN_LIMITS; unknown keys use `standard`.
 * @param server    Optional sampling-capable server.
 * @returns `{ report, citations, samplingUsed }`.
 */
async function synthesizeReport(question, sources, depth, server) {
  const limits = DEPTH_TOKEN_LIMITS[depth] ?? DEPTH_TOKEN_LIMITS.standard;
  const usable = sources.filter((src) => src.fetched && src.markdown_content.length > 0);

  if (usable.length === 0) {
    return {
      report: `## Research: ${question}\n\nNo sources could be fetched for this query.`,
      citations: [],
      samplingUsed: false
    };
  }

  // Citation numbers are one-based positions within the usable sources.
  const citations = usable.map((src, position) => {
    return {
      index: position + 1,
      url: src.url,
      title: src.title,
      snippet: src.markdown_content.slice(0, 200)
    };
  });

  if (server) {
    try {
      const sampled = await synthesizeWithSampling(question, usable, citations, limits, server);
      if (sampled) {
        return { report: sampled, citations, samplingUsed: true };
      }
    } catch (err) {
      log.warn("sampling synthesis failed, using fallback", {
        error: err instanceof Error ? err.message : String(err)
      });
    }
  }

  return {
    report: buildFallbackReport(question, usable, limits.reportChars),
    citations,
    samplingUsed: false
  };
}
|
|
45
|
+
/**
 * Ask the host, through a sampling request, to write the report.
 *
 * Sources are added to the prompt in order, each cut to
 * `limits.perSourceChars`, until the accumulated block length reaches
 * `limits.totalSourceChars` (the check runs before each source is added).
 *
 * @param question    The research question.
 * @param sources     Sources to include, numbered from 1 in the prompt.
 * @param _citations  Unused.
 * @param limits      `{ reportChars, perSourceChars, totalSourceChars }`.
 * @param server      Sampling-capable server.
 * @returns The trimmed report text, or `null` when sampling is unsupported,
 *          returns no text, or fails for any reason (failures are logged at
 *          debug level, never thrown).
 */
async function synthesizeWithSampling(question, sources, _citations, limits, server) {
  try {
    if (!checkSamplingSupport(server)) {
      log.debug("client does not support sampling for synthesis");
      return null;
    }

    const sourceBlocks = [];
    let accumulated = 0;
    for (const [position, source] of sources.entries()) {
      if (accumulated >= limits.totalSourceChars) {
        break;
      }
      const excerpt = source.markdown_content.slice(0, limits.perSourceChars);
      const block = `[${position + 1}] ${source.title} (${source.url})\n${excerpt}`;
      sourceBlocks.push(block);
      accumulated += block.length;
    }

    const prompt = [
      "You are a research assistant. Synthesize a comprehensive report answering the following question based on the provided sources. Use [N] citation markers to reference sources.",
      "",
      `Question: ${question}`,
      "",
      "Sources:",
      sourceBlocks.join("\n\n"),
      "",
      `Write a well-structured markdown report of approximately ${limits.reportChars} characters. Include:`,
      "1. A clear answer to the question",
      "2. Key findings from the sources",
      "3. Citation markers [1], [2], etc. referencing the source numbers above",
      "4. A brief conclusion",
      "",
      "Report:"
    ].join("\n");

    const response = await requestSampling(
      server,
      [{ role: "user", content: { type: "text", text: prompt } }],
      Math.ceil(limits.reportChars / 3)
    );

    const raw = response?.content?.text;
    if (!raw || raw.trim().length === 0) {
      log.debug("sampling synthesis returned empty response");
      return null;
    }
    return raw.trim();
  } catch (err) {
    log.debug("sampling synthesis request failed", {
      error: err instanceof Error ? err.message : String(err)
    });
    return null;
  }
}
|
|
94
|
+
/**
 * Assemble a markdown report by concatenating excerpts of the sources,
 * without calling any LLM.
 *
 * The report opens with a heading and a source count, followed by one
 * section per source (`### [N] title`, the URL, then an excerpt). Sections
 * are added while the character budget allows; an excerpt that had to be cut
 * ends in "...". If the assembled text still exceeds `maxLength`, it is
 * clipped and "..." appended.
 *
 * @param question   The research question, used in the heading.
 * @param sources    Sources to excerpt; entries with empty content are skipped.
 * @param maxLength  Character budget for the report.
 * @returns The report text, with trailing whitespace removed.
 */
function buildFallbackReport(question, sources, maxLength) {
  const usable = sources.filter((src) => src.markdown_content.length > 0);
  if (usable.length === 0) {
    return `## Research: ${question}\n\nNo sources available.`;
  }

  const intro = `## Research: ${question}\n\nBased on ${usable.length} source(s):\n\n`;
  const parts = [intro];
  let budget = maxLength - intro.length;

  for (const [position, src] of usable.entries()) {
    if (budget <= 0) {
      break;
    }
    const heading = `### [${position + 1}] ${src.title}\n**URL:** ${src.url}\n\n`;
    // Require room for the heading plus a minimal amount of content.
    if (budget < heading.length + 20) {
      break;
    }
    parts.push(heading);
    budget -= heading.length;

    const full = src.markdown_content;
    // Hold back 10 characters of slack.
    const take = Math.min(budget - 10, full.length);
    if (take > 0) {
      // When cutting, the last three characters of the allowance become "...".
      const excerpt = take < full.length ? full.slice(0, Math.max(take - 3, 0)) + "..." : full;
      parts.push(excerpt, "\n\n");
      budget -= excerpt.length + 2;
    }
  }

  const assembled = parts.join("");
  const clipped = assembled.length > maxLength ? assembled.slice(0, maxLength - 3) + "..." : assembled;
  return clipped.trimEnd();
}
|
|
133
|
+
export {
|
|
134
|
+
buildFallbackReport,
|
|
135
|
+
synthesizeReport
|
|
136
|
+
};
|
|
137
|
+
//# sourceMappingURL=synthesize.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../src/research/synthesize.ts"],"sourcesContent":["import { createLogger } from '../logger.js';\nimport {\n type SamplingCapableServer,\n requestSampling,\n checkSamplingSupport,\n} from '../search/sampling.js';\nimport type { ResearchSource, Citation } from '../types.js';\n\nconst log = createLogger('research');\n\nconst DEPTH_TOKEN_LIMITS: Record<string, { reportChars: number; perSourceChars: number; totalSourceChars: number }> = {\n quick: { reportChars: 2000, perSourceChars: 3000, totalSourceChars: 20000 },\n standard: { reportChars: 4000, perSourceChars: 3000, totalSourceChars: 30000 },\n comprehensive: { reportChars: 6000, perSourceChars: 3000, totalSourceChars: 40000 },\n};\n\nexport interface SynthesisResult {\n report: string;\n citations: Citation[];\n samplingUsed: boolean;\n}\n\nexport async function synthesizeReport(\n question: string,\n sources: ResearchSource[],\n depth: 'quick' | 'standard' | 'comprehensive',\n server?: SamplingCapableServer,\n): Promise<SynthesisResult> {\n const limits = DEPTH_TOKEN_LIMITS[depth] ?? DEPTH_TOKEN_LIMITS.standard;\n const fetchedSources = sources.filter((s) => s.fetched && s.markdown_content.length > 0);\n\n if (fetchedSources.length === 0) {\n return {\n report: `## Research: ${question}\\n\\nNo sources could be fetched for this query.`,\n citations: [],\n samplingUsed: false,\n };\n }\n\n const citations: Citation[] = fetchedSources.map((s, i) => ({\n index: i + 1,\n url: s.url,\n title: s.title,\n snippet: s.markdown_content.slice(0, 200),\n }));\n\n if (server) {\n try {\n const result = await synthesizeWithSampling(question, fetchedSources, citations, limits, server);\n if (result) {\n return { report: result, citations, samplingUsed: true };\n }\n } catch (err) {\n log.warn('sampling synthesis failed, using fallback', {\n error: err instanceof Error ? 
err.message : String(err),\n });\n }\n }\n\n const report = buildFallbackReport(question, fetchedSources, limits.reportChars);\n return { report, citations, samplingUsed: false };\n}\n\nasync function synthesizeWithSampling(\n question: string,\n sources: ResearchSource[],\n _citations: Citation[],\n limits: { reportChars: number; perSourceChars: number; totalSourceChars: number },\n server: SamplingCapableServer,\n): Promise<string | null> {\n try {\n if (!checkSamplingSupport(server)) {\n log.debug('client does not support sampling for synthesis');\n return null;\n }\n\n let totalChars = 0;\n const sourceBlocks: string[] = [];\n\n for (let i = 0; i < sources.length; i++) {\n if (totalChars >= limits.totalSourceChars) break;\n\n const source = sources[i];\n const content = source.markdown_content.slice(0, limits.perSourceChars);\n const block = `[${i + 1}] ${source.title} (${source.url})\\n${content}`;\n\n totalChars += block.length;\n sourceBlocks.push(block);\n }\n\n const prompt = `You are a research assistant. Synthesize a comprehensive report answering the following question based on the provided sources. Use [N] citation markers to reference sources.\n\nQuestion: ${question}\n\nSources:\n${sourceBlocks.join('\\n\\n')}\n\nWrite a well-structured markdown report of approximately ${limits.reportChars} characters. Include:\n1. A clear answer to the question\n2. Key findings from the sources\n3. Citation markers [1], [2], etc. referencing the source numbers above\n4. 
A brief conclusion\n\nReport:`;\n\n const maxTokens = Math.ceil(limits.reportChars / 3);\n\n const response = await requestSampling(\n server,\n [{ role: 'user', content: { type: 'text', text: prompt } }],\n maxTokens,\n );\n\n if (!response?.content?.text || response.content.text.trim().length === 0) {\n log.debug('sampling synthesis returned empty response');\n return null;\n }\n\n return response.content.text.trim();\n } catch (err) {\n log.debug('sampling synthesis request failed', {\n error: err instanceof Error ? err.message : String(err),\n });\n return null;\n }\n}\n\nexport function buildFallbackReport(\n question: string,\n sources: ResearchSource[],\n maxLength: number,\n): string {\n const fetchedSources = sources.filter((s) => s.markdown_content.length > 0);\n\n if (fetchedSources.length === 0) {\n return `## Research: ${question}\\n\\nNo sources available.`;\n }\n\n const header = `## Research: ${question}\\n\\nBased on ${fetchedSources.length} source(s):\\n\\n`;\n let report = header;\n let remaining = maxLength - header.length;\n\n for (let i = 0; i < fetchedSources.length; i++) {\n if (remaining <= 0) break;\n\n const source = fetchedSources[i];\n const sourceHeader = `### [${i + 1}] ${source.title}\\n**URL:** ${source.url}\\n\\n`;\n\n if (remaining < sourceHeader.length + 20) break;\n\n report += sourceHeader;\n remaining -= sourceHeader.length;\n\n const contentBudget = Math.min(remaining - 10, source.markdown_content.length);\n if (contentBudget > 0) {\n let content = source.markdown_content.slice(0, contentBudget);\n if (content.length < source.markdown_content.length) {\n content = content.slice(0, Math.max(contentBudget - 3, 0)) + '...';\n }\n report += content + '\\n\\n';\n remaining -= content.length + 2;\n }\n }\n\n if (report.length > maxLength) {\n report = report.slice(0, maxLength - 3) + '...';\n }\n\n return 
report.trimEnd();\n}\n"],"mappings":"AAAA,SAAS,oBAAoB;AAC7B;AAAA,EAEE;AAAA,EACA;AAAA,OACK;AAGP,MAAM,MAAM,aAAa,UAAU;AAEnC,MAAM,qBAAgH;AAAA,EACpH,OAAO,EAAE,aAAa,KAAM,gBAAgB,KAAM,kBAAkB,IAAM;AAAA,EAC1E,UAAU,EAAE,aAAa,KAAM,gBAAgB,KAAM,kBAAkB,IAAM;AAAA,EAC7E,eAAe,EAAE,aAAa,KAAM,gBAAgB,KAAM,kBAAkB,IAAM;AACpF;AAQA,eAAsB,iBACpB,UACA,SACA,OACA,QAC0B;AAC1B,QAAM,SAAS,mBAAmB,KAAK,KAAK,mBAAmB;AAC/D,QAAM,iBAAiB,QAAQ,OAAO,CAAC,MAAM,EAAE,WAAW,EAAE,iBAAiB,SAAS,CAAC;AAEvF,MAAI,eAAe,WAAW,GAAG;AAC/B,WAAO;AAAA,MACL,QAAQ,gBAAgB,QAAQ;AAAA;AAAA;AAAA,MAChC,WAAW,CAAC;AAAA,MACZ,cAAc;AAAA,IAChB;AAAA,EACF;AAEA,QAAM,YAAwB,eAAe,IAAI,CAAC,GAAG,OAAO;AAAA,IAC1D,OAAO,IAAI;AAAA,IACX,KAAK,EAAE;AAAA,IACP,OAAO,EAAE;AAAA,IACT,SAAS,EAAE,iBAAiB,MAAM,GAAG,GAAG;AAAA,EAC1C,EAAE;AAEF,MAAI,QAAQ;AACV,QAAI;AACF,YAAM,SAAS,MAAM,uBAAuB,UAAU,gBAAgB,WAAW,QAAQ,MAAM;AAC/F,UAAI,QAAQ;AACV,eAAO,EAAE,QAAQ,QAAQ,WAAW,cAAc,KAAK;AAAA,MACzD;AAAA,IACF,SAAS,KAAK;AACZ,UAAI,KAAK,6CAA6C;AAAA,QACpD,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,MACxD,CAAC;AAAA,IACH;AAAA,EACF;AAEA,QAAM,SAAS,oBAAoB,UAAU,gBAAgB,OAAO,WAAW;AAC/E,SAAO,EAAE,QAAQ,WAAW,cAAc,MAAM;AAClD;AAEA,eAAe,uBACb,UACA,SACA,YACA,QACA,QACwB;AACxB,MAAI;AACF,QAAI,CAAC,qBAAqB,MAAM,GAAG;AACjC,UAAI,MAAM,gDAAgD;AAC1D,aAAO;AAAA,IACT;AAEA,QAAI,aAAa;AACjB,UAAM,eAAyB,CAAC;AAEhC,aAAS,IAAI,GAAG,IAAI,QAAQ,QAAQ,KAAK;AACvC,UAAI,cAAc,OAAO,iBAAkB;AAE3C,YAAM,SAAS,QAAQ,CAAC;AACxB,YAAM,UAAU,OAAO,iBAAiB,MAAM,GAAG,OAAO,cAAc;AACtE,YAAM,QAAQ,IAAI,IAAI,CAAC,KAAK,OAAO,KAAK,KAAK,OAAO,GAAG;AAAA,EAAM,OAAO;AAEpE,oBAAc,MAAM;AACpB,mBAAa,KAAK,KAAK;AAAA,IACzB;AAEA,UAAM,SAAS;AAAA;AAAA,YAEP,QAAQ;AAAA;AAAA;AAAA,EAGlB,aAAa,KAAK,MAAM,CAAC;AAAA;AAAA,2DAEgC,OAAO,WAAW;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAQzE,UAAM,YAAY,KAAK,KAAK,OAAO,cAAc,CAAC;AAElD,UAAM,WAAW,MAAM;AAAA,MACrB;AAAA,MACA,CAAC,EAAE,MAAM,QAAQ,SAAS,EAAE,MAAM,QAAQ,MAAM,OAAO,EAAE,CAAC;AAAA,MAC1D;AAAA,IACF;AAEA,QAAI,CAAC,UAAU,SAAS,QAAQ,SAAS,QAAQ,KAAK,KAAK,EAAE,WAAW,GAAG;AACzE,UAAI,MAAM,4CAA4C;AACtD,aAAO;AAAA,IACT;AAEA,WAAO,SAAS,QAAQ,KAAK,KAAK;AAAA,EACpC,SAAS,KAAK;AACZ,QAA
I,MAAM,qCAAqC;AAAA,MAC7C,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,IACxD,CAAC;AACD,WAAO;AAAA,EACT;AACF;AAEO,SAAS,oBACd,UACA,SACA,WACQ;AACR,QAAM,iBAAiB,QAAQ,OAAO,CAAC,MAAM,EAAE,iBAAiB,SAAS,CAAC;AAE1E,MAAI,eAAe,WAAW,GAAG;AAC/B,WAAO,gBAAgB,QAAQ;AAAA;AAAA;AAAA,EACjC;AAEA,QAAM,SAAS,gBAAgB,QAAQ;AAAA;AAAA,WAAgB,eAAe,MAAM;AAAA;AAAA;AAC5E,MAAI,SAAS;AACb,MAAI,YAAY,YAAY,OAAO;AAEnC,WAAS,IAAI,GAAG,IAAI,eAAe,QAAQ,KAAK;AAC9C,QAAI,aAAa,EAAG;AAEpB,UAAM,SAAS,eAAe,CAAC;AAC/B,UAAM,eAAe,QAAQ,IAAI,CAAC,KAAK,OAAO,KAAK;AAAA,WAAc,OAAO,GAAG;AAAA;AAAA;AAE3E,QAAI,YAAY,aAAa,SAAS,GAAI;AAE1C,cAAU;AACV,iBAAa,aAAa;AAE1B,UAAM,gBAAgB,KAAK,IAAI,YAAY,IAAI,OAAO,iBAAiB,MAAM;AAC7E,QAAI,gBAAgB,GAAG;AACrB,UAAI,UAAU,OAAO,iBAAiB,MAAM,GAAG,aAAa;AAC5D,UAAI,QAAQ,SAAS,OAAO,iBAAiB,QAAQ;AACnD,kBAAU,QAAQ,MAAM,GAAG,KAAK,IAAI,gBAAgB,GAAG,CAAC,CAAC,IAAI;AAAA,MAC/D;AACA,gBAAU,UAAU;AACpB,mBAAa,QAAQ,SAAS;AAAA,IAChC;AAAA,EACF;AAEA,MAAI,OAAO,SAAS,WAAW;AAC7B,aAAS,OAAO,MAAM,GAAG,YAAY,CAAC,IAAI;AAAA,EAC5C;AAEA,SAAO,OAAO,QAAQ;AACxB;","names":[]}
|
|
@@ -0,0 +1,33 @@
|
|
|
1
|
+
import type { SearchResultItem, Citation, StageResult } from '../types.js';
|
|
2
|
+
import type { SamplingCapableServer } from './sampling.js';
|
|
3
|
+
/**
 * Shape that `synthesizeAnswer` resolves to, per its declared return type.
 * Only `fallback` is required; every other field may be absent.
 */
export interface SynthesisResult {
|
|
4
|
+
/** Answer text; optional. */
answer?: string;
|
|
5
|
+
/** Citations accompanying the answer; optional. */
citations?: Citation[];
|
|
6
|
+
/** NOTE(review): presumably true when a fallback path produced the result — confirm in answer-synthesis.ts. */
fallback: boolean;
|
|
7
|
+
/** Optional warning message. */
warning?: string;
|
|
8
|
+
}
|
|
9
|
+
/**
 * Declared to take search results, the query string, and a sampling-capable
 * server, and to resolve to a {@link SynthesisResult}. The implementation is
 * not part of this declaration file.
 */
export declare function synthesizeAnswer(results: SearchResultItem[], query: string, server: SamplingCapableServer): Promise<SynthesisResult>;
|
|
10
|
+
/**
 * Turns a list of search results into a single string.
 * NOTE(review): presumably the sources section later passed to
 * `buildSynthesisPrompt` as `sourcesText` — confirm in answer-synthesis.ts.
 */
export declare function buildSourcesText(results: SearchResultItem[]): string;
|
|
11
|
+
/**
 * Produces a prompt string from the query and pre-rendered sources text.
 * The exact prompt wording lives in the implementation, not in this file.
 */
export declare function buildSynthesisPrompt(query: string, sourcesText: string): string;
|
|
12
|
+
/**
 * Return shape of `buildStructuredFallback`. Unlike `SynthesisResult`, all
 * three fields are required, including `warning`.
 */
export interface StructuredFallbackResult {
|
|
13
|
+
answer: string;
|
|
14
|
+
citations: Citation[];
|
|
15
|
+
warning: string;
|
|
16
|
+
}
|
|
17
|
+
/**
 * Synchronously builds a {@link StructuredFallbackResult} from search results
 * and the query; takes no sampling server.
 */
export declare function buildStructuredFallback(results: SearchResultItem[], query: string): StructuredFallbackResult;
|
|
18
|
+
/** Argument object accepted by `runSynthesis`. */
export interface SynthesisInput {
|
|
19
|
+
query: string;
|
|
20
|
+
results: SearchResultItem[];
|
|
21
|
+
/** Optional; callers may omit the sampling server entirely. */
samplingServer?: SamplingCapableServer;
|
|
22
|
+
/** Reserved for future per-source truncation; T6 currently relies on MAX_CHARS_PER_SOURCE. */
|
|
23
|
+
maxTotalChars: number;
|
|
24
|
+
}
|
|
25
|
+
/** Payload type carried by the `StageResult` that `runSynthesis` resolves to. */
export interface SynthesizedAnswer {
|
|
26
|
+
answer: string;
|
|
27
|
+
citations: Citation[];
|
|
28
|
+
warning?: string;
|
|
29
|
+
/** Restricted to the literals 1, 2 or 3; what each level means is defined by the implementation, not visible here. */
fallback_level: 1 | 2 | 3;
|
|
30
|
+
}
|
|
31
|
+
/**
 * Takes a {@link SynthesisInput} and resolves to a `StageResult` wrapping a
 * {@link SynthesizedAnswer}. `StageResult` is imported from `../types.js`.
 */
export declare function runSynthesis(input: SynthesisInput): Promise<StageResult<SynthesizedAnswer>>;
|
|
32
|
+
/**
 * Derives a list of citations from an answer string and the search results.
 * NOTE(review): presumably matches `[N]` markers in `answer` to entries of
 * `results` — confirm in answer-synthesis.ts.
 */
export declare function extractCitations(answer: string, results: SearchResultItem[]): Citation[];
|
|
33
|
+
//# sourceMappingURL=answer-synthesis.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"answer-synthesis.d.ts","sourceRoot":"","sources":["../../src/search/answer-synthesis.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,gBAAgB,EAAE,QAAQ,EAAE,WAAW,EAAE,MAAM,aAAa,CAAC;AAC3E,OAAO,KAAK,EAAE,qBAAqB,EAAE,MAAM,eAAe,CAAC;AAe3D,MAAM,WAAW,eAAe;IAC9B,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,SAAS,CAAC,EAAE,QAAQ,EAAE,CAAC;IACvB,QAAQ,EAAE,OAAO,CAAC;IAClB,OAAO,CAAC,EAAE,MAAM,CAAC;CAClB;AAED,wBAAsB,gBAAgB,CACpC,OAAO,EAAE,gBAAgB,EAAE,EAC3B,KAAK,EAAE,MAAM,EACb,MAAM,EAAE,qBAAqB,GAC5B,OAAO,CAAC,eAAe,CAAC,CAwD1B;AAED,wBAAgB,gBAAgB,CAAC,OAAO,EAAE,gBAAgB,EAAE,GAAG,MAAM,CAwBpE;AAED,wBAAgB,oBAAoB,CAAC,KAAK,EAAE,MAAM,EAAE,WAAW,EAAE,MAAM,GAAG,MAAM,CAc/E;AAED,MAAM,WAAW,wBAAwB;IACvC,MAAM,EAAE,MAAM,CAAC;IACf,SAAS,EAAE,QAAQ,EAAE,CAAC;IACtB,OAAO,EAAE,MAAM,CAAC;CACjB;AAID,wBAAgB,uBAAuB,CACrC,OAAO,EAAE,gBAAgB,EAAE,EAC3B,KAAK,EAAE,MAAM,GACZ,wBAAwB,CA8B1B;AAyBD,MAAM,WAAW,cAAc;IAC7B,KAAK,EAAE,MAAM,CAAC;IACd,OAAO,EAAE,gBAAgB,EAAE,CAAC;IAC5B,cAAc,CAAC,EAAE,qBAAqB,CAAC;IACvC,8FAA8F;IAC9F,aAAa,EAAE,MAAM,CAAC;CACvB;AAED,MAAM,WAAW,iBAAiB;IAChC,MAAM,EAAE,MAAM,CAAC;IACf,SAAS,EAAE,QAAQ,EAAE,CAAC;IACtB,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,cAAc,EAAE,CAAC,GAAG,CAAC,GAAG,CAAC,CAAC;CAC3B;AAED,wBAAsB,YAAY,CAChC,KAAK,EAAE,cAAc,GACpB,OAAO,CAAC,WAAW,CAAC,iBAAiB,CAAC,CAAC,CAoEzC;AAED,wBAAgB,gBAAgB,CAC9B,MAAM,EAAE,MAAM,EACd,OAAO,EAAE,gBAAgB,EAAE,GAC1B,QAAQ,EAAE,CA6BZ"}
|