@staticn0va/wigolo 0.1.0 → 0.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +1 -1
- package/README.md +195 -73
- package/SKILL.md +382 -0
- package/assets/blocks/claude-code/CLAUDE.md.block +20 -0
- package/assets/blocks/claude-code/wigolo-command.md +40 -0
- package/assets/blocks/cursor/wigolo.mdc +46 -0
- package/assets/blocks/gemini-cli/GEMINI.md.block +18 -0
- package/assets/blocks/vscode/copilot-instructions.md.block +18 -0
- package/assets/skills/wigolo/SKILL.md +50 -0
- package/assets/skills/wigolo/rules/cache-first.md +30 -0
- package/assets/skills/wigolo/rules/synthesis.md +43 -0
- package/assets/skills/wigolo-agent/SKILL.md +73 -0
- package/assets/skills/wigolo-crawl/SKILL.md +60 -0
- package/assets/skills/wigolo-extract/SKILL.md +59 -0
- package/assets/skills/wigolo-fetch/SKILL.md +65 -0
- package/assets/skills/wigolo-find-similar/SKILL.md +72 -0
- package/assets/skills/wigolo-research/SKILL.md +77 -0
- package/assets/skills/wigolo-search/SKILL.md +78 -0
- package/dist/agent/executor.d.ts +33 -0
- package/dist/agent/executor.d.ts.map +1 -0
- package/dist/agent/executor.js +233 -0
- package/dist/agent/executor.js.map +1 -0
- package/dist/agent/pipeline.d.ts +5 -0
- package/dist/agent/pipeline.d.ts.map +1 -0
- package/dist/agent/pipeline.js +208 -0
- package/dist/agent/pipeline.js.map +1 -0
- package/dist/agent/planner.d.ts +13 -0
- package/dist/agent/planner.d.ts.map +1 -0
- package/dist/agent/planner.js +271 -0
- package/dist/agent/planner.js.map +1 -0
- package/dist/agent/relevance.d.ts +15 -0
- package/dist/agent/relevance.d.ts.map +1 -0
- package/dist/agent/relevance.js +60 -0
- package/dist/agent/relevance.js.map +1 -0
- package/dist/cache/backfill-embeddings.d.ts +23 -0
- package/dist/cache/backfill-embeddings.d.ts.map +1 -0
- package/dist/cache/backfill-embeddings.js +105 -0
- package/dist/cache/backfill-embeddings.js.map +1 -0
- package/dist/cache/change-detector.d.ts +7 -0
- package/dist/cache/change-detector.d.ts.map +1 -0
- package/dist/cache/change-detector.js +43 -0
- package/dist/cache/change-detector.js.map +1 -0
- package/dist/cache/db.d.ts +1 -0
- package/dist/cache/db.d.ts.map +1 -1
- package/dist/cache/db.js +94 -22
- package/dist/cache/db.js.map +1 -1
- package/dist/cache/diff-summary.d.ts +2 -0
- package/dist/cache/diff-summary.d.ts.map +1 -0
- package/dist/cache/diff-summary.js +82 -0
- package/dist/cache/diff-summary.js.map +1 -0
- package/dist/cache/migrations/runner.d.ts +29 -0
- package/dist/cache/migrations/runner.d.ts.map +1 -0
- package/dist/cache/migrations/runner.js +147 -0
- package/dist/cache/migrations/runner.js.map +1 -0
- package/dist/cache/sqlite-vec-store.d.ts +42 -0
- package/dist/cache/sqlite-vec-store.d.ts.map +1 -0
- package/dist/cache/sqlite-vec-store.js +176 -0
- package/dist/cache/sqlite-vec-store.js.map +1 -0
- package/dist/cache/store.d.ts +46 -1
- package/dist/cache/store.d.ts.map +1 -1
- package/dist/cache/store.js +362 -168
- package/dist/cache/store.js.map +1 -1
- package/dist/cli/agents/antigravity.d.ts +20 -0
- package/dist/cli/agents/antigravity.d.ts.map +1 -0
- package/dist/cli/agents/antigravity.js +49 -0
- package/dist/cli/agents/antigravity.js.map +1 -0
- package/dist/cli/agents/claude-code.d.ts +25 -0
- package/dist/cli/agents/claude-code.d.ts.map +1 -0
- package/dist/cli/agents/claude-code.js +111 -0
- package/dist/cli/agents/claude-code.js.map +1 -0
- package/dist/cli/agents/cursor.d.ts +21 -0
- package/dist/cli/agents/cursor.d.ts.map +1 -0
- package/dist/cli/agents/cursor.js +58 -0
- package/dist/cli/agents/cursor.js.map +1 -0
- package/dist/cli/agents/gemini-cli.d.ts +21 -0
- package/dist/cli/agents/gemini-cli.d.ts.map +1 -0
- package/dist/cli/agents/gemini-cli.js +55 -0
- package/dist/cli/agents/gemini-cli.js.map +1 -0
- package/dist/cli/agents/registry.d.ts +21 -0
- package/dist/cli/agents/registry.d.ts.map +1 -0
- package/dist/cli/agents/registry.js +27 -0
- package/dist/cli/agents/registry.js.map +1 -0
- package/dist/cli/agents/utils.d.ts +26 -0
- package/dist/cli/agents/utils.d.ts.map +1 -0
- package/dist/cli/agents/utils.js +136 -0
- package/dist/cli/agents/utils.js.map +1 -0
- package/dist/cli/agents/vscode.d.ts +21 -0
- package/dist/cli/agents/vscode.d.ts.map +1 -0
- package/dist/cli/agents/vscode.js +62 -0
- package/dist/cli/agents/vscode.js.map +1 -0
- package/dist/cli/auth.d.ts +2 -0
- package/dist/cli/auth.d.ts.map +1 -0
- package/dist/cli/auth.js +94 -0
- package/dist/cli/auth.js.map +1 -0
- package/dist/cli/backfill.d.ts +2 -0
- package/dist/cli/backfill.d.ts.map +1 -0
- package/dist/cli/backfill.js +58 -0
- package/dist/cli/backfill.js.map +1 -0
- package/dist/cli/daemon.d.ts +6 -1
- package/dist/cli/daemon.d.ts.map +1 -1
- package/dist/cli/daemon.js +61 -3
- package/dist/cli/daemon.js.map +1 -1
- package/dist/cli/doctor.d.ts +8 -0
- package/dist/cli/doctor.d.ts.map +1 -0
- package/dist/cli/doctor.js +318 -0
- package/dist/cli/doctor.js.map +1 -0
- package/dist/cli/health.d.ts +1 -1
- package/dist/cli/health.d.ts.map +1 -1
- package/dist/cli/health.js +42 -3
- package/dist/cli/health.js.map +1 -1
- package/dist/cli/help.d.ts +6 -0
- package/dist/cli/help.d.ts.map +1 -0
- package/dist/cli/help.js +63 -0
- package/dist/cli/help.js.map +1 -0
- package/dist/cli/index.d.ts +1 -1
- package/dist/cli/index.d.ts.map +1 -1
- package/dist/cli/index.js +35 -7
- package/dist/cli/index.js.map +1 -1
- package/dist/cli/init.d.ts +2 -0
- package/dist/cli/init.d.ts.map +1 -0
- package/dist/cli/init.js +201 -0
- package/dist/cli/init.js.map +1 -0
- package/dist/cli/plugin.d.ts +5 -0
- package/dist/cli/plugin.d.ts.map +1 -0
- package/dist/cli/plugin.js +185 -0
- package/dist/cli/plugin.js.map +1 -0
- package/dist/cli/setup-mcp.d.ts +2 -0
- package/dist/cli/setup-mcp.d.ts.map +1 -0
- package/dist/cli/setup-mcp.js +114 -0
- package/dist/cli/setup-mcp.js.map +1 -0
- package/dist/cli/shell.d.ts +2 -0
- package/dist/cli/shell.d.ts.map +1 -0
- package/dist/cli/shell.js +86 -0
- package/dist/cli/shell.js.map +1 -0
- package/dist/cli/status.d.ts +2 -0
- package/dist/cli/status.d.ts.map +1 -0
- package/dist/cli/status.js +31 -0
- package/dist/cli/status.js.map +1 -0
- package/dist/cli/telemetry.d.ts +10 -0
- package/dist/cli/telemetry.d.ts.map +1 -0
- package/dist/cli/telemetry.js +56 -0
- package/dist/cli/telemetry.js.map +1 -0
- package/dist/cli/tui/agents-types.d.ts +28 -0
- package/dist/cli/tui/agents-types.d.ts.map +1 -0
- package/dist/cli/tui/agents-types.js +1 -0
- package/dist/cli/tui/agents-types.js.map +1 -0
- package/dist/cli/tui/agents.d.ts +11 -0
- package/dist/cli/tui/agents.d.ts.map +1 -0
- package/dist/cli/tui/agents.js +93 -0
- package/dist/cli/tui/agents.js.map +1 -0
- package/dist/cli/tui/banner.d.ts +3 -0
- package/dist/cli/tui/banner.d.ts.map +1 -0
- package/dist/cli/tui/banner.js +30 -0
- package/dist/cli/tui/banner.js.map +1 -0
- package/dist/cli/tui/components/AgentSelect.d.ts +13 -0
- package/dist/cli/tui/components/AgentSelect.d.ts.map +1 -0
- package/dist/cli/tui/components/AgentSelect.js +116 -0
- package/dist/cli/tui/components/AgentSelect.js.map +1 -0
- package/dist/cli/tui/components/Banner.d.ts +6 -0
- package/dist/cli/tui/components/Banner.d.ts.map +1 -0
- package/dist/cli/tui/components/Banner.js +25 -0
- package/dist/cli/tui/components/Banner.js.map +1 -0
- package/dist/cli/tui/components/BrowserSelect.d.ts +7 -0
- package/dist/cli/tui/components/BrowserSelect.d.ts.map +1 -0
- package/dist/cli/tui/components/BrowserSelect.js +19 -0
- package/dist/cli/tui/components/BrowserSelect.js.map +1 -0
- package/dist/cli/tui/components/InstallProgress.d.ts +9 -0
- package/dist/cli/tui/components/InstallProgress.d.ts.map +1 -0
- package/dist/cli/tui/components/InstallProgress.js +67 -0
- package/dist/cli/tui/components/InstallProgress.js.map +1 -0
- package/dist/cli/tui/components/SkillInstall.d.ts +14 -0
- package/dist/cli/tui/components/SkillInstall.d.ts.map +1 -0
- package/dist/cli/tui/components/SkillInstall.js +94 -0
- package/dist/cli/tui/components/SkillInstall.js.map +1 -0
- package/dist/cli/tui/components/Summary.d.ts +22 -0
- package/dist/cli/tui/components/Summary.d.ts.map +1 -0
- package/dist/cli/tui/components/Summary.js +135 -0
- package/dist/cli/tui/components/Summary.js.map +1 -0
- package/dist/cli/tui/components/SystemCheck.d.ts +8 -0
- package/dist/cli/tui/components/SystemCheck.d.ts.map +1 -0
- package/dist/cli/tui/components/SystemCheck.js +71 -0
- package/dist/cli/tui/components/SystemCheck.js.map +1 -0
- package/dist/cli/tui/components/Verification.d.ts +8 -0
- package/dist/cli/tui/components/Verification.d.ts.map +1 -0
- package/dist/cli/tui/components/Verification.js +63 -0
- package/dist/cli/tui/components/Verification.js.map +1 -0
- package/dist/cli/tui/config-writer-cli.d.ts +12 -0
- package/dist/cli/tui/config-writer-cli.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-cli.js +39 -0
- package/dist/cli/tui/config-writer-cli.js.map +1 -0
- package/dist/cli/tui/config-writer-json.d.ts +16 -0
- package/dist/cli/tui/config-writer-json.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-json.js +86 -0
- package/dist/cli/tui/config-writer-json.js.map +1 -0
- package/dist/cli/tui/config-writer-toml.d.ts +16 -0
- package/dist/cli/tui/config-writer-toml.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-toml.js +83 -0
- package/dist/cli/tui/config-writer-toml.js.map +1 -0
- package/dist/cli/tui/config-writer.d.ts +25 -0
- package/dist/cli/tui/config-writer.d.ts.map +1 -0
- package/dist/cli/tui/config-writer.js +101 -0
- package/dist/cli/tui/config-writer.js.map +1 -0
- package/dist/cli/tui/detect-helpers.d.ts +6 -0
- package/dist/cli/tui/detect-helpers.d.ts.map +1 -0
- package/dist/cli/tui/detect-helpers.js +45 -0
- package/dist/cli/tui/detect-helpers.js.map +1 -0
- package/dist/cli/tui/extras-prompt.d.ts +7 -0
- package/dist/cli/tui/extras-prompt.d.ts.map +1 -0
- package/dist/cli/tui/extras-prompt.js +42 -0
- package/dist/cli/tui/extras-prompt.js.map +1 -0
- package/dist/cli/tui/flags-types.d.ts +19 -0
- package/dist/cli/tui/flags-types.d.ts.map +1 -0
- package/dist/cli/tui/flags-types.js +23 -0
- package/dist/cli/tui/flags-types.js.map +1 -0
- package/dist/cli/tui/flags.d.ts +5 -0
- package/dist/cli/tui/flags.d.ts.map +1 -0
- package/dist/cli/tui/flags.js +132 -0
- package/dist/cli/tui/flags.js.map +1 -0
- package/dist/cli/tui/format.d.ts +14 -0
- package/dist/cli/tui/format.d.ts.map +1 -0
- package/dist/cli/tui/format.js +37 -0
- package/dist/cli/tui/format.js.map +1 -0
- package/dist/cli/tui/hooks/useAgentDetect.d.ts +6 -0
- package/dist/cli/tui/hooks/useAgentDetect.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useAgentDetect.js +19 -0
- package/dist/cli/tui/hooks/useAgentDetect.js.map +1 -0
- package/dist/cli/tui/hooks/useInstall.d.ts +14 -0
- package/dist/cli/tui/hooks/useInstall.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useInstall.js +90 -0
- package/dist/cli/tui/hooks/useInstall.js.map +1 -0
- package/dist/cli/tui/hooks/useSystemCheck.d.ts +13 -0
- package/dist/cli/tui/hooks/useSystemCheck.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useSystemCheck.js +95 -0
- package/dist/cli/tui/hooks/useSystemCheck.js.map +1 -0
- package/dist/cli/tui/hooks/useVerify.d.ts +14 -0
- package/dist/cli/tui/hooks/useVerify.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useVerify.js +71 -0
- package/dist/cli/tui/hooks/useVerify.js.map +1 -0
- package/dist/cli/tui/ink-init.d.ts +2 -0
- package/dist/cli/tui/ink-init.d.ts.map +1 -0
- package/dist/cli/tui/ink-init.js +198 -0
- package/dist/cli/tui/ink-init.js.map +1 -0
- package/dist/cli/tui/reporter-auto.d.ts +7 -0
- package/dist/cli/tui/reporter-auto.d.ts.map +1 -0
- package/dist/cli/tui/reporter-auto.js +15 -0
- package/dist/cli/tui/reporter-auto.js.map +1 -0
- package/dist/cli/tui/reporter.d.ts +26 -0
- package/dist/cli/tui/reporter.d.ts.map +1 -0
- package/dist/cli/tui/reporter.js +32 -0
- package/dist/cli/tui/reporter.js.map +1 -0
- package/dist/cli/tui/run-command.d.ts +14 -0
- package/dist/cli/tui/run-command.d.ts.map +1 -0
- package/dist/cli/tui/run-command.js +72 -0
- package/dist/cli/tui/run-command.js.map +1 -0
- package/dist/cli/tui/select-agents.d.ts +6 -0
- package/dist/cli/tui/select-agents.d.ts.map +1 -0
- package/dist/cli/tui/select-agents.js +32 -0
- package/dist/cli/tui/select-agents.js.map +1 -0
- package/dist/cli/tui/status-agents.d.ts +11 -0
- package/dist/cli/tui/status-agents.d.ts.map +1 -0
- package/dist/cli/tui/status-agents.js +53 -0
- package/dist/cli/tui/status-agents.js.map +1 -0
- package/dist/cli/tui/status-cache.d.ts +6 -0
- package/dist/cli/tui/status-cache.d.ts.map +1 -0
- package/dist/cli/tui/status-cache.js +39 -0
- package/dist/cli/tui/status-cache.js.map +1 -0
- package/dist/cli/tui/status-format.d.ts +14 -0
- package/dist/cli/tui/status-format.d.ts.map +1 -0
- package/dist/cli/tui/status-format.js +41 -0
- package/dist/cli/tui/status-format.js.map +1 -0
- package/dist/cli/tui/status-python.d.ts +6 -0
- package/dist/cli/tui/status-python.d.ts.map +1 -0
- package/dist/cli/tui/status-python.js +30 -0
- package/dist/cli/tui/status-python.js.map +1 -0
- package/dist/cli/tui/system-check.d.ts +24 -0
- package/dist/cli/tui/system-check.d.ts.map +1 -0
- package/dist/cli/tui/system-check.js +103 -0
- package/dist/cli/tui/system-check.js.map +1 -0
- package/dist/cli/tui/tui-reporter.d.ts +19 -0
- package/dist/cli/tui/tui-reporter.d.ts.map +1 -0
- package/dist/cli/tui/tui-reporter.js +95 -0
- package/dist/cli/tui/tui-reporter.js.map +1 -0
- package/dist/cli/tui/utils/config-writer.d.ts +3 -0
- package/dist/cli/tui/utils/config-writer.d.ts.map +1 -0
- package/dist/cli/tui/utils/config-writer.js +22 -0
- package/dist/cli/tui/utils/config-writer.js.map +1 -0
- package/dist/cli/tui/utils/suppress-logs.d.ts +3 -0
- package/dist/cli/tui/utils/suppress-logs.d.ts.map +1 -0
- package/dist/cli/tui/utils/suppress-logs.js +11 -0
- package/dist/cli/tui/utils/suppress-logs.js.map +1 -0
- package/dist/cli/tui/verify-suggestions.d.ts +5 -0
- package/dist/cli/tui/verify-suggestions.d.ts.map +1 -0
- package/dist/cli/tui/verify-suggestions.js +20 -0
- package/dist/cli/tui/verify-suggestions.js.map +1 -0
- package/dist/cli/tui/verify.d.ts +14 -0
- package/dist/cli/tui/verify.d.ts.map +1 -0
- package/dist/cli/tui/verify.js +101 -0
- package/dist/cli/tui/verify.js.map +1 -0
- package/dist/cli/tui/version.d.ts +2 -0
- package/dist/cli/tui/version.d.ts.map +1 -0
- package/dist/cli/tui/version.js +14 -0
- package/dist/cli/tui/version.js.map +1 -0
- package/dist/cli/uninstall.d.ts +2 -0
- package/dist/cli/uninstall.d.ts.map +1 -0
- package/dist/cli/uninstall.js +57 -0
- package/dist/cli/uninstall.js.map +1 -0
- package/dist/cli/warmup.d.ts +10 -2
- package/dist/cli/warmup.d.ts.map +1 -1
- package/dist/cli/warmup.js +226 -93
- package/dist/cli/warmup.js.map +1 -1
- package/dist/config.d.ts +28 -2
- package/dist/config.d.ts.map +1 -1
- package/dist/config.js +106 -56
- package/dist/config.js.map +1 -1
- package/dist/crawl/crawler.d.ts +6 -0
- package/dist/crawl/crawler.d.ts.map +1 -1
- package/dist/crawl/crawler.js +210 -209
- package/dist/crawl/crawler.js.map +1 -1
- package/dist/crawl/dedup.d.ts +1 -0
- package/dist/crawl/dedup.d.ts.map +1 -1
- package/dist/crawl/dedup.js +124 -81
- package/dist/crawl/dedup.js.map +1 -1
- package/dist/crawl/etag-incremental.d.ts +43 -0
- package/dist/crawl/etag-incremental.d.ts.map +1 -0
- package/dist/crawl/etag-incremental.js +94 -0
- package/dist/crawl/etag-incremental.js.map +1 -0
- package/dist/crawl/index-to-vec.d.ts +10 -0
- package/dist/crawl/index-to-vec.d.ts.map +1 -0
- package/dist/crawl/index-to-vec.js +44 -0
- package/dist/crawl/index-to-vec.js.map +1 -0
- package/dist/crawl/mapper.js +136 -164
- package/dist/crawl/mapper.js.map +1 -1
- package/dist/crawl/rate-limiter.js +63 -66
- package/dist/crawl/rate-limiter.js.map +1 -1
- package/dist/crawl/robots.js +58 -57
- package/dist/crawl/robots.js.map +1 -1
- package/dist/crawl/sitemap-first.d.ts +12 -0
- package/dist/crawl/sitemap-first.d.ts.map +1 -0
- package/dist/crawl/sitemap-first.js +47 -0
- package/dist/crawl/sitemap-first.js.map +1 -0
- package/dist/crawl/sitemap.js +33 -32
- package/dist/crawl/sitemap.js.map +1 -1
- package/dist/crawl/url-utils.d.ts +1 -0
- package/dist/crawl/url-utils.d.ts.map +1 -1
- package/dist/crawl/url-utils.js +49 -37
- package/dist/crawl/url-utils.js.map +1 -1
- package/dist/daemon/health-check.d.ts +16 -0
- package/dist/daemon/health-check.d.ts.map +1 -0
- package/dist/daemon/health-check.js +33 -0
- package/dist/daemon/health-check.js.map +1 -0
- package/dist/daemon/http-server.d.ts +26 -0
- package/dist/daemon/http-server.d.ts.map +1 -0
- package/dist/daemon/http-server.js +275 -0
- package/dist/daemon/http-server.js.map +1 -0
- package/dist/daemon/proxy.d.ts +10 -0
- package/dist/daemon/proxy.d.ts.map +1 -0
- package/dist/daemon/proxy.js +93 -0
- package/dist/daemon/proxy.js.map +1 -0
- package/dist/embedding/embed.d.ts +59 -0
- package/dist/embedding/embed.d.ts.map +1 -0
- package/dist/embedding/embed.js +233 -0
- package/dist/embedding/embed.js.map +1 -0
- package/dist/embedding/fastembed-provider.d.ts +19 -0
- package/dist/embedding/fastembed-provider.d.ts.map +1 -0
- package/dist/embedding/fastembed-provider.js +51 -0
- package/dist/embedding/fastembed-provider.js.map +1 -0
- package/dist/embedding/key-terms.d.ts +12 -0
- package/dist/embedding/key-terms.d.ts.map +1 -0
- package/dist/embedding/key-terms.js +234 -0
- package/dist/embedding/key-terms.js.map +1 -0
- package/dist/extraction/boilerplate.d.ts +15 -0
- package/dist/extraction/boilerplate.d.ts.map +1 -0
- package/dist/extraction/boilerplate.js +52 -0
- package/dist/extraction/boilerplate.js.map +1 -0
- package/dist/extraction/defuddle.d.ts.map +1 -1
- package/dist/extraction/defuddle.js +27 -23
- package/dist/extraction/defuddle.js.map +1 -1
- package/dist/extraction/extract.d.ts.map +1 -1
- package/dist/extraction/extract.js +76 -76
- package/dist/extraction/extract.js.map +1 -1
- package/dist/extraction/jsonld.js +50 -54
- package/dist/extraction/jsonld.js.map +1 -1
- package/dist/extraction/lang-hints.d.ts +2 -0
- package/dist/extraction/lang-hints.d.ts.map +1 -0
- package/dist/extraction/lang-hints.js +30 -0
- package/dist/extraction/lang-hints.js.map +1 -0
- package/dist/extraction/llm-fallback.d.ts +17 -0
- package/dist/extraction/llm-fallback.d.ts.map +1 -0
- package/dist/extraction/llm-fallback.js +130 -0
- package/dist/extraction/llm-fallback.js.map +1 -0
- package/dist/extraction/markdown-sanitize.d.ts +2 -0
- package/dist/extraction/markdown-sanitize.d.ts.map +1 -0
- package/dist/extraction/markdown-sanitize.js +151 -0
- package/dist/extraction/markdown-sanitize.js.map +1 -0
- package/dist/extraction/markdown.d.ts +11 -0
- package/dist/extraction/markdown.d.ts.map +1 -1
- package/dist/extraction/markdown.js +195 -91
- package/dist/extraction/markdown.js.map +1 -1
- package/dist/extraction/pipeline.d.ts +8 -0
- package/dist/extraction/pipeline.d.ts.map +1 -1
- package/dist/extraction/pipeline.js +57 -91
- package/dist/extraction/pipeline.js.map +1 -1
- package/dist/extraction/readability.d.ts +1 -1
- package/dist/extraction/readability.d.ts.map +1 -1
- package/dist/extraction/readability.js +28 -29
- package/dist/extraction/readability.js.map +1 -1
- package/dist/extraction/schema.d.ts +12 -0
- package/dist/extraction/schema.d.ts.map +1 -1
- package/dist/extraction/schema.js +135 -72
- package/dist/extraction/schema.js.map +1 -1
- package/dist/extraction/site-extractors/docs-generic.d.ts.map +1 -1
- package/dist/extraction/site-extractors/docs-generic.js +81 -91
- package/dist/extraction/site-extractors/docs-generic.js.map +1 -1
- package/dist/extraction/site-extractors/github.d.ts.map +1 -1
- package/dist/extraction/site-extractors/github.js +87 -95
- package/dist/extraction/site-extractors/github.js.map +1 -1
- package/dist/extraction/site-extractors/mdn.d.ts.map +1 -1
- package/dist/extraction/site-extractors/mdn.js +46 -54
- package/dist/extraction/site-extractors/mdn.js.map +1 -1
- package/dist/extraction/site-extractors/stackoverflow.d.ts.map +1 -1
- package/dist/extraction/site-extractors/stackoverflow.js +71 -80
- package/dist/extraction/site-extractors/stackoverflow.js.map +1 -1
- package/dist/extraction/structured-data.d.ts +4 -0
- package/dist/extraction/structured-data.d.ts.map +1 -0
- package/dist/extraction/structured-data.js +173 -0
- package/dist/extraction/structured-data.js.map +1 -0
- package/dist/extraction/structured.d.ts +4 -0
- package/dist/extraction/structured.d.ts.map +1 -0
- package/dist/extraction/structured.js +163 -0
- package/dist/extraction/structured.js.map +1 -0
- package/dist/extraction/v1/classifier.d.ts +3 -0
- package/dist/extraction/v1/classifier.d.ts.map +1 -0
- package/dist/extraction/v1/classifier.js +110 -0
- package/dist/extraction/v1/classifier.js.map +1 -0
- package/dist/extraction/v1/extract-provider.d.ts +16 -0
- package/dist/extraction/v1/extract-provider.d.ts.map +1 -0
- package/dist/extraction/v1/extract-provider.js +43 -0
- package/dist/extraction/v1/extract-provider.js.map +1 -0
- package/dist/extraction/v1/local-llm.d.ts +8 -0
- package/dist/extraction/v1/local-llm.d.ts.map +1 -0
- package/dist/extraction/v1/local-llm.js +58 -0
- package/dist/extraction/v1/local-llm.js.map +1 -0
- package/dist/extraction/v1/news.d.ts +3 -0
- package/dist/extraction/v1/news.d.ts.map +1 -0
- package/dist/extraction/v1/news.js +61 -0
- package/dist/extraction/v1/news.js.map +1 -0
- package/dist/extraction/v1/product.d.ts +3 -0
- package/dist/extraction/v1/product.d.ts.map +1 -0
- package/dist/extraction/v1/product.js +166 -0
- package/dist/extraction/v1/product.js.map +1 -0
- package/dist/extraction/v1/recipe.d.ts +3 -0
- package/dist/extraction/v1/recipe.d.ts.map +1 -0
- package/dist/extraction/v1/recipe.js +136 -0
- package/dist/extraction/v1/recipe.js.map +1 -0
- package/dist/extraction/v1/routed.d.ts +17 -0
- package/dist/extraction/v1/routed.d.ts.map +1 -0
- package/dist/extraction/v1/routed.js +68 -0
- package/dist/extraction/v1/routed.js.map +1 -0
- package/dist/extraction/v1/schemas/Article.d.ts +11 -0
- package/dist/extraction/v1/schemas/Article.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Article.js +23 -0
- package/dist/extraction/v1/schemas/Article.js.map +1 -0
- package/dist/extraction/v1/schemas/CodeSnippet.d.ts +9 -0
- package/dist/extraction/v1/schemas/CodeSnippet.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/CodeSnippet.js +90 -0
- package/dist/extraction/v1/schemas/CodeSnippet.js.map +1 -0
- package/dist/extraction/v1/schemas/EventListing.d.ts +10 -0
- package/dist/extraction/v1/schemas/EventListing.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/EventListing.js +122 -0
- package/dist/extraction/v1/schemas/EventListing.js.map +1 -0
- package/dist/extraction/v1/schemas/Paper.d.ts +10 -0
- package/dist/extraction/v1/schemas/Paper.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Paper.js +156 -0
- package/dist/extraction/v1/schemas/Paper.js.map +1 -0
- package/dist/extraction/v1/schemas/Product.d.ts +17 -0
- package/dist/extraction/v1/schemas/Product.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Product.js +149 -0
- package/dist/extraction/v1/schemas/Product.js.map +1 -0
- package/dist/extraction/v1/schemas/Recipe.d.ts +14 -0
- package/dist/extraction/v1/schemas/Recipe.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Recipe.js +160 -0
- package/dist/extraction/v1/schemas/Recipe.js.map +1 -0
- package/dist/extraction/v1/schemas/index.d.ts +13 -0
- package/dist/extraction/v1/schemas/index.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/index.js +44 -0
- package/dist/extraction/v1/schemas/index.js.map +1 -0
- package/dist/extraction/v1/site-extractors.d.ts +5 -0
- package/dist/extraction/v1/site-extractors.d.ts.map +1 -0
- package/dist/extraction/v1/site-extractors.js +31 -0
- package/dist/extraction/v1/site-extractors.js.map +1 -0
- package/dist/fetch/action-executor.d.ts +28 -0
- package/dist/fetch/action-executor.d.ts.map +1 -0
- package/dist/fetch/action-executor.js +88 -0
- package/dist/fetch/action-executor.js.map +1 -0
- package/dist/fetch/auth.d.ts +2 -1
- package/dist/fetch/auth.d.ts.map +1 -1
- package/dist/fetch/auth.js +56 -26
- package/dist/fetch/auth.js.map +1 -1
- package/dist/fetch/browser-pool.d.ts +30 -11
- package/dist/fetch/browser-pool.d.ts.map +1 -1
- package/dist/fetch/browser-pool.js +303 -127
- package/dist/fetch/browser-pool.js.map +1 -1
- package/dist/fetch/browser-selector.d.ts +17 -0
- package/dist/fetch/browser-selector.d.ts.map +1 -0
- package/dist/fetch/browser-selector.js +72 -0
- package/dist/fetch/browser-selector.js.map +1 -0
- package/dist/fetch/browser-types.d.ts +3 -0
- package/dist/fetch/browser-types.d.ts.map +1 -0
- package/dist/fetch/browser-types.js +45 -0
- package/dist/fetch/browser-types.js.map +1 -0
- package/dist/fetch/cdp-client.d.ts +9 -0
- package/dist/fetch/cdp-client.d.ts.map +1 -0
- package/dist/fetch/cdp-client.js +89 -0
- package/dist/fetch/cdp-client.js.map +1 -0
- package/dist/fetch/content-check.js +39 -46
- package/dist/fetch/content-check.js.map +1 -1
- package/dist/fetch/http-client.d.ts +4 -0
- package/dist/fetch/http-client.d.ts.map +1 -1
- package/dist/fetch/http-client.js +147 -128
- package/dist/fetch/http-client.js.map +1 -1
- package/dist/fetch/lightpanda.d.ts +28 -0
- package/dist/fetch/lightpanda.d.ts.map +1 -0
- package/dist/fetch/lightpanda.js +174 -0
- package/dist/fetch/lightpanda.js.map +1 -0
- package/dist/fetch/playwright-tier.d.ts +19 -0
- package/dist/fetch/playwright-tier.d.ts.map +1 -0
- package/dist/fetch/playwright-tier.js +76 -0
- package/dist/fetch/playwright-tier.js.map +1 -0
- package/dist/fetch/router.d.ts +49 -3
- package/dist/fetch/router.d.ts.map +1 -1
- package/dist/fetch/router.js +185 -81
- package/dist/fetch/router.js.map +1 -1
- package/dist/index.js +97 -17
- package/dist/index.js.map +1 -1
- package/dist/instructions.d.ts +31 -0
- package/dist/instructions.d.ts.map +1 -0
- package/dist/instructions.js +245 -0
- package/dist/instructions.js.map +1 -0
- package/dist/integrations/cloud/llm/anthropic.d.ts +3 -0
- package/dist/integrations/cloud/llm/anthropic.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/anthropic.js +41 -0
- package/dist/integrations/cloud/llm/anthropic.js.map +1 -0
- package/dist/integrations/cloud/llm/cache.d.ts +5 -0
- package/dist/integrations/cloud/llm/cache.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/cache.js +49 -0
- package/dist/integrations/cloud/llm/cache.js.map +1 -0
- package/dist/integrations/cloud/llm/gemini.d.ts +3 -0
- package/dist/integrations/cloud/llm/gemini.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/gemini.js +37 -0
- package/dist/integrations/cloud/llm/gemini.js.map +1 -0
- package/dist/integrations/cloud/llm/groq.d.ts +3 -0
- package/dist/integrations/cloud/llm/groq.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/groq.js +74 -0
- package/dist/integrations/cloud/llm/groq.js.map +1 -0
- package/dist/integrations/cloud/llm/hash.d.ts +3 -0
- package/dist/integrations/cloud/llm/hash.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/hash.js +26 -0
- package/dist/integrations/cloud/llm/hash.js.map +1 -0
- package/dist/integrations/cloud/llm/openai.d.ts +3 -0
- package/dist/integrations/cloud/llm/openai.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/openai.js +43 -0
- package/dist/integrations/cloud/llm/openai.js.map +1 -0
- package/dist/integrations/cloud/llm/select.d.ts +5 -0
- package/dist/integrations/cloud/llm/select.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/select.js +30 -0
- package/dist/integrations/cloud/llm/select.js.map +1 -0
- package/dist/integrations/cloud/llm/types.d.ts +24 -0
- package/dist/integrations/cloud/llm/types.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/types.js +1 -0
- package/dist/integrations/cloud/llm/types.js.map +1 -0
- package/dist/integrations/cloud/llm/validate.d.ts +6 -0
- package/dist/integrations/cloud/llm/validate.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/validate.js +63 -0
- package/dist/integrations/cloud/llm/validate.js.map +1 -0
- package/dist/logger.d.ts +4 -1
- package/dist/logger.d.ts.map +1 -1
- package/dist/logger.js +71 -30
- package/dist/logger.js.map +1 -1
- package/dist/pdf-parse.d.js +1 -0
- package/dist/pdf-parse.d.js.map +1 -0
- package/dist/plugins/loader.d.ts +20 -0
- package/dist/plugins/loader.d.ts.map +1 -0
- package/dist/plugins/loader.js +157 -0
- package/dist/plugins/loader.js.map +1 -0
- package/dist/plugins/registry.d.ts +26 -0
- package/dist/plugins/registry.d.ts.map +1 -0
- package/dist/plugins/registry.js +71 -0
- package/dist/plugins/registry.js.map +1 -0
- package/dist/plugins/validate.d.ts +9 -0
- package/dist/plugins/validate.d.ts.map +1 -0
- package/dist/plugins/validate.js +79 -0
- package/dist/plugins/validate.js.map +1 -0
- package/dist/providers/embed-provider.d.ts +11 -0
- package/dist/providers/embed-provider.d.ts.map +1 -0
- package/dist/providers/embed-provider.js +24 -0
- package/dist/providers/embed-provider.js.map +1 -0
- package/dist/providers/extract-provider.d.ts +23 -0
- package/dist/providers/extract-provider.d.ts.map +1 -0
- package/dist/providers/extract-provider.js +25 -0
- package/dist/providers/extract-provider.js.map +1 -0
- package/dist/providers/rerank-provider.d.ts +16 -0
- package/dist/providers/rerank-provider.d.ts.map +1 -0
- package/dist/providers/rerank-provider.js +28 -0
- package/dist/providers/rerank-provider.js.map +1 -0
- package/dist/providers/search-provider.d.ts +25 -0
- package/dist/providers/search-provider.d.ts.map +1 -0
- package/dist/providers/search-provider.js +44 -0
- package/dist/providers/search-provider.js.map +1 -0
- package/dist/providers/vector-store.d.ts +27 -0
- package/dist/providers/vector-store.d.ts.map +1 -0
- package/dist/providers/vector-store.js +27 -0
- package/dist/providers/vector-store.js.map +1 -0
- package/dist/python-env.d.ts +9 -0
- package/dist/python-env.d.ts.map +1 -0
- package/dist/python-env.js +13 -0
- package/dist/python-env.js.map +1 -0
- package/dist/repl/commands/agent.d.ts +5 -0
- package/dist/repl/commands/agent.d.ts.map +1 -0
- package/dist/repl/commands/agent.js +62 -0
- package/dist/repl/commands/agent.js.map +1 -0
- package/dist/repl/commands/cache.d.ts +4 -0
- package/dist/repl/commands/cache.d.ts.map +1 -0
- package/dist/repl/commands/cache.js +43 -0
- package/dist/repl/commands/cache.js.map +1 -0
- package/dist/repl/commands/crawl.d.ts +7 -0
- package/dist/repl/commands/crawl.d.ts.map +1 -0
- package/dist/repl/commands/crawl.js +44 -0
- package/dist/repl/commands/crawl.js.map +1 -0
- package/dist/repl/commands/extract.d.ts +5 -0
- package/dist/repl/commands/extract.d.ts.map +1 -0
- package/dist/repl/commands/extract.js +47 -0
- package/dist/repl/commands/extract.js.map +1 -0
- package/dist/repl/commands/fetch.d.ts +5 -0
- package/dist/repl/commands/fetch.d.ts.map +1 -0
- package/dist/repl/commands/fetch.js +67 -0
- package/dist/repl/commands/fetch.js.map +1 -0
- package/dist/repl/commands/find-similar.d.ts +5 -0
- package/dist/repl/commands/find-similar.d.ts.map +1 -0
- package/dist/repl/commands/find-similar.js +74 -0
- package/dist/repl/commands/find-similar.js.map +1 -0
- package/dist/repl/commands/research.d.ts +5 -0
- package/dist/repl/commands/research.d.ts.map +1 -0
- package/dist/repl/commands/research.js +65 -0
- package/dist/repl/commands/research.js.map +1 -0
- package/dist/repl/commands/search.d.ts +5 -0
- package/dist/repl/commands/search.d.ts.map +1 -0
- package/dist/repl/commands/search.js +74 -0
- package/dist/repl/commands/search.js.map +1 -0
- package/dist/repl/commands/types.d.ts +9 -0
- package/dist/repl/commands/types.d.ts.map +1 -0
- package/dist/repl/commands/types.js +1 -0
- package/dist/repl/commands/types.js.map +1 -0
- package/dist/repl/formatters.d.ts +13 -0
- package/dist/repl/formatters.d.ts.map +1 -0
- package/dist/repl/formatters.js +283 -0
- package/dist/repl/formatters.js.map +1 -0
- package/dist/repl/parser.d.ts +9 -0
- package/dist/repl/parser.d.ts.map +1 -0
- package/dist/repl/parser.js +86 -0
- package/dist/repl/parser.js.map +1 -0
- package/dist/repl/shell.d.ts +8 -0
- package/dist/repl/shell.d.ts.map +1 -0
- package/dist/repl/shell.js +184 -0
- package/dist/repl/shell.js.map +1 -0
- package/dist/research/branch-exploration.d.ts +14 -0
- package/dist/research/branch-exploration.d.ts.map +1 -0
- package/dist/research/branch-exploration.js +100 -0
- package/dist/research/branch-exploration.js.map +1 -0
- package/dist/research/brief.d.ts +5 -0
- package/dist/research/brief.d.ts.map +1 -0
- package/dist/research/brief.js +242 -0
- package/dist/research/brief.js.map +1 -0
- package/dist/research/citation-graph.d.ts +9 -0
- package/dist/research/citation-graph.d.ts.map +1 -0
- package/dist/research/citation-graph.js +114 -0
- package/dist/research/citation-graph.js.map +1 -0
- package/dist/research/decompose.d.ts +14 -0
- package/dist/research/decompose.d.ts.map +1 -0
- package/dist/research/decompose.js +439 -0
- package/dist/research/decompose.js.map +1 -0
- package/dist/research/pipeline.d.ts +5 -0
- package/dist/research/pipeline.d.ts.map +1 -0
- package/dist/research/pipeline.js +269 -0
- package/dist/research/pipeline.js.map +1 -0
- package/dist/research/synthesis-local.d.ts +16 -0
- package/dist/research/synthesis-local.d.ts.map +1 -0
- package/dist/research/synthesis-local.js +73 -0
- package/dist/research/synthesis-local.js.map +1 -0
- package/dist/research/synthesize.d.ts +10 -0
- package/dist/research/synthesize.d.ts.map +1 -0
- package/dist/research/synthesize.js +137 -0
- package/dist/research/synthesize.js.map +1 -0
- package/dist/search/answer-synthesis.d.ts +33 -0
- package/dist/search/answer-synthesis.d.ts.map +1 -0
- package/dist/search/answer-synthesis.js +244 -0
- package/dist/search/answer-synthesis.js.map +1 -0
- package/dist/search/context-formatter.d.ts +3 -0
- package/dist/search/context-formatter.d.ts.map +1 -0
- package/dist/search/context-formatter.js +56 -0
- package/dist/search/context-formatter.js.map +1 -0
- package/dist/search/dedup.d.ts +1 -0
- package/dist/search/dedup.d.ts.map +1 -1
- package/dist/search/dedup.js +40 -32
- package/dist/search/dedup.js.map +1 -1
- package/dist/search/engines/arxiv.d.ts +7 -0
- package/dist/search/engines/arxiv.d.ts.map +1 -0
- package/dist/search/engines/arxiv.js +70 -0
- package/dist/search/engines/arxiv.js.map +1 -0
- package/dist/search/engines/bing-news.d.ts +7 -0
- package/dist/search/engines/bing-news.d.ts.map +1 -0
- package/dist/search/engines/bing-news.js +97 -0
- package/dist/search/engines/bing-news.js.map +1 -0
- package/dist/search/engines/bing.d.ts +1 -0
- package/dist/search/engines/bing.d.ts.map +1 -1
- package/dist/search/engines/bing.js +100 -44
- package/dist/search/engines/bing.js.map +1 -1
- package/dist/search/engines/devdocs.d.ts +6 -0
- package/dist/search/engines/devdocs.d.ts.map +1 -0
- package/dist/search/engines/devdocs.js +56 -0
- package/dist/search/engines/devdocs.js.map +1 -0
- package/dist/search/engines/duckduckgo.d.ts.map +1 -1
- package/dist/search/engines/duckduckgo.js +56 -44
- package/dist/search/engines/duckduckgo.js.map +1 -1
- package/dist/search/engines/github-code.d.ts +7 -0
- package/dist/search/engines/github-code.d.ts.map +1 -0
- package/dist/search/engines/github-code.js +55 -0
- package/dist/search/engines/github-code.js.map +1 -0
- package/dist/search/engines/hn-algolia.d.ts +7 -0
- package/dist/search/engines/hn-algolia.d.ts.map +1 -0
- package/dist/search/engines/hn-algolia.js +76 -0
- package/dist/search/engines/hn-algolia.js.map +1 -0
- package/dist/search/engines/lobsters.d.ts +7 -0
- package/dist/search/engines/lobsters.d.ts.map +1 -0
- package/dist/search/engines/lobsters.js +83 -0
- package/dist/search/engines/lobsters.js.map +1 -0
- package/dist/search/engines/mdn.d.ts +7 -0
- package/dist/search/engines/mdn.d.ts.map +1 -0
- package/dist/search/engines/mdn.js +48 -0
- package/dist/search/engines/mdn.js.map +1 -0
- package/dist/search/engines/semantic-scholar.d.ts +7 -0
- package/dist/search/engines/semantic-scholar.d.ts.map +1 -0
- package/dist/search/engines/semantic-scholar.js +69 -0
- package/dist/search/engines/semantic-scholar.js.map +1 -0
- package/dist/search/engines/stackoverflow.d.ts +7 -0
- package/dist/search/engines/stackoverflow.d.ts.map +1 -0
- package/dist/search/engines/stackoverflow.js +73 -0
- package/dist/search/engines/stackoverflow.js.map +1 -0
- package/dist/search/engines/startpage.d.ts.map +1 -1
- package/dist/search/engines/startpage.js +65 -46
- package/dist/search/engines/startpage.js.map +1 -1
- package/dist/search/evidence.d.ts +25 -0
- package/dist/search/evidence.d.ts.map +1 -0
- package/dist/search/evidence.js +220 -0
- package/dist/search/evidence.js.map +1 -0
- package/dist/search/filters.js +49 -55
- package/dist/search/filters.js.map +1 -1
- package/dist/search/find-similar/crawl-rank.d.ts +9 -0
- package/dist/search/find-similar/crawl-rank.d.ts.map +1 -0
- package/dist/search/find-similar/crawl-rank.js +272 -0
- package/dist/search/find-similar/crawl-rank.js.map +1 -0
- package/dist/search/find-similar/mode.d.ts +4 -0
- package/dist/search/find-similar/mode.d.ts.map +1 -0
- package/dist/search/find-similar/mode.js +12 -0
- package/dist/search/find-similar/mode.js.map +1 -0
- package/dist/search/find-similar.d.ts +5 -0
- package/dist/search/find-similar.d.ts.map +1 -0
- package/dist/search/find-similar.js +509 -0
- package/dist/search/find-similar.js.map +1 -0
- package/dist/search/highlights.d.ts +19 -0
- package/dist/search/highlights.d.ts.map +1 -0
- package/dist/search/highlights.js +167 -0
- package/dist/search/highlights.js.map +1 -0
- package/dist/search/language-filter.d.ts +29 -0
- package/dist/search/language-filter.d.ts.map +1 -0
- package/dist/search/language-filter.js +126 -0
- package/dist/search/language-filter.js.map +1 -0
- package/dist/search/legacy/searxng-orchestrator.d.ts +4 -0
- package/dist/search/legacy/searxng-orchestrator.d.ts.map +1 -0
- package/dist/search/legacy/searxng-orchestrator.js +501 -0
- package/dist/search/legacy/searxng-orchestrator.js.map +1 -0
- package/dist/search/legacy/searxng-provider.d.ts +7 -0
- package/dist/search/legacy/searxng-provider.d.ts.map +1 -0
- package/dist/search/legacy/searxng-provider.js +11 -0
- package/dist/search/legacy/searxng-provider.js.map +1 -0
- package/dist/search/multi-query.d.ts +25 -0
- package/dist/search/multi-query.d.ts.map +1 -0
- package/dist/search/multi-query.js +228 -0
- package/dist/search/multi-query.js.map +1 -0
- package/dist/search/query.js +32 -34
- package/dist/search/query.js.map +1 -1
- package/dist/search/rerank.d.ts +3 -1
- package/dist/search/rerank.d.ts.map +1 -1
- package/dist/search/rerank.js +44 -35
- package/dist/search/rerank.js.map +1 -1
- package/dist/search/reranker/authority-boost.d.ts +3 -0
- package/dist/search/reranker/authority-boost.d.ts.map +1 -0
- package/dist/search/reranker/authority-boost.js +179 -0
- package/dist/search/reranker/authority-boost.js.map +1 -0
- package/dist/search/reranker/consensus-boost.d.ts +3 -0
- package/dist/search/reranker/consensus-boost.d.ts.map +1 -0
- package/dist/search/reranker/consensus-boost.js +27 -0
- package/dist/search/reranker/consensus-boost.js.map +1 -0
- package/dist/search/reranker/recency-boost.d.ts +3 -0
- package/dist/search/reranker/recency-boost.d.ts.map +1 -0
- package/dist/search/reranker/recency-boost.js +13 -0
- package/dist/search/reranker/recency-boost.js.map +1 -0
- package/dist/search/reranker/recency.d.ts +3 -0
- package/dist/search/reranker/recency.d.ts.map +1 -0
- package/dist/search/reranker/recency.js +23 -0
- package/dist/search/reranker/recency.js.map +1 -0
- package/dist/search/reranker/transformers-rerank-provider.d.ts +12 -0
- package/dist/search/reranker/transformers-rerank-provider.d.ts.map +1 -0
- package/dist/search/reranker/transformers-rerank-provider.js +78 -0
- package/dist/search/reranker/transformers-rerank-provider.js.map +1 -0
- package/dist/search/rrf.d.ts +17 -0
- package/dist/search/rrf.d.ts.map +1 -0
- package/dist/search/rrf.js +39 -0
- package/dist/search/rrf.js.map +1 -0
- package/dist/search/sampling.d.ts +25 -0
- package/dist/search/sampling.d.ts.map +1 -0
- package/dist/search/sampling.js +52 -0
- package/dist/search/sampling.js.map +1 -0
- package/dist/search/searxng.d.ts.map +1 -1
- package/dist/search/searxng.js +69 -79
- package/dist/search/searxng.js.map +1 -1
- package/dist/search/tokens.d.ts +3 -0
- package/dist/search/tokens.d.ts.map +1 -0
- package/dist/search/tokens.js +39 -0
- package/dist/search/tokens.js.map +1 -0
- package/dist/search/truncate.d.ts +6 -0
- package/dist/search/truncate.d.ts.map +1 -0
- package/dist/search/truncate.js +26 -0
- package/dist/search/truncate.js.map +1 -0
- package/dist/search/url-unwrap.d.ts +3 -0
- package/dist/search/url-unwrap.d.ts.map +1 -0
- package/dist/search/url-unwrap.js +43 -0
- package/dist/search/url-unwrap.js.map +1 -0
- package/dist/search/v1/context-rank.d.ts +13 -0
- package/dist/search/v1/context-rank.d.ts.map +1 -0
- package/dist/search/v1/context-rank.js +74 -0
- package/dist/search/v1/context-rank.js.map +1 -0
- package/dist/search/v1/engine-base.d.ts +27 -0
- package/dist/search/v1/engine-base.d.ts.map +1 -0
- package/dist/search/v1/engine-base.js +110 -0
- package/dist/search/v1/engine-base.js.map +1 -0
- package/dist/search/v1/intent-router.d.ts +22 -0
- package/dist/search/v1/intent-router.d.ts.map +1 -0
- package/dist/search/v1/intent-router.js +138 -0
- package/dist/search/v1/intent-router.js.map +1 -0
- package/dist/search/v1/orchestrator.d.ts +24 -0
- package/dist/search/v1/orchestrator.d.ts.map +1 -0
- package/dist/search/v1/orchestrator.js +163 -0
- package/dist/search/v1/orchestrator.js.map +1 -0
- package/dist/search/v1/recency-boost.d.ts +9 -0
- package/dist/search/v1/recency-boost.d.ts.map +1 -0
- package/dist/search/v1/recency-boost.js +37 -0
- package/dist/search/v1/recency-boost.js.map +1 -0
- package/dist/search/v1/recent-cache-dedup.d.ts +6 -0
- package/dist/search/v1/recent-cache-dedup.d.ts.map +1 -0
- package/dist/search/v1/recent-cache-dedup.js +85 -0
- package/dist/search/v1/recent-cache-dedup.js.map +1 -0
- package/dist/search/v1/rss/feed-config.d.ts +21 -0
- package/dist/search/v1/rss/feed-config.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-config.js +90 -0
- package/dist/search/v1/rss/feed-config.js.map +1 -0
- package/dist/search/v1/rss/feed-parser.d.ts +14 -0
- package/dist/search/v1/rss/feed-parser.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-parser.js +104 -0
- package/dist/search/v1/rss/feed-parser.js.map +1 -0
- package/dist/search/v1/rss/feed-poller.d.ts +22 -0
- package/dist/search/v1/rss/feed-poller.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-poller.js +102 -0
- package/dist/search/v1/rss/feed-poller.js.map +1 -0
- package/dist/search/v1/rss/feed-store.d.ts +30 -0
- package/dist/search/v1/rss/feed-store.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-store.js +134 -0
- package/dist/search/v1/rss/feed-store.js.map +1 -0
- package/dist/search/v1/rss/rss-engine.d.ts +6 -0
- package/dist/search/v1/rss/rss-engine.d.ts.map +1 -0
- package/dist/search/v1/rss/rss-engine.js +28 -0
- package/dist/search/v1/rss/rss-engine.js.map +1 -0
- package/dist/search/v1/v1-provider.d.ts +7 -0
- package/dist/search/v1/v1-provider.d.ts.map +1 -0
- package/dist/search/v1/v1-provider.js +68 -0
- package/dist/search/v1/v1-provider.js.map +1 -0
- package/dist/search/v1/verticals/code.d.ts +4 -0
- package/dist/search/v1/verticals/code.d.ts.map +1 -0
- package/dist/search/v1/verticals/code.js +20 -0
- package/dist/search/v1/verticals/code.js.map +1 -0
- package/dist/search/v1/verticals/docs.d.ts +4 -0
- package/dist/search/v1/verticals/docs.d.ts.map +1 -0
- package/dist/search/v1/verticals/docs.js +20 -0
- package/dist/search/v1/verticals/docs.js.map +1 -0
- package/dist/search/v1/verticals/general.d.ts +4 -0
- package/dist/search/v1/verticals/general.d.ts.map +1 -0
- package/dist/search/v1/verticals/general.js +22 -0
- package/dist/search/v1/verticals/general.js.map +1 -0
- package/dist/search/v1/verticals/news.d.ts +10 -0
- package/dist/search/v1/verticals/news.d.ts.map +1 -0
- package/dist/search/v1/verticals/news.js +52 -0
- package/dist/search/v1/verticals/news.js.map +1 -0
- package/dist/search/v1/verticals/papers.d.ts +4 -0
- package/dist/search/v1/verticals/papers.d.ts.map +1 -0
- package/dist/search/v1/verticals/papers.js +23 -0
- package/dist/search/v1/verticals/papers.js.map +1 -0
- package/dist/search/validator.js +31 -31
- package/dist/search/validator.js.map +1 -1
- package/dist/searxng/bootstrap.d.ts +30 -0
- package/dist/searxng/bootstrap.d.ts.map +1 -1
- package/dist/searxng/bootstrap.js +223 -85
- package/dist/searxng/bootstrap.js.map +1 -1
- package/dist/searxng/docker.d.ts.map +1 -1
- package/dist/searxng/docker.js +69 -60
- package/dist/searxng/docker.js.map +1 -1
- package/dist/searxng/process.d.ts +13 -1
- package/dist/searxng/process.d.ts.map +1 -1
- package/dist/searxng/process.js +231 -164
- package/dist/searxng/process.js.map +1 -1
- package/dist/server/backend-status.d.ts +13 -0
- package/dist/server/backend-status.d.ts.map +1 -0
- package/dist/server/backend-status.js +40 -0
- package/dist/server/backend-status.js.map +1 -0
- package/dist/server/tool-schemas.d.ts +549 -0
- package/dist/server/tool-schemas.d.ts.map +1 -0
- package/dist/server/tool-schemas.js +464 -0
- package/dist/server/tool-schemas.js.map +1 -0
- package/dist/server/warmup-on-start.d.ts +9 -0
- package/dist/server/warmup-on-start.d.ts.map +1 -0
- package/dist/server/warmup-on-start.js +55 -0
- package/dist/server/warmup-on-start.js.map +1 -0
- package/dist/server.d.ts +17 -0
- package/dist/server.d.ts.map +1 -1
- package/dist/server.js +454 -297
- package/dist/server.js.map +1 -1
- package/dist/tools/agent.d.ts +5 -0
- package/dist/tools/agent.d.ts.map +1 -0
- package/dist/tools/agent.js +128 -0
- package/dist/tools/agent.js.map +1 -0
- package/dist/tools/cache.d.ts +2 -1
- package/dist/tools/cache.d.ts.map +1 -1
- package/dist/tools/cache.js +175 -44
- package/dist/tools/cache.js.map +1 -1
- package/dist/tools/crawl.d.ts.map +1 -1
- package/dist/tools/crawl.js +171 -88
- package/dist/tools/crawl.js.map +1 -1
- package/dist/tools/extract.d.ts +2 -2
- package/dist/tools/extract.d.ts.map +1 -1
- package/dist/tools/extract.js +175 -59
- package/dist/tools/extract.js.map +1 -1
- package/dist/tools/fetch.d.ts +2 -2
- package/dist/tools/fetch.d.ts.map +1 -1
- package/dist/tools/fetch.js +161 -68
- package/dist/tools/fetch.js.map +1 -1
- package/dist/tools/find-similar.d.ts +5 -0
- package/dist/tools/find-similar.d.ts.map +1 -0
- package/dist/tools/find-similar.js +127 -0
- package/dist/tools/find-similar.js.map +1 -0
- package/dist/tools/research.d.ts +5 -0
- package/dist/tools/research.d.ts.map +1 -0
- package/dist/tools/research.js +107 -0
- package/dist/tools/research.js.map +1 -0
- package/dist/tools/search.d.ts +10 -2
- package/dist/tools/search.d.ts.map +1 -1
- package/dist/tools/search.js +13 -158
- package/dist/tools/search.js.map +1 -1
- package/dist/types.d.ts +350 -7
- package/dist/types.d.ts.map +1 -1
- package/dist/types.js +6 -1
- package/dist/types.js.map +1 -1
- package/dist/util/mode.d.ts +4 -0
- package/dist/util/mode.d.ts.map +1 -0
- package/dist/util/mode.js +34 -0
- package/dist/util/mode.js.map +1 -0
- package/package.json +78 -8
- package/dist/extraction/trafilatura.d.ts +0 -6
- package/dist/extraction/trafilatura.d.ts.map +0 -1
- package/dist/extraction/trafilatura.js +0 -105
- package/dist/extraction/trafilatura.js.map +0 -1
- package/dist/search/flashrank.d.ts +0 -12
- package/dist/search/flashrank.d.ts.map +0 -1
- package/dist/search/flashrank.js +0 -63
- package/dist/search/flashrank.js.map +0 -1
package/dist/fetch/router.js
CHANGED
|
@@ -1,89 +1,193 @@
|
|
|
1
|
-
import { getConfig } from
|
|
2
|
-
import { createLogger } from
|
|
3
|
-
import { contentAppearsEmpty } from
|
|
4
|
-
import { getAuthOptions } from
|
|
5
|
-
|
|
6
|
-
|
|
7
|
-
|
|
8
|
-
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
|
|
1
|
+
import { getConfig } from "../config.js";
|
|
2
|
+
import { createLogger } from "../logger.js";
|
|
3
|
+
import { contentAppearsEmpty } from "./content-check.js";
|
|
4
|
+
import { getAuthOptions } from "./auth.js";
|
|
5
|
+
import { fetchWithPlaywright, shouldEscalate } from "./playwright-tier.js";
|
|
6
|
+
class SmartRouter {
|
|
7
|
+
domainMap = /* @__PURE__ */ new Map();
|
|
8
|
+
httpClient;
|
|
9
|
+
browserPool;
|
|
10
|
+
httpFetcher;
|
|
11
|
+
playwrightFetcher;
|
|
12
|
+
constructor(httpClientOrOptions, browserPool) {
|
|
13
|
+
if (browserPool !== void 0) {
|
|
14
|
+
this.httpClient = httpClientOrOptions;
|
|
15
|
+
this.browserPool = browserPool;
|
|
16
|
+
} else if (httpClientOrOptions && typeof httpClientOrOptions === "object" && ("httpClient" in httpClientOrOptions || "browserPool" in httpClientOrOptions || "httpFetcher" in httpClientOrOptions || "playwrightFetcher" in httpClientOrOptions)) {
|
|
17
|
+
const opts = httpClientOrOptions;
|
|
18
|
+
if (!opts.httpFetcher && !opts.httpClient) {
|
|
19
|
+
throw new Error("SmartRouter: must provide either httpFetcher or httpClient in options");
|
|
20
|
+
}
|
|
21
|
+
this.httpClient = opts.httpClient;
|
|
22
|
+
this.browserPool = opts.browserPool;
|
|
23
|
+
this.httpFetcher = opts.httpFetcher ?? this.makeDefaultHttpFetcher();
|
|
24
|
+
this.playwrightFetcher = opts.playwrightFetcher ?? fetchWithPlaywright;
|
|
25
|
+
return;
|
|
26
|
+
} else {
|
|
27
|
+
this.httpClient = httpClientOrOptions;
|
|
12
28
|
}
|
|
13
|
-
|
|
14
|
-
|
|
15
|
-
|
|
16
|
-
|
|
17
|
-
|
|
18
|
-
|
|
19
|
-
|
|
20
|
-
|
|
21
|
-
|
|
22
|
-
|
|
23
|
-
|
|
24
|
-
|
|
25
|
-
|
|
26
|
-
|
|
27
|
-
|
|
28
|
-
|
|
29
|
-
|
|
30
|
-
|
|
31
|
-
|
|
32
|
-
|
|
33
|
-
|
|
34
|
-
|
|
35
|
-
|
|
36
|
-
|
|
37
|
-
|
|
38
|
-
|
|
39
|
-
|
|
40
|
-
|
|
41
|
-
|
|
42
|
-
|
|
43
|
-
|
|
44
|
-
|
|
45
|
-
|
|
46
|
-
|
|
47
|
-
|
|
48
|
-
|
|
49
|
-
|
|
50
|
-
|
|
51
|
-
|
|
52
|
-
|
|
53
|
-
|
|
54
|
-
|
|
55
|
-
|
|
56
|
-
|
|
57
|
-
|
|
58
|
-
|
|
59
|
-
|
|
60
|
-
|
|
61
|
-
|
|
62
|
-
|
|
29
|
+
this.httpFetcher = this.makeDefaultHttpFetcher();
|
|
30
|
+
this.playwrightFetcher = fetchWithPlaywright;
|
|
31
|
+
}
|
|
32
|
+
makeDefaultHttpFetcher() {
|
|
33
|
+
return async (url, opts) => {
|
|
34
|
+
if (!this.httpClient) {
|
|
35
|
+
throw new Error("SmartRouter: httpClient not configured");
|
|
36
|
+
}
|
|
37
|
+
const r = await this.httpClient.fetch(url, opts);
|
|
38
|
+
return { url: r.url, html: r.html, text: "" };
|
|
39
|
+
};
|
|
40
|
+
}
|
|
41
|
+
async fetch(url, options = {}) {
|
|
42
|
+
const { renderJs = "auto", useAuth = false, headers, screenshot, actions, mode, conditionalHeaders } = options;
|
|
43
|
+
const config = getConfig();
|
|
44
|
+
const logger = createLogger("fetch");
|
|
45
|
+
const threshold = config.browserFallbackThreshold;
|
|
46
|
+
const domain = new URL(url).hostname;
|
|
47
|
+
if (mode === "stealth") {
|
|
48
|
+
logger.debug("routing to stealth (static then escalate)", { url });
|
|
49
|
+
const staticResult = await this.httpFetcher(url, { headers });
|
|
50
|
+
this.ensureStats(domain);
|
|
51
|
+
if (!shouldEscalate(staticResult.text)) {
|
|
52
|
+
return {
|
|
53
|
+
url: staticResult.url,
|
|
54
|
+
finalUrl: staticResult.url,
|
|
55
|
+
html: staticResult.html,
|
|
56
|
+
contentType: "text/html",
|
|
57
|
+
statusCode: 200,
|
|
58
|
+
method: "http",
|
|
59
|
+
headers: {}
|
|
60
|
+
};
|
|
61
|
+
}
|
|
62
|
+
try {
|
|
63
|
+
const pw = await this.playwrightFetcher(url);
|
|
64
|
+
return {
|
|
65
|
+
url: staticResult.url,
|
|
66
|
+
finalUrl: staticResult.url,
|
|
67
|
+
html: pw.html,
|
|
68
|
+
contentType: "text/html",
|
|
69
|
+
statusCode: 200,
|
|
70
|
+
method: "playwright",
|
|
71
|
+
headers: {},
|
|
72
|
+
escalated: true
|
|
73
|
+
};
|
|
74
|
+
} catch (err) {
|
|
75
|
+
if (err instanceof Error && err.message === "playwright_not_installed") {
|
|
76
|
+
const hint = err.hint ?? "npx playwright install chromium";
|
|
77
|
+
return {
|
|
78
|
+
error: "playwright_not_installed",
|
|
79
|
+
error_reason: "Stealth mode requested but Playwright chromium is not installed",
|
|
80
|
+
stage: "fetch",
|
|
81
|
+
hint
|
|
82
|
+
};
|
|
63
83
|
}
|
|
84
|
+
return {
|
|
85
|
+
error: "playwright_fetch_failed",
|
|
86
|
+
error_reason: err instanceof Error ? err.message : String(err),
|
|
87
|
+
stage: "fetch",
|
|
88
|
+
hint: "Stealth fetch failed; check network or retry"
|
|
89
|
+
};
|
|
90
|
+
}
|
|
64
91
|
}
|
|
65
|
-
|
|
66
|
-
|
|
92
|
+
if (mode === "cache") {
|
|
93
|
+
if (actions && actions.length > 0) {
|
|
94
|
+
logger.warn("mode=cache ignores browser actions; switch to default/stealth to execute them", {
|
|
95
|
+
url,
|
|
96
|
+
actionCount: actions.length
|
|
97
|
+
});
|
|
98
|
+
}
|
|
99
|
+
logger.debug("routing to http (cache)", { url });
|
|
100
|
+
if (!this.httpClient) throw new Error("SmartRouter: httpClient not configured");
|
|
101
|
+
const result = await this.httpClient.fetch(url, {
|
|
102
|
+
headers,
|
|
103
|
+
timeoutMs: config.fastTimeoutMs,
|
|
104
|
+
conditionalHeaders
|
|
105
|
+
});
|
|
106
|
+
this.ensureStats(domain);
|
|
107
|
+
const raw = this.toRawFetchResult(result);
|
|
108
|
+
raw.jsRequired = result.statusCode === 304 ? false : contentAppearsEmpty(result.html);
|
|
109
|
+
return raw;
|
|
67
110
|
}
|
|
68
|
-
|
|
69
|
-
|
|
70
|
-
|
|
71
|
-
|
|
72
|
-
|
|
73
|
-
}
|
|
74
|
-
return stats;
|
|
111
|
+
if (actions && actions.length > 0) {
|
|
112
|
+
if (!this.browserPool) throw new Error("SmartRouter: browserPool not configured");
|
|
113
|
+
const authOptions = useAuth ? await getAuthOptions() ?? {} : {};
|
|
114
|
+
logger.debug("routing to playwright", { url, reason: "actions present" });
|
|
115
|
+
return this.browserPool.fetchWithBrowser(url, { headers, screenshot, actions, ...authOptions });
|
|
75
116
|
}
|
|
76
|
-
|
|
77
|
-
|
|
78
|
-
|
|
79
|
-
|
|
80
|
-
|
|
81
|
-
|
|
82
|
-
|
|
83
|
-
|
|
84
|
-
|
|
85
|
-
|
|
86
|
-
|
|
117
|
+
if (renderJs === "always" || useAuth) {
|
|
118
|
+
if (!this.browserPool) throw new Error("SmartRouter: browserPool not configured");
|
|
119
|
+
const authOptions = useAuth ? await getAuthOptions() ?? {} : {};
|
|
120
|
+
logger.debug("routing to playwright", { url, reason: useAuth ? "auth" : "render_js=always" });
|
|
121
|
+
return this.browserPool.fetchWithBrowser(url, { headers, screenshot, ...authOptions });
|
|
122
|
+
}
|
|
123
|
+
if (renderJs === "never") {
|
|
124
|
+
if (!this.httpClient) throw new Error("SmartRouter: httpClient not configured");
|
|
125
|
+
logger.debug("routing to http (never)", { url });
|
|
126
|
+
const result = await this.httpClient.fetch(url, { headers, conditionalHeaders });
|
|
127
|
+
this.ensureStats(domain);
|
|
128
|
+
return this.toRawFetchResult(result);
|
|
129
|
+
}
|
|
130
|
+
const stats = this.ensureStats(domain);
|
|
131
|
+
if (stats.preferPlaywright) {
|
|
132
|
+
if (!this.browserPool) throw new Error("SmartRouter: browserPool not configured");
|
|
133
|
+
logger.debug("routing to playwright (domain marked)", { url, domain });
|
|
134
|
+
return this.browserPool.fetchWithBrowser(url, { headers, screenshot });
|
|
135
|
+
}
|
|
136
|
+
try {
|
|
137
|
+
if (!this.httpClient) throw new Error("SmartRouter: httpClient not configured");
|
|
138
|
+
const result = await this.httpClient.fetch(url, { headers, conditionalHeaders });
|
|
139
|
+
if (result.statusCode === 304) {
|
|
140
|
+
return this.toRawFetchResult(result);
|
|
141
|
+
}
|
|
142
|
+
if (contentAppearsEmpty(result.html)) {
|
|
143
|
+
if (!this.browserPool) throw new Error("SmartRouter: browserPool not configured");
|
|
144
|
+
logger.info("SPA shell detected, marking domain for playwright", { url, domain });
|
|
145
|
+
stats.preferPlaywright = true;
|
|
146
|
+
return this.browserPool.fetchWithBrowser(url, { headers, screenshot });
|
|
147
|
+
}
|
|
148
|
+
return this.toRawFetchResult(result);
|
|
149
|
+
} catch (err) {
|
|
150
|
+
stats.failureCount++;
|
|
151
|
+
logger.warn("http fetch failed", {
|
|
152
|
+
url,
|
|
153
|
+
domain,
|
|
154
|
+
failureCount: stats.failureCount,
|
|
155
|
+
error: err instanceof Error ? err.message : String(err)
|
|
156
|
+
});
|
|
157
|
+
if (stats.failureCount >= threshold) {
|
|
158
|
+
if (!this.browserPool) throw new Error("SmartRouter: browserPool not configured");
|
|
159
|
+
logger.info("failure threshold reached, marking domain for playwright", { url, domain, threshold });
|
|
160
|
+
stats.preferPlaywright = true;
|
|
161
|
+
return this.browserPool.fetchWithBrowser(url, { headers, screenshot });
|
|
162
|
+
}
|
|
163
|
+
throw err;
|
|
164
|
+
}
|
|
165
|
+
}
|
|
166
|
+
getDomainStats(domain) {
|
|
167
|
+
return this.domainMap.get(domain);
|
|
168
|
+
}
|
|
169
|
+
ensureStats(domain) {
|
|
170
|
+
let stats = this.domainMap.get(domain);
|
|
171
|
+
if (!stats) {
|
|
172
|
+
stats = { failureCount: 0, preferPlaywright: false };
|
|
173
|
+
this.domainMap.set(domain, stats);
|
|
87
174
|
}
|
|
175
|
+
return stats;
|
|
176
|
+
}
|
|
177
|
+
toRawFetchResult(result) {
|
|
178
|
+
return {
|
|
179
|
+
url: result.url,
|
|
180
|
+
finalUrl: result.finalUrl,
|
|
181
|
+
html: result.html,
|
|
182
|
+
contentType: result.contentType,
|
|
183
|
+
statusCode: result.statusCode,
|
|
184
|
+
method: "http",
|
|
185
|
+
headers: result.headers,
|
|
186
|
+
rawBuffer: result.rawBuffer
|
|
187
|
+
};
|
|
188
|
+
}
|
|
88
189
|
}
|
|
190
|
+
export {
|
|
191
|
+
SmartRouter
|
|
192
|
+
};
|
|
89
193
|
//# sourceMappingURL=router.js.map
|
package/dist/fetch/router.js.map
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"router.js","sourceRoot":"","sources":["../../src/fetch/router.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,SAAS,EAAE,MAAM,cAAc,CAAC;AACzC,OAAO,EAAE,YAAY,EAAE,MAAM,cAAc,CAAC;AAC5C,OAAO,EAAE,mBAAmB,EAAE,MAAM,oBAAoB,CAAC;AACzD,OAAO,EAAE,cAAc,EAAE,MAAM,WAAW,CAAC;AAqC3C,MAAM,OAAO,WAAW;IAIH;IACA;IAJF,SAAS,GAAG,IAAI,GAAG,EAAuB,CAAC;IAE5D,YACmB,UAAsB,EACtB,WAAiC;QADjC,eAAU,GAAV,UAAU,CAAY;QACtB,gBAAW,GAAX,WAAW,CAAsB;IACjD,CAAC;IAEJ,KAAK,CAAC,KAAK,CAAC,GAAW,EAAE,UAA8B,EAAE;QACvD,MAAM,EAAE,QAAQ,GAAG,MAAM,EAAE,OAAO,GAAG,KAAK,EAAE,OAAO,EAAE,UAAU,EAAE,GAAG,OAAO,CAAC;QAC5E,MAAM,MAAM,GAAG,SAAS,EAAE,CAAC;QAC3B,MAAM,MAAM,GAAG,YAAY,CAAC,OAAO,CAAC,CAAC;QACrC,MAAM,SAAS,GAAG,MAAM,CAAC,wBAAwB,CAAC;QAClD,MAAM,MAAM,GAAG,IAAI,GAAG,CAAC,GAAG,CAAC,CAAC,QAAQ,CAAC;QAErC,kDAAkD;QAClD,IAAI,QAAQ,KAAK,QAAQ,IAAI,OAAO,EAAE,CAAC;YACrC,MAAM,WAAW,GAAG,OAAO,CAAC,CAAC,CAAC,CAAC,cAAc,EAAE,IAAI,EAAE,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC;YAC5D,MAAM,CAAC,KAAK,CAAC,uBAAuB,EAAE,EAAE,GAAG,EAAE,MAAM,EAAE,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,kBAAkB,EAAE,CAAC,CAAC;YAC9F,OAAO,IAAI,CAAC,WAAW,CAAC,gBAAgB,CAAC,GAAG,EAAE,EAAE,OAAO,EAAE,UAAU,EAAE,GAAG,WAAW,EAAE,CAAC,CAAC;QACzF,CAAC;QAED,yBAAyB;QACzB,IAAI,QAAQ,KAAK,OAAO,EAAE,CAAC;YACzB,MAAM,CAAC,KAAK,CAAC,yBAAyB,EAAE,EAAE,GAAG,EAAE,CAAC,CAAC;YACjD,MAAM,MAAM,GAAG,MAAM,IAAI,CAAC,UAAU,CAAC,KAAK,CAAC,GAAG,EAAE,EAAE,OAAO,EAAE,CAAC,CAAC;YAC7D,IAAI,CAAC,WAAW,CAAC,MAAM,CAAC,CAAC;YACzB,OAAO,IAAI,CAAC,gBAAgB,CAAC,MAAM,CAAC,CAAC;QACvC,CAAC;QAED,yDAAyD;QACzD,MAAM,KAAK,GAAG,IAAI,CAAC,WAAW,CAAC,MAAM,CAAC,CAAC;QAEvC,IAAI,KAAK,CAAC,gBAAgB,EAAE,CAAC;YAC3B,MAAM,CAAC,KAAK,CAAC,uCAAuC,EAAE,EAAE,GAAG,EAAE,MAAM,EAAE,CAAC,CAAC;YACvE,OAAO,IAAI,CAAC,WAAW,CAAC,gBAAgB,CAAC,GAAG,EAAE,EAAE,OAAO,EAAE,UAAU,EAAE,CAAC,CAAC;QACzE,CAAC;QAED,iBAAiB;QACjB,IAAI,CAAC;YACH,MAAM,MAAM,GAAG,MAAM,IAAI,CAAC,UAAU,CAAC,KAAK,CAAC,GAAG,EAAE,EAAE,OAAO,EAAE,CAAC,CAAC;YAE7D,sCAAsC;YACtC,IAAI,mBAAmB,CAAC,MAAM,CAAC,IAAI,CAAC,EAAE,CAAC;gBACrC,MAAM,CAAC,IAAI,CAAC,mDAAmD,EAAE,EAAE,GAAG,EAAE,MAAM,EAAE,CAAC,CAAC;gBAClF,KAAK,CAAC,gBAAgB,GAAG,IAAI,CAAC;gBAC9B,OAAO,IAAI,CAAC,WAAW,CAAC,gBAAgB,CAAC,GAAG,EAAE,EAAE,OAAO,EAAE,UAAU,EAAE,CAAC,CAAC;YACzE,CAAC;YAED,OAAO,IAAI,CAAC,gBAAgB,CAAC,MAAM,CAAC,CAAC;QACvC,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACb,KAAK,CAAC,YAAY,EAAE,CAAC;YACrB,MAAM,CAAC,IAAI,CAAC,mBAAmB,EAAE;gBAC/B,GAAG;gBACH,MAAM;gBACN,YAAY,EAAE,KAAK,CAAC,YAAY;gBAChC,KAAK,EAAE,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,GAAG,CAAC;aACxD,CAAC,CAAC;YAEH,IAAI,KAAK,CAAC,YAAY,IAAI,SAAS,EAAE,CAAC;gBACpC,MAAM,CAAC,IAAI,CAAC,0DAA0D,EAAE,EAAE,GAAG,EAAE,MAAM,EAAE,SAAS,EAAE,CAAC,CAAC;gBACpG,KAAK,CAAC,gBAAgB,GAAG,IAAI,CAAC;gBAC9B,OAAO,IAAI,CAAC,WAAW,CAAC,gBAAgB,CAAC,GAAG,EAAE,EAAE,OAAO,EAAE,UAAU,EAAE,CAAC,CAAC;YACzE,CAAC;YAED,MAAM,GAAG,CAAC;QACZ,CAAC;IACH,CAAC;IAED,cAAc,CAAC,MAAc;QAC3B,OAAO,IAAI,CAAC,SAAS,CAAC,GAAG,CAAC,MAAM,CAAC,CAAC;IACpC,CAAC;IAEO,WAAW,CAAC,MAAc;QAChC,IAAI,KAAK,GAAG,IAAI,CAAC,SAAS,CAAC,GAAG,CAAC,MAAM,CAAC,CAAC;QACvC,IAAI,CAAC,KAAK,EAAE,CAAC;YACX,KAAK,GAAG,EAAE,YAAY,EAAE,CAAC,EAAE,gBAAgB,EAAE,KAAK,EAAE,CAAC;YACrD,IAAI,CAAC,SAAS,CAAC,GAAG,CAAC,MAAM,EAAE,KAAK,CAAC,CAAC;QACpC,CAAC;QACD,OAAO,KAAK,CAAC;IACf,CAAC;IAEO,gBAAgB,CACtB,MAAgD;QAEhD,OAAO;YACL,GAAG,EAAE,MAAM,CAAC,GAAG;YACf,QAAQ,EAAE,MAAM,CAAC,QAAQ;YACzB,IAAI,EAAE,MAAM,CAAC,IAAI;YACjB,WAAW,EAAE,MAAM,CAAC,WAAW;YAC/B,UAAU,EAAE,MAAM,CAAC,UAAU;YAC7B,MAAM,EAAE,MAAM;YACd,OAAO,EAAE,MAAM,CAAC,OAAO;YACvB,SAAS,EAAE,MAAM,CAAC,SAAS;SAC5B,CAAC;IACJ,CAAC;CACF"}
|
|
1
|
+
{"version":3,"sources":["../../src/fetch/router.ts"],"sourcesContent":["import { getConfig } from '../config.js';\nimport { createLogger } from '../logger.js';\nimport { contentAppearsEmpty } from './content-check.js';\nimport { getAuthOptions } from './auth.js';\nimport { fetchWithPlaywright, shouldEscalate } from './playwright-tier.js';\nimport type { RawFetchResult, BrowserAction, Mode, StageError } from '../types.js';\n\nexport interface RouterFetchOptions {\n renderJs?: 'auto' | 'always' | 'never';\n useAuth?: boolean;\n headers?: Record<string, string>;\n screenshot?: boolean;\n actions?: BrowserAction[];\n force_refresh?: boolean;\n mode?: Mode;\n /**\n * Conditional-GET headers. When set, the HTTP path sends them with the\n * request and a 304 response is returned as RawFetchResult with\n * statusCode=304 + html=''. Routes that always escalate to Playwright\n * (renderJs=always, useAuth, actions) ignore these headers.\n */\n conditionalHeaders?: {\n ifNoneMatch?: string;\n ifModifiedSince?: string;\n };\n}\n\nexport interface HttpClient {\n fetch(\n url: string,\n options?: {\n headers?: Record<string, string>;\n timeoutMs?: number;\n conditionalHeaders?: {\n ifNoneMatch?: string;\n ifModifiedSince?: string;\n };\n },\n ): Promise<{\n url: string;\n finalUrl: string;\n html: string;\n contentType: string;\n statusCode: number;\n headers: Record<string, string>;\n rawBuffer?: Buffer;\n }>;\n}\n\nexport interface BrowserPoolInterface {\n fetchWithBrowser(\n url: string,\n options?: { headers?: Record<string, string>; storageStatePath?: string; userDataDir?: string; screenshot?: boolean; actions?: BrowserAction[]; cdpUrl?: string },\n ): Promise<RawFetchResult>;\n}\n\nexport type HttpFetcher = (\n url: string,\n options?: { headers?: Record<string, string>; timeoutMs?: number },\n) => Promise<{ url: string; html: string; text: string }>;\n\nexport type PlaywrightFetcher = (\n url: string,\n options?: { timeoutMs?: number },\n) => Promise<{ html: string; text: string }>;\n\nexport interface SmartRouterOptions {\n httpClient?: HttpClient;\n browserPool?: BrowserPoolInterface;\n httpFetcher?: HttpFetcher;\n playwrightFetcher?: PlaywrightFetcher;\n}\n\ninterface DomainStats {\n failureCount: number;\n preferPlaywright: boolean;\n}\n\nexport class SmartRouter {\n private readonly domainMap = new Map<string, DomainStats>();\n private readonly httpClient?: HttpClient;\n private readonly browserPool?: BrowserPoolInterface;\n private readonly httpFetcher: HttpFetcher;\n private readonly playwrightFetcher: PlaywrightFetcher;\n\n constructor(httpClient: HttpClient, browserPool: BrowserPoolInterface);\n constructor(options: SmartRouterOptions);\n constructor(\n httpClientOrOptions: HttpClient | SmartRouterOptions,\n browserPool?: BrowserPoolInterface,\n ) {\n if (browserPool !== undefined) {\n this.httpClient = httpClientOrOptions as HttpClient;\n this.browserPool = browserPool;\n } else if (\n httpClientOrOptions &&\n typeof httpClientOrOptions === 'object' &&\n ('httpClient' in httpClientOrOptions ||\n 'browserPool' in httpClientOrOptions ||\n 'httpFetcher' in httpClientOrOptions ||\n 'playwrightFetcher' in httpClientOrOptions)\n ) {\n const opts = httpClientOrOptions as SmartRouterOptions;\n if (!opts.httpFetcher && !opts.httpClient) {\n throw new Error('SmartRouter: must provide either httpFetcher or httpClient in options');\n }\n this.httpClient = opts.httpClient;\n this.browserPool = opts.browserPool;\n this.httpFetcher = opts.httpFetcher ?? this.makeDefaultHttpFetcher();\n this.playwrightFetcher = opts.playwrightFetcher ?? fetchWithPlaywright;\n return;\n } else {\n // Backwards-compat: single HttpClient positional (unusual but safe)\n this.httpClient = httpClientOrOptions as HttpClient;\n }\n this.httpFetcher = this.makeDefaultHttpFetcher();\n this.playwrightFetcher = fetchWithPlaywright;\n }\n\n private makeDefaultHttpFetcher(): HttpFetcher {\n return async (url, opts) => {\n if (!this.httpClient) {\n throw new Error('SmartRouter: httpClient not configured');\n }\n const r = await this.httpClient.fetch(url, opts);\n return { url: r.url, html: r.html, text: '' };\n };\n }\n\n async fetch(url: string, options: RouterFetchOptions & { mode: 'stealth' }): Promise<RawFetchResult | StageError>;\n async fetch(url: string, options?: RouterFetchOptions): Promise<RawFetchResult>;\n async fetch(\n url: string,\n options: RouterFetchOptions = {},\n ): Promise<RawFetchResult | StageError> {\n const { renderJs = 'auto', useAuth = false, headers, screenshot, actions, mode, conditionalHeaders } = options;\n const config = getConfig();\n const logger = createLogger('fetch');\n const threshold = config.browserFallbackThreshold;\n const domain = new URL(url).hostname;\n\n // Stealth mode: static fetch first, escalate to Playwright when content is thin.\n if (mode === 'stealth') {\n logger.debug('routing to stealth (static then escalate)', { url });\n const staticResult = await this.httpFetcher(url, { headers });\n this.ensureStats(domain);\n if (!shouldEscalate(staticResult.text)) {\n return {\n url: staticResult.url,\n finalUrl: staticResult.url,\n html: staticResult.html,\n contentType: 'text/html',\n statusCode: 200,\n method: 'http',\n headers: {},\n };\n }\n try {\n const pw = await this.playwrightFetcher(url);\n return {\n url: staticResult.url,\n finalUrl: staticResult.url,\n html: pw.html,\n contentType: 'text/html',\n statusCode: 200,\n method: 'playwright',\n headers: {},\n escalated: true,\n };\n } catch (err) {\n if (err instanceof Error && err.message === 'playwright_not_installed') {\n const hint = (err as Error & { hint?: string }).hint ?? 'npx playwright install chromium';\n return {\n error: 'playwright_not_installed',\n error_reason: 'Stealth mode requested but Playwright chromium is not installed',\n stage: 'fetch',\n hint,\n };\n }\n return {\n error: 'playwright_fetch_failed',\n error_reason: err instanceof Error ? err.message : String(err),\n stage: 'fetch',\n hint: 'Stealth fetch failed; check network or retry',\n };\n }\n }\n\n // Cache mode: HTTP-only with tight timeout, never escalates to a browser.\n if (mode === 'cache') {\n if (actions && actions.length > 0) {\n logger.warn('mode=cache ignores browser actions; switch to default/stealth to execute them', {\n url,\n actionCount: actions.length,\n });\n }\n logger.debug('routing to http (cache)', { url });\n if (!this.httpClient) throw new Error('SmartRouter: httpClient not configured');\n const result = await this.httpClient.fetch(url, {\n headers,\n timeoutMs: config.fastTimeoutMs,\n conditionalHeaders,\n });\n this.ensureStats(domain);\n const raw = this.toRawFetchResult(result);\n // Don't probe content of a 304 — body is empty by spec, not a SPA shell.\n raw.jsRequired = result.statusCode === 304 ? false : contentAppearsEmpty(result.html);\n return raw;\n }\n\n // Actions always force Playwright --- actions need a live browser page\n if (actions && actions.length > 0) {\n if (!this.browserPool) throw new Error('SmartRouter: browserPool not configured');\n const authOptions = useAuth ? (await getAuthOptions() ?? {}) : {};\n logger.debug('routing to playwright', { url, reason: 'actions present' });\n return this.browserPool.fetchWithBrowser(url, { headers, screenshot, actions, ...authOptions });\n }\n\n // Always Playwright for auth or explicit override\n if (renderJs === 'always' || useAuth) {\n if (!this.browserPool) throw new Error('SmartRouter: browserPool not configured');\n const authOptions = useAuth ? (await getAuthOptions() ?? {}) : {};\n logger.debug('routing to playwright', { url, reason: useAuth ? 'auth' : 'render_js=always' });\n return this.browserPool.fetchWithBrowser(url, { headers, screenshot, ...authOptions });\n }\n\n // HTTP only, no fallback\n if (renderJs === 'never') {\n if (!this.httpClient) throw new Error('SmartRouter: httpClient not configured');\n logger.debug('routing to http (never)', { url });\n const result = await this.httpClient.fetch(url, { headers, conditionalHeaders });\n this.ensureStats(domain);\n return this.toRawFetchResult(result);\n }\n\n // auto: check if domain is already marked for Playwright\n const stats = this.ensureStats(domain);\n\n if (stats.preferPlaywright) {\n if (!this.browserPool) throw new Error('SmartRouter: browserPool not configured');\n logger.debug('routing to playwright (domain marked)', { url, domain });\n return this.browserPool.fetchWithBrowser(url, { headers, screenshot });\n }\n\n // Try HTTP first\n try {\n if (!this.httpClient) throw new Error('SmartRouter: httpClient not configured');\n const result = await this.httpClient.fetch(url, { headers, conditionalHeaders });\n\n // 304 = unchanged: pass through; never escalate to a browser.\n if (result.statusCode === 304) {\n return this.toRawFetchResult(result);\n }\n\n // Check for SPA shell / empty content\n if (contentAppearsEmpty(result.html)) {\n if (!this.browserPool) throw new Error('SmartRouter: browserPool not configured');\n logger.info('SPA shell detected, marking domain for playwright', { url, domain });\n stats.preferPlaywright = true;\n return this.browserPool.fetchWithBrowser(url, { headers, screenshot });\n }\n\n return this.toRawFetchResult(result);\n } catch (err) {\n stats.failureCount++;\n logger.warn('http fetch failed', {\n url,\n domain,\n failureCount: stats.failureCount,\n error: err instanceof Error ? err.message : String(err),\n });\n\n if (stats.failureCount >= threshold) {\n if (!this.browserPool) throw new Error('SmartRouter: browserPool not configured');\n logger.info('failure threshold reached, marking domain for playwright', { url, domain, threshold });\n stats.preferPlaywright = true;\n return this.browserPool.fetchWithBrowser(url, { headers, screenshot });\n }\n\n throw err;\n }\n }\n\n getDomainStats(domain: string): DomainStats | undefined {\n return this.domainMap.get(domain);\n }\n\n private ensureStats(domain: string): DomainStats {\n let stats = this.domainMap.get(domain);\n if (!stats) {\n stats = { failureCount: 0, preferPlaywright: false };\n this.domainMap.set(domain, stats);\n }\n return stats;\n }\n\n private toRawFetchResult(\n result: Awaited<ReturnType<HttpClient['fetch']>>,\n ): RawFetchResult {\n return {\n url: result.url,\n finalUrl: result.finalUrl,\n html: result.html,\n contentType: result.contentType,\n statusCode: result.statusCode,\n method: 'http',\n headers: result.headers,\n rawBuffer: result.rawBuffer,\n };\n }\n}\n"],"mappings":"AAAA,SAAS,iBAAiB;AAC1B,SAAS,oBAAoB;AAC7B,SAAS,2BAA2B;AACpC,SAAS,sBAAsB;AAC/B,SAAS,qBAAqB,sBAAsB;AA0E7C,MAAM,YAAY;AAAA,EACN,YAAY,oBAAI,IAAyB;AAAA,EACzC;AAAA,EACA;AAAA,EACA;AAAA,EACA;AAAA,EAIjB,YACE,qBACA,aACA;AACA,QAAI,gBAAgB,QAAW;AAC7B,WAAK,aAAa;AAClB,WAAK,cAAc;AAAA,IACrB,WACE,uBACA,OAAO,wBAAwB,aAC9B,gBAAgB,uBACf,iBAAiB,uBACjB,iBAAiB,uBACjB,uBAAuB,sBACzB;AACA,YAAM,OAAO;AACb,UAAI,CAAC,KAAK,eAAe,CAAC,KAAK,YAAY;AACzC,cAAM,IAAI,MAAM,uEAAuE;AAAA,MACzF;AACA,WAAK,aAAa,KAAK;AACvB,WAAK,cAAc,KAAK;AACxB,WAAK,cAAc,KAAK,eAAe,KAAK,uBAAuB;AACnE,WAAK,oBAAoB,KAAK,qBAAqB;AACnD;AAAA,IACF,OAAO;AAEL,WAAK,aAAa;AAAA,IACpB;AACA,SAAK,cAAc,KAAK,uBAAuB;AAC/C,SAAK,oBAAoB;AAAA,EAC3B;AAAA,EAEQ,yBAAsC;AAC5C,WAAO,OAAO,KAAK,SAAS;AAC1B,UAAI,CAAC,KAAK,YAAY;AACpB,cAAM,IAAI,MAAM,wCAAwC;AAAA,MAC1D;AACA,YAAM,IAAI,MAAM,KAAK,WAAW,MAAM,KAAK,IAAI;AAC/C,aAAO,EAAE,KAAK,EAAE,KAAK,MAAM,EAAE,MAAM,MAAM,GAAG;AAAA,IAC9C;AAAA,EACF;AAAA,EAIA,MAAM,MACJ,KACA,UAA8B,CAAC,GACO;AACtC,UAAM,EAAE,WAAW,QAAQ,UAAU,OAAO,SAAS,YAAY,SAAS,MAAM,mBAAmB,IAAI;AACvG,UAAM,SAAS,UAAU;AACzB,UAAM,SAAS,aAAa,OAAO;AACnC,UAAM,YAAY,OAAO;AACzB,UAAM,SAAS,IAAI,IAAI,GAAG,EAAE;AAG5B,QAAI,SAAS,WAAW;AACtB,aAAO,MAAM,6CAA6C,EAAE,IAAI,CAAC;AACjE,YAAM,eAAe,MAAM,KAAK,YAAY,KAAK,EAAE,QAAQ,CAAC;AAC5D,WAAK,YAAY,MAAM;AACvB,UAAI,CAAC,eAAe,aAAa,IAAI,GAAG;AACtC,eAAO;AAAA,UACL,KAAK,aAAa;AAAA,UAClB,UAAU,aAAa;AAAA,UACvB,MAAM,aAAa;AAAA,UACnB,aAAa;AAAA,UACb,YAAY;AAAA,UACZ,QAAQ;AAAA,UACR,SAAS,CAAC;AAAA,QACZ;AAAA,MACF;AACA,UAAI;AACF,cAAM,KAAK,MAAM,KAAK,kBAAkB,GAAG;AAC3C,eAAO;AAAA,UACL,KAAK,aAAa;AAAA,UAClB,UAAU,aAAa;AAAA,UACvB,MAAM,GAAG;AAAA,UACT,aAAa;AAAA,UACb,YAAY;AAAA,UACZ,QAAQ;AAAA,UACR,SAAS,CAAC;AAAA,UACV,WAAW;AAAA,QACb;AAAA,MACF,SAAS,KAAK;AACZ,YAAI,eAAe,SAAS,IAAI,YAAY,4BAA4B;AACtE,gBAAM,OAAQ,IAAkC,QAAQ;AACxD,iBAAO;AAAA,YACL,OAAO;AAAA,YACP,cAAc;AAAA,YACd,OAAO;AAAA,YACP;AAAA,UACF;AAAA,QACF;AACA,eAAO;AAAA,UACL,OAAO;AAAA,UACP,cAAc,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,UAC7D,OAAO;AAAA,UACP,MAAM;AAAA,QACR;AAAA,MACF;AAAA,IACF;AAGA,QAAI,SAAS,SAAS;AACpB,UAAI,WAAW,QAAQ,SAAS,GAAG;AACjC,eAAO,KAAK,iFAAiF;AAAA,UAC3F;AAAA,UACA,aAAa,QAAQ;AAAA,QACvB,CAAC;AAAA,MACH;AACA,aAAO,MAAM,2BAA2B,EAAE,IAAI,CAAC;AAC/C,UAAI,CAAC,KAAK,WAAY,OAAM,IAAI,MAAM,wCAAwC;AAC9E,YAAM,SAAS,MAAM,KAAK,WAAW,MAAM,KAAK;AAAA,QAC9C;AAAA,QACA,WAAW,OAAO;AAAA,QAClB;AAAA,MACF,CAAC;AACD,WAAK,YAAY,MAAM;AACvB,YAAM,MAAM,KAAK,iBAAiB,MAAM;AAExC,UAAI,aAAa,OAAO,eAAe,MAAM,QAAQ,oBAAoB,OAAO,IAAI;AACpF,aAAO;AAAA,IACT;AAGA,QAAI,WAAW,QAAQ,SAAS,GAAG;AACjC,UAAI,CAAC,KAAK,YAAa,OAAM,IAAI,MAAM,yCAAyC;AAChF,YAAM,cAAc,UAAW,MAAM,eAAe,KAAK,CAAC,IAAK,CAAC;AAChE,aAAO,MAAM,yBAAyB,EAAE,KAAK,QAAQ,kBAAkB,CAAC;AACxE,aAAO,KAAK,YAAY,iBAAiB,KAAK,EAAE,SAAS,YAAY,SAAS,GAAG,YAAY,CAAC;AAAA,IAChG;AAGA,QAAI,aAAa,YAAY,SAAS;AACpC,UAAI,CAAC,KAAK,YAAa,OAAM,IAAI,MAAM,yCAAyC;AAChF,YAAM,cAAc,UAAW,MAAM,eAAe,KAAK,CAAC,IAAK,CAAC;AAChE,aAAO,MAAM,yBAAyB,EAAE,KAAK,QAAQ,UAAU,SAAS,mBAAmB,CAAC;AAC5F,aAAO,KAAK,YAAY,iBAAiB,KAAK,EAAE,SAAS,YAAY,GAAG,YAAY,CAAC;AAAA,IACvF;AAGA,QAAI,aAAa,SAAS;AACxB,UAAI,CAAC,KAAK,WAAY,OAAM,IAAI,MAAM,wCAAwC;AAC9E,aAAO,MAAM,2BAA2B,EAAE,IAAI,CAAC;AAC/C,YAAM,SAAS,MAAM,KAAK,WAAW,MAAM,KAAK,EAAE,SAAS,mBAAmB,CAAC;AAC/E,WAAK,YAAY,MAAM;AACvB,aAAO,KAAK,iBAAiB,MAAM;AAAA,IACrC;AAGA,UAAM,QAAQ,KAAK,YAAY,MAAM;AAErC,QAAI,MAAM,kBAAkB;AAC1B,UAAI,CAAC,KAAK,YAAa,OAAM,IAAI,MAAM,yCAAyC;AAChF,aAAO,MAAM,yCAAyC,EAAE,KAAK,OAAO,CAAC;AACrE,aAAO,KAAK,YAAY,iBAAiB,KAAK,EAAE,SAAS,WAAW,CAAC;AAAA,IACvE;AAGA,QAAI;AACF,UAAI,CAAC,KAAK,WAAY,OAAM,IAAI,MAAM,wCAAwC;AAC9E,YAAM,SAAS,MAAM,KAAK,WAAW,MAAM,KAAK,EAAE,SAAS,mBAAmB,CAAC;AAG/E,UAAI,OAAO,eAAe,KAAK;AAC7B,eAAO,KAAK,iBAAiB,MAAM;AAAA,MACrC;AAGA,UAAI,oBAAoB,OAAO,IAAI,GAAG;AACpC,YAAI,CAAC,KAAK,YAAa,OAAM,IAAI,MAAM,yCAAyC;AAChF,eAAO,KAAK,qDAAqD,EAAE,KAAK,OAAO,CAAC;AAChF,cAAM,mBAAmB;AACzB,eAAO,KAAK,YAAY,iBAAiB,KAAK,EAAE,SAAS,WAAW,CAAC;AAAA,MACvE;AAEA,aAAO,KAAK,iBAAiB,MAAM;AAAA,IACrC,SAAS,KAAK;AACZ,YAAM;AACN,aAAO,KAAK,qBAAqB;AAAA,QAC/B;AAAA,QACA;AAAA,QACA,cAAc,MAAM;AAAA,QACpB,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,MACxD,CAAC;AAED,UAAI,MAAM,gBAAgB,WAAW;AACnC,YAAI,CAAC,KAAK,YAAa,OAAM,IAAI,MAAM,yCAAyC;AAChF,eAAO,KAAK,4DAA4D,EAAE,KAAK,QAAQ,UAAU,CAAC;AAClG,cAAM,mBAAmB;AACzB,eAAO,KAAK,YAAY,iBAAiB,KAAK,EAAE,SAAS,WAAW,CAAC;AAAA,MACvE;AAEA,YAAM;AAAA,IACR;AAAA,EACF;AAAA,EAEA,eAAe,QAAyC;AACtD,WAAO,KAAK,UAAU,IAAI,MAAM;AAAA,EAClC;AAAA,EAEQ,YAAY,QAA6B;AAC/C,QAAI,QAAQ,KAAK,UAAU,IAAI,MAAM;AACrC,QAAI,CAAC,OAAO;AACV,cAAQ,EAAE,cAAc,GAAG,kBAAkB,MAAM;AACnD,WAAK,UAAU,IAAI,QAAQ,KAAK;AAAA,IAClC;AACA,WAAO;AAAA,EACT;AAAA,EAEQ,iBACN,QACgB;AAChB,WAAO;AAAA,MACL,KAAK,OAAO;AAAA,MACZ,UAAU,OAAO;AAAA,MACjB,MAAM,OAAO;AAAA,MACb,aAAa,OAAO;AAAA,MACpB,YAAY,OAAO;AAAA,MACnB,QAAQ;AAAA,MACR,SAAS,OAAO;AAAA,MAChB,WAAW,OAAO;AAAA,IACpB;AAAA,EACF;AACF;","names":[]}
|
package/dist/index.js
CHANGED
|
@@ -1,22 +1,102 @@
|
|
|
1
1
|
#!/usr/bin/env node
|
|
2
|
-
import { parseCommand } from
|
|
3
|
-
import { runWarmup } from
|
|
4
|
-
import { runDaemon } from
|
|
5
|
-
import { runHealthCheck } from
|
|
6
|
-
import {
|
|
2
|
+
import { parseCommand } from "./cli/index.js";
|
|
3
|
+
import { runWarmup } from "./cli/warmup.js";
|
|
4
|
+
import { runDaemon } from "./cli/daemon.js";
|
|
5
|
+
import { runHealthCheck } from "./cli/health.js";
|
|
6
|
+
import { runDoctor } from "./cli/doctor.js";
|
|
7
|
+
import { runShell } from "./cli/shell.js";
|
|
8
|
+
import { runAuth } from "./cli/auth.js";
|
|
9
|
+
import { runPluginCommand } from "./cli/plugin.js";
|
|
10
|
+
import { runInit } from "./cli/init.js";
|
|
11
|
+
import { runUninstall } from "./cli/uninstall.js";
|
|
12
|
+
import { runSetupMcp } from "./cli/setup-mcp.js";
|
|
13
|
+
import { runStatus } from "./cli/status.js";
|
|
14
|
+
import { runBackfill } from "./cli/backfill.js";
|
|
15
|
+
import { printHelp, printVersion, printUnknownCommand } from "./cli/help.js";
|
|
16
|
+
import { getConfig } from "./config.js";
|
|
17
|
+
import { startServer } from "./server.js";
|
|
7
18
|
const { command, args } = parseCommand(process.argv.slice(2));
|
|
8
19
|
switch (command) {
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
|
|
13
|
-
|
|
14
|
-
|
|
15
|
-
|
|
16
|
-
|
|
17
|
-
|
|
18
|
-
|
|
19
|
-
|
|
20
|
-
|
|
20
|
+
case "warmup":
|
|
21
|
+
await runWarmup(args);
|
|
22
|
+
process.exit(0);
|
|
23
|
+
break;
|
|
24
|
+
case "serve":
|
|
25
|
+
runDaemon(args);
|
|
26
|
+
break;
|
|
27
|
+
case "health": {
|
|
28
|
+
const exitCode = await runHealthCheck();
|
|
29
|
+
process.exit(exitCode);
|
|
30
|
+
break;
|
|
31
|
+
}
|
|
32
|
+
case "doctor": {
|
|
33
|
+
const code = await runDoctor(getConfig().dataDir);
|
|
34
|
+
process.exit(code);
|
|
35
|
+
break;
|
|
36
|
+
}
|
|
37
|
+
case "auth": {
|
|
38
|
+
const authCode = await runAuth(args);
|
|
39
|
+
process.exit(authCode);
|
|
40
|
+
break;
|
|
41
|
+
}
|
|
42
|
+
case "shell":
|
|
43
|
+
await runShell(args);
|
|
44
|
+
break;
|
|
45
|
+
case "plugin":
|
|
46
|
+
runPluginCommand(args);
|
|
47
|
+
break;
|
|
48
|
+
case "init": {
|
|
49
|
+
const initCode = await runInit(args);
|
|
50
|
+
process.exit(initCode);
|
|
51
|
+
break;
|
|
52
|
+
}
|
|
53
|
+
case "uninstall": {
|
|
54
|
+
const uninstallCode = await runUninstall(args);
|
|
55
|
+
process.exit(uninstallCode);
|
|
56
|
+
break;
|
|
57
|
+
}
|
|
58
|
+
case "setup": {
|
|
59
|
+
const code = await runSetupMcp(args);
|
|
60
|
+
process.exit(code);
|
|
61
|
+
break;
|
|
62
|
+
}
|
|
63
|
+
case "status": {
|
|
64
|
+
const code = await runStatus(args);
|
|
65
|
+
process.exit(code);
|
|
66
|
+
break;
|
|
67
|
+
}
|
|
68
|
+
case "backfill": {
|
|
69
|
+
const code = await runBackfill(args);
|
|
70
|
+
process.exit(code);
|
|
71
|
+
break;
|
|
72
|
+
}
|
|
73
|
+
case "help":
|
|
74
|
+
printHelp();
|
|
75
|
+
process.exit(0);
|
|
76
|
+
break;
|
|
77
|
+
case "version":
|
|
78
|
+
printVersion();
|
|
79
|
+
process.exit(0);
|
|
80
|
+
break;
|
|
81
|
+
case "unknown":
|
|
82
|
+
printUnknownCommand(args[0] ?? "");
|
|
83
|
+
process.exit(1);
|
|
84
|
+
break;
|
|
85
|
+
case "mcp": {
|
|
86
|
+
const config = getConfig();
|
|
87
|
+
try {
|
|
88
|
+
const { tryConnectDaemon } = await import("./daemon/proxy.js");
|
|
89
|
+
const report = await tryConnectDaemon(config.daemonPort, config.daemonHost);
|
|
90
|
+
if (report) {
|
|
91
|
+
process.stderr.write(
|
|
92
|
+
`[wigolo] Daemon detected at ${config.daemonHost}:${config.daemonPort} (status: ${report.status}). Full proxy deferred to v2.1; starting local server.
|
|
93
|
+
`
|
|
94
|
+
);
|
|
95
|
+
}
|
|
96
|
+
} catch {
|
|
97
|
+
}
|
|
98
|
+
await startServer();
|
|
99
|
+
break;
|
|
100
|
+
}
|
|
21
101
|
}
|
|
22
102
|
//# sourceMappingURL=index.js.map
|
package/dist/index.js.map
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"
|
|
1
|
+
{"version":3,"sources":["../src/index.ts"],"sourcesContent":["#!/usr/bin/env node\n\nimport { parseCommand } from './cli/index.js';\nimport { runWarmup } from './cli/warmup.js';\nimport { runDaemon } from './cli/daemon.js';\nimport { runHealthCheck } from './cli/health.js';\nimport { runDoctor } from './cli/doctor.js';\nimport { runShell } from './cli/shell.js';\nimport { runAuth } from './cli/auth.js';\nimport { runPluginCommand } from './cli/plugin.js';\nimport { runInit } from './cli/init.js';\nimport { runUninstall } from './cli/uninstall.js';\nimport { runSetupMcp } from './cli/setup-mcp.js';\nimport { runStatus } from './cli/status.js';\nimport { runBackfill } from './cli/backfill.js';\nimport { printHelp, printVersion, printUnknownCommand } from './cli/help.js';\nimport { getConfig } from './config.js';\nimport { startServer } from './server.js';\n\nconst { command, args } = parseCommand(process.argv.slice(2));\n\nswitch (command) {\n case 'warmup':\n await runWarmup(args);\n // Explicit exit for clean teardown — ensures all child subprocesses\n // (reranker, embedding) are reaped before Node returns.\n process.exit(0);\n break;\n\n case 'serve':\n runDaemon(args);\n break;\n\n case 'health': {\n const exitCode = await runHealthCheck();\n process.exit(exitCode);\n break;\n }\n\n case 'doctor': {\n const code = await runDoctor(getConfig().dataDir);\n process.exit(code);\n break;\n }\n\n case 'auth': {\n const authCode = await runAuth(args);\n process.exit(authCode);\n break;\n }\n\n case 'shell':\n await runShell(args);\n break;\n\n case 'plugin':\n runPluginCommand(args);\n break;\n\n case 'init': {\n const initCode = await runInit(args);\n process.exit(initCode);\n break;\n }\n\n case 'uninstall': {\n const uninstallCode = await runUninstall(args);\n process.exit(uninstallCode);\n break;\n }\n\n case 'setup': {\n const code = await runSetupMcp(args);\n process.exit(code);\n break;\n }\n\n case 'status': {\n const code = await runStatus(args);\n process.exit(code);\n break;\n }\n\n case 'backfill': {\n const code = await runBackfill(args);\n process.exit(code);\n break;\n }\n\n case 'help':\n printHelp();\n process.exit(0);\n break;\n\n case 'version':\n printVersion();\n process.exit(0);\n break;\n\n case 'unknown':\n printUnknownCommand(args[0] ?? '');\n process.exit(1);\n break;\n\n case 'mcp': {\n const config = getConfig();\n\n try {\n const { tryConnectDaemon } = await import('./daemon/proxy.js');\n const report = await tryConnectDaemon(config.daemonPort, config.daemonHost);\n if (report) {\n process.stderr.write(\n `[wigolo] Daemon detected at ${config.daemonHost}:${config.daemonPort} ` +\n `(status: ${report.status}). Full proxy deferred to v2.1; starting local server.\\n`,\n );\n }\n } catch {\n // Daemon proxy module may not be available -- fall through to local server\n }\n\n await startServer();\n break;\n }\n}\n"],"mappings":";AAEA,SAAS,oBAAoB;AAC7B,SAAS,iBAAiB;AAC1B,SAAS,iBAAiB;AAC1B,SAAS,sBAAsB;AAC/B,SAAS,iBAAiB;AAC1B,SAAS,gBAAgB;AACzB,SAAS,eAAe;AACxB,SAAS,wBAAwB;AACjC,SAAS,eAAe;AACxB,SAAS,oBAAoB;AAC7B,SAAS,mBAAmB;AAC5B,SAAS,iBAAiB;AAC1B,SAAS,mBAAmB;AAC5B,SAAS,WAAW,cAAc,2BAA2B;AAC7D,SAAS,iBAAiB;AAC1B,SAAS,mBAAmB;AAE5B,MAAM,EAAE,SAAS,KAAK,IAAI,aAAa,QAAQ,KAAK,MAAM,CAAC,CAAC;AAE5D,QAAQ,SAAS;AAAA,EACf,KAAK;AACH,UAAM,UAAU,IAAI;AAGpB,YAAQ,KAAK,CAAC;AACd;AAAA,EAEF,KAAK;AACH,cAAU,IAAI;AACd;AAAA,EAEF,KAAK,UAAU;AACb,UAAM,WAAW,MAAM,eAAe;AACtC,YAAQ,KAAK,QAAQ;AACrB;AAAA,EACF;AAAA,EAEA,KAAK,UAAU;AACb,UAAM,OAAO,MAAM,UAAU,UAAU,EAAE,OAAO;AAChD,YAAQ,KAAK,IAAI;AACjB;AAAA,EACF;AAAA,EAEA,KAAK,QAAQ;AACX,UAAM,WAAW,MAAM,QAAQ,IAAI;AACnC,YAAQ,KAAK,QAAQ;AACrB;AAAA,EACF;AAAA,EAEA,KAAK;AACH,UAAM,SAAS,IAAI;AACnB;AAAA,EAEF,KAAK;AACH,qBAAiB,IAAI;AACrB;AAAA,EAEF,KAAK,QAAQ;AACX,UAAM,WAAW,MAAM,QAAQ,IAAI;AACnC,YAAQ,KAAK,QAAQ;AACrB;AAAA,EACF;AAAA,EAEA,KAAK,aAAa;AAChB,UAAM,gBAAgB,MAAM,aAAa,IAAI;AAC7C,YAAQ,KAAK,aAAa;AAC1B;AAAA,EACF;AAAA,EAEA,KAAK,SAAS;AACZ,UAAM,OAAO,MAAM,YAAY,IAAI;AACnC,YAAQ,KAAK,IAAI;AACjB;AAAA,EACF;AAAA,EAEA,KAAK,UAAU;AACb,UAAM,OAAO,MAAM,UAAU,IAAI;AACjC,YAAQ,KAAK,IAAI;AACjB;AAAA,EACF;AAAA,EAEA,KAAK,YAAY;AACf,UAAM,OAAO,MAAM,YAAY,IAAI;AACnC,YAAQ,KAAK,IAAI;AACjB;AAAA,EACF;AAAA,EAEA,KAAK;AACH,cAAU;AACV,YAAQ,KAAK,CAAC;AACd;AAAA,EAEF,KAAK;AACH,iBAAa;AACb,YAAQ,KAAK,CAAC;AACd;AAAA,EAEF,KAAK;AACH,wBAAoB,KAAK,CAAC,KAAK,EAAE;AACjC,YAAQ,KAAK,CAAC;AACd;AAAA,EAEF,KAAK,OAAO;AACV,UAAM,SAAS,UAAU;AAEzB,QAAI;AACF,YAAM,EAAE,iBAAiB,IAAI,MAAM,OAAO,mBAAmB;AAC7D,YAAM,SAAS,MAAM,iBAAiB,OAAO,YAAY,OAAO,UAAU;AAC1E,UAAI,QAAQ;AACV,gBAAQ,OAAO;AAAA,UACb,+BAA+B,OAAO,UAAU,IAAI,OAAO,UAAU,aACzD,OAAO,MAAM;AAAA;AAAA,QAC3B;AAAA,MACF;AAAA,IACF,QAAQ;AAAA,IAER;AAEA,UAAM,YAAY;AAClB;AAAA,EACF;AACF;","names":[]}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* LLM knowledge layer for wigolo.
|
|
3
|
+
*
|
|
4
|
+
* Two layers. They do different jobs and must not repeat each other:
|
|
5
|
+
*
|
|
6
|
+
* Layer 1 — WIGOLO_INSTRUCTIONS: server-level STRATEGY. Injected into the
|
|
7
|
+
* LLM system prompt once per session by compatible MCP clients. Answers
|
|
8
|
+
* "when do I reach for wigolo? which of its tools fits this situation?".
|
|
9
|
+
*
|
|
10
|
+
* Layer 2 — TOOL_DESCRIPTIONS: per-tool TACTICS. Seen every time the LLM is
|
|
11
|
+
* picking a tool. Answers "what does this tool do, which parameters matter,
|
|
12
|
+
* what does the output look like?".
|
|
13
|
+
*
|
|
14
|
+
* Parameter schemas (types, enums, required/optional) belong on the JSON
|
|
15
|
+
* Schema, not here. Installation/configuration is for humans, not LLMs.
|
|
16
|
+
*/
|
|
17
|
+
export declare const WIGOLO_INSTRUCTIONS = "Wigolo is a local-first web access layer: search, fetch, crawl, cache, extract, find_similar, research, agent. Results persist in a local knowledge cache across sessions.\n\n## Host-LLM synthesis (read this first)\n\nWigolo returns *structured evidence* \u2014 YOU write the final answer.\n\n- `search` \u2192 evidence (title/url/excerpt/score/citation_id/source_span) + citations. Quote [N] or {citation_id}.\n- `format: 'answer'|'stream_answer'` \u2192 LLM synthesis when sampling supported; else evidence fallback.\n- `research` \u2192 `brief` with topics/highlights/key_findings/sections; use `sections.overview.cross_references` for corroborated findings, `sections.gaps` for coverage limits.\n- `find_similar` \u2192 `cold_start` string when local signals weak. Pass to user verbatim.\n- `extract mode: \"structured\"` \u2192 tables + definitions + jsonld + chart_hints + key_value_pairs in one call.\n- Common knobs: `max_tokens_out` caps output (cl100k-base); `include_full_markdown: true` restores full body; `citation_format`: `'numbered'`|`'json'`|`'anthropic_tags'`.\n\n## When to use which tool\n\n- `search` \u2014 info on a topic, no URL yet. Pass a string or array of 3-5 keyword variants for breadth.\n- `fetch` \u2014 you already have a URL.\n- `crawl` \u2014 many pages from one site (docs, wikis). `strategy: \"sitemap\"` is fastest for doc sites; `\"map\"` for URL-only discovery.\n- `cache` \u2014 check the local store before going to the network.\n- `extract` \u2014 specific data points (tables, metadata, schema-shaped fields) rather than a whole page.\n- `find_similar` \u2014 \"more like this\" given a URL or concept.\n- `research` \u2014 multi-step investigation: decomposition, parallel search, synthesis. Set `depth` to control thoroughness.\n- `agent` \u2014 natural-language data gathering across sources, optional `schema` for structured output.\n\n## Scope and freshness\n\n- Library/framework/SDK queries: **always pass `include_domains`** with the official site (e.g. `[\"react.dev\", \"nextjs.org\"]`). Unscoped queries return noise. Skip scoping for error strings, news, and broad exploration.\n- News, prices, status, release notes \u2192 `force_refresh: true` to bypass cache. Docs and reference pages \u2192 let the cache work.\n\nFor routing tables, performance budgets, auth flows, and other usage detail, read the resource `wigolo://docs/usage`.";
|
|
18
|
+
export declare const WIGOLO_INSTRUCTIONS_FULL = "# Wigolo Usage Guide\n\nWigolo is a local-first web access layer: search the open web, fetch pages, crawl sites, extract structured data, find related content, run multi-step research, and execute agent-driven data gathering. All results land in a local knowledge cache that persists across sessions.\n\n## Host-LLM synthesis pattern (read this first)\n\nWigolo has no internal LLM. It returns *structured evidence* so YOU (the host LLM) write the final answer. Fold structure into your reply:\n\n- `search` \u2192 evidence (title/url/section_heading/excerpt/score/citation_id/source_span) + citations. Quote [N] or {citation_id}.\n- `format: 'answer'|'stream_answer'` \u2192 LLM synthesis when sampling supported; else evidence fallback.\n- `max_tokens_out` caps total output (cl100k-base, ~5-15% drift on non-OpenAI). `include_full_markdown: true` restores full body. `citation_format`: `'numbered'`|`'json'`|`'anthropic_tags'`.\n- `research` \u2192 `brief` with `topics`, `highlights`, `key_findings`, `sections` when sampling unavailable. Use `sections.overview.cross_references` for corroborated findings, `sections.gaps` for coverage limits, `sections.comparison` for entity-vs-entity analysis. `query_type` indicates decomposition strategy used.\n- `find_similar` \u2192 `cold_start` string when local signals are weak. Pass to user verbatim.\n- `extract` `mode: \"structured\"` \u2192 tables + definitions + jsonld + chart_hints + key_value_pairs in one call.\n- `fetch` metadata \u2192 `og_type`, `canonical_url`, `og_image` when present.\n\n## When to use which tool\n\n- `search` -- you need information on a topic but do not have a URL yet. Pass a query string or an array of 3-5 semantically varied keyword forms for broader coverage.\n- `fetch` -- you already have a specific URL to read.\n- `crawl` -- you need multiple pages from the same site (docs, wikis, references).\n- `cache` -- you want to know if the content is already on disk from an earlier read.\n- `extract` -- you need specific data points (tables, metadata, schema-shaped fields) rather than a whole page as markdown.\n- `find_similar` -- you have a URL or concept and want related content from the cache or web. Useful for \"more like this\" discovery.\n- `research` -- you have a complex question that needs multi-step investigation: question decomposition, parallel search, source synthesis into a report. Set `depth` to control thoroughness.\n- `agent` -- you need to gather structured or unstructured data from multiple sources based on a natural-language prompt. Provides full step transparency.\n\n## Routing by intent\n\n| Intent | Tool | Key parameters |\n|--------|------|----------------|\n| Documentation lookup | `search` | `include_domains: [\"react.dev\", \"nextjs.org\"]` -- scope to the project's official site, do not rely on `category: \"docs\"` alone |\n| Error debugging | `search` | exact error string as query, `category: \"code\"` (no domain scoping -- errors appear everywhere) |\n| Library research | `crawl` | seed URL of docs site, `strategy: \"sitemap\"`, then `cache` for later queries |\n| Related content | `find_similar` | `url` of a known good page, or `concept` as free text |\n| Evidence excerpt | `search` | default output; cite [N] or {citation_id} from each evidence item |\n| Direct answer | `search` | `format: \"answer\"` if client supports sampling, else falls back to evidence |\n| Comprehensive research | `research` | `depth: \"comprehensive\"`, optional `include_domains` to scope |\n| Data gathering | `agent` | natural-language `prompt`, optional `schema` for structured output |\n| Structured extraction | `extract` | `mode: \"structured\"` (tables + dl + JSON-LD + chart hints + kv pairs), or `mode: \"schema\"` with a JSON Schema |\n| Site inventory | `crawl` | `strategy: \"map\"` for URL-only discovery, no content fetched |\n\n## Rapidly changing content\n\nFor news, prices, status pages, or release notes, bypass the cache with `force_refresh: true`:\n\n search({ query: \"...\", force_refresh: true })\n fetch({ url: \"...\", force_refresh: true })\n\nFor docs, tutorials, and reference pages, let the cache work -- much faster.\n\n## Check the cache before going to the network\n\nBefore every `search` or `fetch`, consider a `cache` call. Pages read this session or earlier return instantly with full markdown -- no network. `research` and `agent` check the cache internally.\n\n## Multi-query search strategy\n\nFor broad queries, pass an array of 3-5 semantically varied keyword forms rather than one natural-language question. Example: instead of \"how does React handle state management\", pass `[\"react state management\", \"useState useReducer\", \"react hooks state\", \"react context vs redux\"]`. Sub-queries are deduplicated automatically.\n\n## Pick the right strategy\n\n- For docs sites, prefer `crawl` with `strategy: \"sitemap\"` -- faster and more complete than BFS.\n- For URL discovery only, use `crawl` with `strategy: \"map\"` -- URLs only, no content. Follow with targeted `fetch` calls.\n- For structured data (prices, specs, table rows), use `extract` with `mode: \"schema\"` or `mode: \"tables\"`. Use `fetch` only when you want the whole page as markdown.\n- For multi-source synthesis, use `research` instead of chaining `search` + `fetch` manually.\n- For natural-language data gathering, use `agent` with optional `schema`.\n- `crawl` accepts regex `include_patterns` and `exclude_patterns` to stay inside a section of a large site.\n\n## Scope searches by domain\n\nFor library/framework/SDK queries, **always pass `include_domains`** with official sites. Unscoped queries return generic noise. `category: \"docs\"` alone returns generic portals -- pair with `include_domains` or omit. Skip domain scoping for error strings, broad exploration, and news.\n\n## Performance\n\n- `max_results: 3` for focused lookups; `5` default; `10+` only for broad research.\n- `max_tokens_out` caps total response size (cl100k-base BPE); prefer this over `max_chars` for budget-aware agents. When both are set, `max_tokens_out` wins.\n- `max_content_chars: 3000` remains a legitimate per-page budget \u2014 smart-truncates each result's markdown at a paragraph/heading boundary with a `[... content truncated]` marker.\n- `fetch` with `section: \"Heading Name\"` returns content under that heading -- cheaper than the whole page.\n- Repeated fetches of the same URL are free (local cache).\n- `research` with `depth: \"quick\"` (~15s) suits most factual questions; reserve `\"comprehensive\"` for deep investigation.\n- `agent` respects `max_pages` (default 10) and `max_time_ms` (default 60s).\n\n## Extras\n\n- Localhost URLs (`localhost:3000`, `127.0.0.1:8080`) work for local dev servers.\n- `use_auth: true` on `fetch`/`crawl` reuses browser session for logged-in pages.\n- `cache` supports full-text search syntax (`AND`, `OR`, `NOT`, `\"phrase\"`).\n- `research`/`agent` use MCP sampling when supported; fall back to structured data for host-LLM synthesis.";
|
|
19
|
+
export declare const WIGOLO_DOCS_URI = "wigolo://docs/usage";
|
|
20
|
+
export declare const TOOL_DESCRIPTIONS: {
|
|
21
|
+
readonly fetch: "Fetch a single URL and return clean markdown. Use when you have a specific URL to read. Automatically detects if JavaScript rendering is needed.\n\nKey parameters:\n- section: extract content under a specific heading (e.g., section: \"API Reference\") -- faster than reading the whole page\n- max_content_chars: smart-truncate markdown at a paragraph/heading boundary with a `[... content truncated]` marker (e.g., 3000 for compact context). Preferred over max_chars for AI agents.\n- max_tokens_out: token-budget cap on total output (cl100k-base BPE). Takes precedence over max_chars when both are set.\n- include_full_markdown: default false. Set true to include the full markdown body in addition to evidence excerpts.\n- citation_format: 'numbered' (default) | 'json' | 'anthropic_tags'.\n- use_auth: true to use stored browser session for authenticated/private pages\n- render_js: \"auto\" (default, detects JS need), \"always\" (force browser), \"never\" (HTTP only, fastest)\n- headers: custom HTTP headers if needed\n- force_refresh: true to bypass cache and fetch fresh content from the network\n- mode: 'cache' | 'default' (default) | 'stealth'. cache=HTTP-only, accepts stale cache up to 24h. stealth=full browser render + freshness.\n\nReturns title, markdown, links, images, metadata (og_image, og_type, canonical_url, keywords). Cached locally; repeat fetches are instant. Localhost URLs work.";
|
|
22
|
+
readonly search: "Search the web and return scored evidence excerpts (title/url/section_heading/excerpt/score/citation_id/source_span) plus citations. Default shape is evidence-only — no full markdown body.\n\nKey parameters:\n- query: string or string[] array (3-5 keyword variants; deduplicated automatically)\n- include_domains/exclude_domains: scope to specific sites. ALWAYS scope library/framework queries.\n- category: \"general\" | \"news\" | \"code\" | \"docs\" | \"papers\" — coarse filter, pair with include_domains.\n- from_date/to_date: ISO YYYY-MM-DD for time-bounded queries\n- max_results: default 5; use 3 for focused, 10+ for research\n- format: omit for default evidence shape. 'answer'/'stream_answer' = sampling synthesis (falls back to evidence). Retired values 'full'/'context'/'highlights' reject with a migration error.\n- max_tokens_out: token-budget cap on total output (cl100k-base; wins over max_chars).\n- include_full_markdown: true to restore full markdown body alongside evidence (default false).\n- citation_format: 'numbered' (default) | 'json' | 'anthropic_tags'.\n- max_content_chars: smart-truncate per-page markdown at paragraph boundary (e.g., 3000)\n- force_refresh: true to bypass all caches\n- mode: 'cache' | 'default' (default) | 'stealth'. cache=single-engine, no rerank, 24h-stale cache. stealth=multi-query expansion + full-body top-K.\n\nQuote [N] or {citation_id} from the evidence list.";
|
|
23
|
+
readonly crawl: "Crawl a website starting from a URL and return content from multiple pages. Use for indexing documentation sites, wikis, or any multi-page resource.\n\nKey parameters:\n- strategy: \"bfs\" (breadth-first, default), \"dfs\" (depth-first), \"sitemap\" (use sitemap.xml -- fastest for doc sites), \"map\" (URL discovery only, no content -- fastest for scoping a site)\n- max_depth: how many links deep to follow (default 2)\n- max_pages: maximum pages to fetch (default 20)\n- include_patterns/exclude_patterns: regex filters on URLs\n- max_tokens_out: token-budget cap on total output (cl100k-base; wins over max_chars).\n- include_full_markdown: default false — pages return evidence excerpts; set true for full bodies.\n- citation_format: 'numbered' (default) | 'json' | 'anthropic_tags'.\n\nReturns an array of pages with title, evidence, and depth. Content is deduplicated across pages. All pages are cached for later cache queries.";
|
|
24
|
+
readonly cache: "Search previously fetched content without hitting the network. Use before searching the web -- if relevant content was already fetched or crawled, this returns it instantly.\n\nKey parameters:\n- query: full-text search over cached markdown and titles (supports AND, OR, NOT, \"phrase match\")\n- url_pattern: glob filter on URLs (e.g., \"*example.com*\")\n- since: ISO date -- only results cached after this date\n- stats: true to get cache size, entry count, oldest/newest dates\n- clear: true to delete matching entries\n\nReturns matching cached pages with full markdown content. Cache persists across sessions locally.";
|
|
25
|
+
readonly extract: "Extract structured data from a URL or raw HTML. Use when you need specific data points, tables, or metadata rather than full page markdown.\n\nKey parameters:\n- mode: \"selector\" (CSS selector -> text), \"tables\" (HTML tables only), \"metadata\" (title/author/date/description/og_* + JSON-LD), \"schema\" (JSON Schema -> heuristic field extraction), \"structured\" (ONE-SHOT: tables + <dl> definitions + JSON-LD + chart hints from SVG/figure + microdata/data-attr/grid key-value pairs)\n- css_selector: required for mode=\"selector\" -- any valid CSS selector\n- schema: for mode=\"schema\", a JSON Schema object describing the fields to extract\n- multiple: true to return array of all matches (mode=\"selector\" only)\n\nPrefer mode=\"structured\" over chaining multiple extract calls — it returns every structured pattern on the page in one response:\n { tables, definitions, jsonld, chart_hints, key_value_pairs }\n\nchart_hints surfaces SVG titles, aria-labels, and figcaptions — host LLMs use these to describe data visualizations even when the underlying data is rendered by JavaScript.\n\nFor mode=\"tables\", returns array of table objects with headers and row data. For mode=\"schema\", pass { price: \"string\", name: \"string\" } and get structured fields extracted from the page.";
|
|
26
|
+
readonly find_similar: "Find content related to a URL or concept. Use when you have a known-good page or topic and want to discover similar resources from the cache or web.\n\nKey parameters:\n- url: a URL to find content similar to. The page's content and embeddings are used for similarity matching.\n- concept: free-text description of what you want similar content for. Use when you do not have a specific URL.\n- max_results: number of similar items to return (default 5)\n- include_cached: true (default) to search the local cache first, false to skip cache and search the web only\n- threshold: minimum similarity score (0-1, default 0.5)\n- max_tokens_out: token-budget cap on total output (cl100k-base; wins over max_chars).\n- include_full_markdown: default false — results return evidence excerpts; set true for full bodies.\n- citation_format: 'numbered' (default) | 'json' | 'anthropic_tags'.\n\nProvide either url or concept. Results fuse three signals via 3-way RRF: keyword match, semantic embeddings, and (if local hits sparse) live web search. Each result carries `match_signals` with `embedding_rank`, `fts5_rank`, and `fused_score`.\n\nThe response may include a `cold_start` string when local signals are weak. Pass this verbatim to the user.\n\nReturns results array, method used (\"hybrid\" | \"embedding\" | \"fts5\" | \"search\"), cache_hits, search_hits, embedding_available, and total_time_ms.";
|
|
27
|
+
readonly research: "Run multi-step research on a complex question. Decomposes the question into sub-queries, searches in parallel, fetches top sources, and synthesizes a report with citations.\n\nKey parameters:\n- question: the research question to investigate\n- depth: \"quick\" (~15s, 2 sub-queries, 5-8 sources), \"standard\" (~40s, 4 sub-queries, 10-15 sources, default), \"comprehensive\" (~80s, 7 sub-queries, 20-25 sources)\n- max_sources: override the default source count for the chosen depth\n- include_domains/exclude_domains: scope research to specific sites\n- schema: optional JSON Schema -- structures the report to extract matching fields\n- stream: true to receive progress notifications as each phase completes\n- max_tokens_out: token-budget cap on total output (cl100k-base; wins over max_chars).\n- include_full_markdown: default false — sources return evidence excerpts; set true for full bodies.\n- citation_format: 'numbered' (default) | 'json' | 'anthropic_tags'.\n\nReturns report (markdown with [N] citations), citations array, sources, sub_queries, depth, total_time_ms, sampling_supported, and brief (topics, highlights, key_findings, sections.overview/comparison/gaps).";
|
|
28
|
+
readonly agent: "Execute a natural-language data gathering task. Plans search queries and URLs from a prompt, executes them in parallel, and synthesizes results. Full step transparency.\n\nKey parameters:\n- prompt: natural-language description of what data to gather (e.g., \"find pricing for the top 5 CRM tools\")\n- urls: optional array of specific URLs to include in the gathering\n- schema: optional JSON Schema -- if provided, extracts structured data matching the schema from each page and merges results\n- max_pages: maximum pages to fetch (default 10)\n- max_time_ms: maximum execution time in milliseconds (default 60000)\n- stream: true to receive progress notifications as each step completes\n- max_tokens_out: token-budget cap on total output (cl100k-base; wins over max_chars).\n- include_full_markdown: default false — pages return evidence excerpts; set true for full bodies.\n- citation_format: 'numbered' (default) | 'json' | 'anthropic_tags'.\n\nPipeline: (1) plan, (2) execute search+fetch in parallel within budget, (3) optional schema extraction, (4) synthesize. The steps array exposes every action with timing.\n\nUses MCP requestSampling for planning and synthesis. Without sampling support, uses keyword extraction.\n\nReturns result, sources array, pages_fetched count, steps array, total_time_ms, sampling_supported.";
|
|
29
|
+
};
|
|
30
|
+
export type ToolName = keyof typeof TOOL_DESCRIPTIONS;
|
|
31
|
+
//# sourceMappingURL=instructions.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"instructions.d.ts","sourceRoot":"","sources":["../src/instructions.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;;;;;GAeG;AAOH,eAAO,MAAM,mBAAmB,41EA6BwF,CAAC;AAIzH,eAAO,MAAM,wBAAwB,k3NAuF0E,CAAC;AAEhH,eAAO,MAAM,eAAe,wBAAwB,CAAC;AAErD,eAAO,MAAM,iBAAiB;;;;;;;;;CA6HpB,CAAC;AAEX,MAAM,MAAM,QAAQ,GAAG,MAAM,OAAO,iBAAiB,CAAC"}
|