@staticn0va/wigolo 0.1.0 → 0.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +1 -1
- package/README.md +195 -73
- package/SKILL.md +382 -0
- package/assets/blocks/claude-code/CLAUDE.md.block +20 -0
- package/assets/blocks/claude-code/wigolo-command.md +40 -0
- package/assets/blocks/cursor/wigolo.mdc +46 -0
- package/assets/blocks/gemini-cli/GEMINI.md.block +18 -0
- package/assets/blocks/vscode/copilot-instructions.md.block +18 -0
- package/assets/skills/wigolo/SKILL.md +50 -0
- package/assets/skills/wigolo/rules/cache-first.md +30 -0
- package/assets/skills/wigolo/rules/synthesis.md +43 -0
- package/assets/skills/wigolo-agent/SKILL.md +73 -0
- package/assets/skills/wigolo-crawl/SKILL.md +60 -0
- package/assets/skills/wigolo-extract/SKILL.md +59 -0
- package/assets/skills/wigolo-fetch/SKILL.md +65 -0
- package/assets/skills/wigolo-find-similar/SKILL.md +72 -0
- package/assets/skills/wigolo-research/SKILL.md +77 -0
- package/assets/skills/wigolo-search/SKILL.md +78 -0
- package/dist/agent/executor.d.ts +33 -0
- package/dist/agent/executor.d.ts.map +1 -0
- package/dist/agent/executor.js +233 -0
- package/dist/agent/executor.js.map +1 -0
- package/dist/agent/pipeline.d.ts +5 -0
- package/dist/agent/pipeline.d.ts.map +1 -0
- package/dist/agent/pipeline.js +208 -0
- package/dist/agent/pipeline.js.map +1 -0
- package/dist/agent/planner.d.ts +13 -0
- package/dist/agent/planner.d.ts.map +1 -0
- package/dist/agent/planner.js +271 -0
- package/dist/agent/planner.js.map +1 -0
- package/dist/agent/relevance.d.ts +15 -0
- package/dist/agent/relevance.d.ts.map +1 -0
- package/dist/agent/relevance.js +60 -0
- package/dist/agent/relevance.js.map +1 -0
- package/dist/cache/backfill-embeddings.d.ts +23 -0
- package/dist/cache/backfill-embeddings.d.ts.map +1 -0
- package/dist/cache/backfill-embeddings.js +105 -0
- package/dist/cache/backfill-embeddings.js.map +1 -0
- package/dist/cache/change-detector.d.ts +7 -0
- package/dist/cache/change-detector.d.ts.map +1 -0
- package/dist/cache/change-detector.js +43 -0
- package/dist/cache/change-detector.js.map +1 -0
- package/dist/cache/db.d.ts +1 -0
- package/dist/cache/db.d.ts.map +1 -1
- package/dist/cache/db.js +94 -22
- package/dist/cache/db.js.map +1 -1
- package/dist/cache/diff-summary.d.ts +2 -0
- package/dist/cache/diff-summary.d.ts.map +1 -0
- package/dist/cache/diff-summary.js +82 -0
- package/dist/cache/diff-summary.js.map +1 -0
- package/dist/cache/migrations/runner.d.ts +29 -0
- package/dist/cache/migrations/runner.d.ts.map +1 -0
- package/dist/cache/migrations/runner.js +147 -0
- package/dist/cache/migrations/runner.js.map +1 -0
- package/dist/cache/sqlite-vec-store.d.ts +42 -0
- package/dist/cache/sqlite-vec-store.d.ts.map +1 -0
- package/dist/cache/sqlite-vec-store.js +176 -0
- package/dist/cache/sqlite-vec-store.js.map +1 -0
- package/dist/cache/store.d.ts +46 -1
- package/dist/cache/store.d.ts.map +1 -1
- package/dist/cache/store.js +362 -168
- package/dist/cache/store.js.map +1 -1
- package/dist/cli/agents/antigravity.d.ts +20 -0
- package/dist/cli/agents/antigravity.d.ts.map +1 -0
- package/dist/cli/agents/antigravity.js +49 -0
- package/dist/cli/agents/antigravity.js.map +1 -0
- package/dist/cli/agents/claude-code.d.ts +25 -0
- package/dist/cli/agents/claude-code.d.ts.map +1 -0
- package/dist/cli/agents/claude-code.js +111 -0
- package/dist/cli/agents/claude-code.js.map +1 -0
- package/dist/cli/agents/cursor.d.ts +21 -0
- package/dist/cli/agents/cursor.d.ts.map +1 -0
- package/dist/cli/agents/cursor.js +58 -0
- package/dist/cli/agents/cursor.js.map +1 -0
- package/dist/cli/agents/gemini-cli.d.ts +21 -0
- package/dist/cli/agents/gemini-cli.d.ts.map +1 -0
- package/dist/cli/agents/gemini-cli.js +55 -0
- package/dist/cli/agents/gemini-cli.js.map +1 -0
- package/dist/cli/agents/registry.d.ts +21 -0
- package/dist/cli/agents/registry.d.ts.map +1 -0
- package/dist/cli/agents/registry.js +27 -0
- package/dist/cli/agents/registry.js.map +1 -0
- package/dist/cli/agents/utils.d.ts +26 -0
- package/dist/cli/agents/utils.d.ts.map +1 -0
- package/dist/cli/agents/utils.js +136 -0
- package/dist/cli/agents/utils.js.map +1 -0
- package/dist/cli/agents/vscode.d.ts +21 -0
- package/dist/cli/agents/vscode.d.ts.map +1 -0
- package/dist/cli/agents/vscode.js +62 -0
- package/dist/cli/agents/vscode.js.map +1 -0
- package/dist/cli/auth.d.ts +2 -0
- package/dist/cli/auth.d.ts.map +1 -0
- package/dist/cli/auth.js +94 -0
- package/dist/cli/auth.js.map +1 -0
- package/dist/cli/backfill.d.ts +2 -0
- package/dist/cli/backfill.d.ts.map +1 -0
- package/dist/cli/backfill.js +58 -0
- package/dist/cli/backfill.js.map +1 -0
- package/dist/cli/daemon.d.ts +6 -1
- package/dist/cli/daemon.d.ts.map +1 -1
- package/dist/cli/daemon.js +61 -3
- package/dist/cli/daemon.js.map +1 -1
- package/dist/cli/doctor.d.ts +8 -0
- package/dist/cli/doctor.d.ts.map +1 -0
- package/dist/cli/doctor.js +318 -0
- package/dist/cli/doctor.js.map +1 -0
- package/dist/cli/health.d.ts +1 -1
- package/dist/cli/health.d.ts.map +1 -1
- package/dist/cli/health.js +42 -3
- package/dist/cli/health.js.map +1 -1
- package/dist/cli/help.d.ts +6 -0
- package/dist/cli/help.d.ts.map +1 -0
- package/dist/cli/help.js +63 -0
- package/dist/cli/help.js.map +1 -0
- package/dist/cli/index.d.ts +1 -1
- package/dist/cli/index.d.ts.map +1 -1
- package/dist/cli/index.js +35 -7
- package/dist/cli/index.js.map +1 -1
- package/dist/cli/init.d.ts +2 -0
- package/dist/cli/init.d.ts.map +1 -0
- package/dist/cli/init.js +201 -0
- package/dist/cli/init.js.map +1 -0
- package/dist/cli/plugin.d.ts +5 -0
- package/dist/cli/plugin.d.ts.map +1 -0
- package/dist/cli/plugin.js +185 -0
- package/dist/cli/plugin.js.map +1 -0
- package/dist/cli/setup-mcp.d.ts +2 -0
- package/dist/cli/setup-mcp.d.ts.map +1 -0
- package/dist/cli/setup-mcp.js +114 -0
- package/dist/cli/setup-mcp.js.map +1 -0
- package/dist/cli/shell.d.ts +2 -0
- package/dist/cli/shell.d.ts.map +1 -0
- package/dist/cli/shell.js +86 -0
- package/dist/cli/shell.js.map +1 -0
- package/dist/cli/status.d.ts +2 -0
- package/dist/cli/status.d.ts.map +1 -0
- package/dist/cli/status.js +31 -0
- package/dist/cli/status.js.map +1 -0
- package/dist/cli/telemetry.d.ts +10 -0
- package/dist/cli/telemetry.d.ts.map +1 -0
- package/dist/cli/telemetry.js +56 -0
- package/dist/cli/telemetry.js.map +1 -0
- package/dist/cli/tui/agents-types.d.ts +28 -0
- package/dist/cli/tui/agents-types.d.ts.map +1 -0
- package/dist/cli/tui/agents-types.js +1 -0
- package/dist/cli/tui/agents-types.js.map +1 -0
- package/dist/cli/tui/agents.d.ts +11 -0
- package/dist/cli/tui/agents.d.ts.map +1 -0
- package/dist/cli/tui/agents.js +93 -0
- package/dist/cli/tui/agents.js.map +1 -0
- package/dist/cli/tui/banner.d.ts +3 -0
- package/dist/cli/tui/banner.d.ts.map +1 -0
- package/dist/cli/tui/banner.js +30 -0
- package/dist/cli/tui/banner.js.map +1 -0
- package/dist/cli/tui/components/AgentSelect.d.ts +13 -0
- package/dist/cli/tui/components/AgentSelect.d.ts.map +1 -0
- package/dist/cli/tui/components/AgentSelect.js +116 -0
- package/dist/cli/tui/components/AgentSelect.js.map +1 -0
- package/dist/cli/tui/components/Banner.d.ts +6 -0
- package/dist/cli/tui/components/Banner.d.ts.map +1 -0
- package/dist/cli/tui/components/Banner.js +25 -0
- package/dist/cli/tui/components/Banner.js.map +1 -0
- package/dist/cli/tui/components/BrowserSelect.d.ts +7 -0
- package/dist/cli/tui/components/BrowserSelect.d.ts.map +1 -0
- package/dist/cli/tui/components/BrowserSelect.js +19 -0
- package/dist/cli/tui/components/BrowserSelect.js.map +1 -0
- package/dist/cli/tui/components/InstallProgress.d.ts +9 -0
- package/dist/cli/tui/components/InstallProgress.d.ts.map +1 -0
- package/dist/cli/tui/components/InstallProgress.js +67 -0
- package/dist/cli/tui/components/InstallProgress.js.map +1 -0
- package/dist/cli/tui/components/SkillInstall.d.ts +14 -0
- package/dist/cli/tui/components/SkillInstall.d.ts.map +1 -0
- package/dist/cli/tui/components/SkillInstall.js +94 -0
- package/dist/cli/tui/components/SkillInstall.js.map +1 -0
- package/dist/cli/tui/components/Summary.d.ts +22 -0
- package/dist/cli/tui/components/Summary.d.ts.map +1 -0
- package/dist/cli/tui/components/Summary.js +135 -0
- package/dist/cli/tui/components/Summary.js.map +1 -0
- package/dist/cli/tui/components/SystemCheck.d.ts +8 -0
- package/dist/cli/tui/components/SystemCheck.d.ts.map +1 -0
- package/dist/cli/tui/components/SystemCheck.js +71 -0
- package/dist/cli/tui/components/SystemCheck.js.map +1 -0
- package/dist/cli/tui/components/Verification.d.ts +8 -0
- package/dist/cli/tui/components/Verification.d.ts.map +1 -0
- package/dist/cli/tui/components/Verification.js +63 -0
- package/dist/cli/tui/components/Verification.js.map +1 -0
- package/dist/cli/tui/config-writer-cli.d.ts +12 -0
- package/dist/cli/tui/config-writer-cli.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-cli.js +39 -0
- package/dist/cli/tui/config-writer-cli.js.map +1 -0
- package/dist/cli/tui/config-writer-json.d.ts +16 -0
- package/dist/cli/tui/config-writer-json.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-json.js +86 -0
- package/dist/cli/tui/config-writer-json.js.map +1 -0
- package/dist/cli/tui/config-writer-toml.d.ts +16 -0
- package/dist/cli/tui/config-writer-toml.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-toml.js +83 -0
- package/dist/cli/tui/config-writer-toml.js.map +1 -0
- package/dist/cli/tui/config-writer.d.ts +25 -0
- package/dist/cli/tui/config-writer.d.ts.map +1 -0
- package/dist/cli/tui/config-writer.js +101 -0
- package/dist/cli/tui/config-writer.js.map +1 -0
- package/dist/cli/tui/detect-helpers.d.ts +6 -0
- package/dist/cli/tui/detect-helpers.d.ts.map +1 -0
- package/dist/cli/tui/detect-helpers.js +45 -0
- package/dist/cli/tui/detect-helpers.js.map +1 -0
- package/dist/cli/tui/extras-prompt.d.ts +7 -0
- package/dist/cli/tui/extras-prompt.d.ts.map +1 -0
- package/dist/cli/tui/extras-prompt.js +42 -0
- package/dist/cli/tui/extras-prompt.js.map +1 -0
- package/dist/cli/tui/flags-types.d.ts +19 -0
- package/dist/cli/tui/flags-types.d.ts.map +1 -0
- package/dist/cli/tui/flags-types.js +23 -0
- package/dist/cli/tui/flags-types.js.map +1 -0
- package/dist/cli/tui/flags.d.ts +5 -0
- package/dist/cli/tui/flags.d.ts.map +1 -0
- package/dist/cli/tui/flags.js +132 -0
- package/dist/cli/tui/flags.js.map +1 -0
- package/dist/cli/tui/format.d.ts +14 -0
- package/dist/cli/tui/format.d.ts.map +1 -0
- package/dist/cli/tui/format.js +37 -0
- package/dist/cli/tui/format.js.map +1 -0
- package/dist/cli/tui/hooks/useAgentDetect.d.ts +6 -0
- package/dist/cli/tui/hooks/useAgentDetect.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useAgentDetect.js +19 -0
- package/dist/cli/tui/hooks/useAgentDetect.js.map +1 -0
- package/dist/cli/tui/hooks/useInstall.d.ts +14 -0
- package/dist/cli/tui/hooks/useInstall.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useInstall.js +90 -0
- package/dist/cli/tui/hooks/useInstall.js.map +1 -0
- package/dist/cli/tui/hooks/useSystemCheck.d.ts +13 -0
- package/dist/cli/tui/hooks/useSystemCheck.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useSystemCheck.js +95 -0
- package/dist/cli/tui/hooks/useSystemCheck.js.map +1 -0
- package/dist/cli/tui/hooks/useVerify.d.ts +14 -0
- package/dist/cli/tui/hooks/useVerify.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useVerify.js +71 -0
- package/dist/cli/tui/hooks/useVerify.js.map +1 -0
- package/dist/cli/tui/ink-init.d.ts +2 -0
- package/dist/cli/tui/ink-init.d.ts.map +1 -0
- package/dist/cli/tui/ink-init.js +198 -0
- package/dist/cli/tui/ink-init.js.map +1 -0
- package/dist/cli/tui/reporter-auto.d.ts +7 -0
- package/dist/cli/tui/reporter-auto.d.ts.map +1 -0
- package/dist/cli/tui/reporter-auto.js +15 -0
- package/dist/cli/tui/reporter-auto.js.map +1 -0
- package/dist/cli/tui/reporter.d.ts +26 -0
- package/dist/cli/tui/reporter.d.ts.map +1 -0
- package/dist/cli/tui/reporter.js +32 -0
- package/dist/cli/tui/reporter.js.map +1 -0
- package/dist/cli/tui/run-command.d.ts +14 -0
- package/dist/cli/tui/run-command.d.ts.map +1 -0
- package/dist/cli/tui/run-command.js +72 -0
- package/dist/cli/tui/run-command.js.map +1 -0
- package/dist/cli/tui/select-agents.d.ts +6 -0
- package/dist/cli/tui/select-agents.d.ts.map +1 -0
- package/dist/cli/tui/select-agents.js +32 -0
- package/dist/cli/tui/select-agents.js.map +1 -0
- package/dist/cli/tui/status-agents.d.ts +11 -0
- package/dist/cli/tui/status-agents.d.ts.map +1 -0
- package/dist/cli/tui/status-agents.js +53 -0
- package/dist/cli/tui/status-agents.js.map +1 -0
- package/dist/cli/tui/status-cache.d.ts +6 -0
- package/dist/cli/tui/status-cache.d.ts.map +1 -0
- package/dist/cli/tui/status-cache.js +39 -0
- package/dist/cli/tui/status-cache.js.map +1 -0
- package/dist/cli/tui/status-format.d.ts +14 -0
- package/dist/cli/tui/status-format.d.ts.map +1 -0
- package/dist/cli/tui/status-format.js +41 -0
- package/dist/cli/tui/status-format.js.map +1 -0
- package/dist/cli/tui/status-python.d.ts +6 -0
- package/dist/cli/tui/status-python.d.ts.map +1 -0
- package/dist/cli/tui/status-python.js +30 -0
- package/dist/cli/tui/status-python.js.map +1 -0
- package/dist/cli/tui/system-check.d.ts +24 -0
- package/dist/cli/tui/system-check.d.ts.map +1 -0
- package/dist/cli/tui/system-check.js +103 -0
- package/dist/cli/tui/system-check.js.map +1 -0
- package/dist/cli/tui/tui-reporter.d.ts +19 -0
- package/dist/cli/tui/tui-reporter.d.ts.map +1 -0
- package/dist/cli/tui/tui-reporter.js +95 -0
- package/dist/cli/tui/tui-reporter.js.map +1 -0
- package/dist/cli/tui/utils/config-writer.d.ts +3 -0
- package/dist/cli/tui/utils/config-writer.d.ts.map +1 -0
- package/dist/cli/tui/utils/config-writer.js +22 -0
- package/dist/cli/tui/utils/config-writer.js.map +1 -0
- package/dist/cli/tui/utils/suppress-logs.d.ts +3 -0
- package/dist/cli/tui/utils/suppress-logs.d.ts.map +1 -0
- package/dist/cli/tui/utils/suppress-logs.js +11 -0
- package/dist/cli/tui/utils/suppress-logs.js.map +1 -0
- package/dist/cli/tui/verify-suggestions.d.ts +5 -0
- package/dist/cli/tui/verify-suggestions.d.ts.map +1 -0
- package/dist/cli/tui/verify-suggestions.js +20 -0
- package/dist/cli/tui/verify-suggestions.js.map +1 -0
- package/dist/cli/tui/verify.d.ts +14 -0
- package/dist/cli/tui/verify.d.ts.map +1 -0
- package/dist/cli/tui/verify.js +101 -0
- package/dist/cli/tui/verify.js.map +1 -0
- package/dist/cli/tui/version.d.ts +2 -0
- package/dist/cli/tui/version.d.ts.map +1 -0
- package/dist/cli/tui/version.js +14 -0
- package/dist/cli/tui/version.js.map +1 -0
- package/dist/cli/uninstall.d.ts +2 -0
- package/dist/cli/uninstall.d.ts.map +1 -0
- package/dist/cli/uninstall.js +57 -0
- package/dist/cli/uninstall.js.map +1 -0
- package/dist/cli/warmup.d.ts +10 -2
- package/dist/cli/warmup.d.ts.map +1 -1
- package/dist/cli/warmup.js +226 -93
- package/dist/cli/warmup.js.map +1 -1
- package/dist/config.d.ts +28 -2
- package/dist/config.d.ts.map +1 -1
- package/dist/config.js +106 -56
- package/dist/config.js.map +1 -1
- package/dist/crawl/crawler.d.ts +6 -0
- package/dist/crawl/crawler.d.ts.map +1 -1
- package/dist/crawl/crawler.js +210 -209
- package/dist/crawl/crawler.js.map +1 -1
- package/dist/crawl/dedup.d.ts +1 -0
- package/dist/crawl/dedup.d.ts.map +1 -1
- package/dist/crawl/dedup.js +124 -81
- package/dist/crawl/dedup.js.map +1 -1
- package/dist/crawl/etag-incremental.d.ts +43 -0
- package/dist/crawl/etag-incremental.d.ts.map +1 -0
- package/dist/crawl/etag-incremental.js +94 -0
- package/dist/crawl/etag-incremental.js.map +1 -0
- package/dist/crawl/index-to-vec.d.ts +10 -0
- package/dist/crawl/index-to-vec.d.ts.map +1 -0
- package/dist/crawl/index-to-vec.js +44 -0
- package/dist/crawl/index-to-vec.js.map +1 -0
- package/dist/crawl/mapper.js +136 -164
- package/dist/crawl/mapper.js.map +1 -1
- package/dist/crawl/rate-limiter.js +63 -66
- package/dist/crawl/rate-limiter.js.map +1 -1
- package/dist/crawl/robots.js +58 -57
- package/dist/crawl/robots.js.map +1 -1
- package/dist/crawl/sitemap-first.d.ts +12 -0
- package/dist/crawl/sitemap-first.d.ts.map +1 -0
- package/dist/crawl/sitemap-first.js +47 -0
- package/dist/crawl/sitemap-first.js.map +1 -0
- package/dist/crawl/sitemap.js +33 -32
- package/dist/crawl/sitemap.js.map +1 -1
- package/dist/crawl/url-utils.d.ts +1 -0
- package/dist/crawl/url-utils.d.ts.map +1 -1
- package/dist/crawl/url-utils.js +49 -37
- package/dist/crawl/url-utils.js.map +1 -1
- package/dist/daemon/health-check.d.ts +16 -0
- package/dist/daemon/health-check.d.ts.map +1 -0
- package/dist/daemon/health-check.js +33 -0
- package/dist/daemon/health-check.js.map +1 -0
- package/dist/daemon/http-server.d.ts +26 -0
- package/dist/daemon/http-server.d.ts.map +1 -0
- package/dist/daemon/http-server.js +275 -0
- package/dist/daemon/http-server.js.map +1 -0
- package/dist/daemon/proxy.d.ts +10 -0
- package/dist/daemon/proxy.d.ts.map +1 -0
- package/dist/daemon/proxy.js +93 -0
- package/dist/daemon/proxy.js.map +1 -0
- package/dist/embedding/embed.d.ts +59 -0
- package/dist/embedding/embed.d.ts.map +1 -0
- package/dist/embedding/embed.js +233 -0
- package/dist/embedding/embed.js.map +1 -0
- package/dist/embedding/fastembed-provider.d.ts +19 -0
- package/dist/embedding/fastembed-provider.d.ts.map +1 -0
- package/dist/embedding/fastembed-provider.js +51 -0
- package/dist/embedding/fastembed-provider.js.map +1 -0
- package/dist/embedding/key-terms.d.ts +12 -0
- package/dist/embedding/key-terms.d.ts.map +1 -0
- package/dist/embedding/key-terms.js +234 -0
- package/dist/embedding/key-terms.js.map +1 -0
- package/dist/extraction/boilerplate.d.ts +15 -0
- package/dist/extraction/boilerplate.d.ts.map +1 -0
- package/dist/extraction/boilerplate.js +52 -0
- package/dist/extraction/boilerplate.js.map +1 -0
- package/dist/extraction/defuddle.d.ts.map +1 -1
- package/dist/extraction/defuddle.js +27 -23
- package/dist/extraction/defuddle.js.map +1 -1
- package/dist/extraction/extract.d.ts.map +1 -1
- package/dist/extraction/extract.js +76 -76
- package/dist/extraction/extract.js.map +1 -1
- package/dist/extraction/jsonld.js +50 -54
- package/dist/extraction/jsonld.js.map +1 -1
- package/dist/extraction/lang-hints.d.ts +2 -0
- package/dist/extraction/lang-hints.d.ts.map +1 -0
- package/dist/extraction/lang-hints.js +30 -0
- package/dist/extraction/lang-hints.js.map +1 -0
- package/dist/extraction/llm-fallback.d.ts +17 -0
- package/dist/extraction/llm-fallback.d.ts.map +1 -0
- package/dist/extraction/llm-fallback.js +130 -0
- package/dist/extraction/llm-fallback.js.map +1 -0
- package/dist/extraction/markdown-sanitize.d.ts +2 -0
- package/dist/extraction/markdown-sanitize.d.ts.map +1 -0
- package/dist/extraction/markdown-sanitize.js +151 -0
- package/dist/extraction/markdown-sanitize.js.map +1 -0
- package/dist/extraction/markdown.d.ts +11 -0
- package/dist/extraction/markdown.d.ts.map +1 -1
- package/dist/extraction/markdown.js +195 -91
- package/dist/extraction/markdown.js.map +1 -1
- package/dist/extraction/pipeline.d.ts +8 -0
- package/dist/extraction/pipeline.d.ts.map +1 -1
- package/dist/extraction/pipeline.js +57 -91
- package/dist/extraction/pipeline.js.map +1 -1
- package/dist/extraction/readability.d.ts +1 -1
- package/dist/extraction/readability.d.ts.map +1 -1
- package/dist/extraction/readability.js +28 -29
- package/dist/extraction/readability.js.map +1 -1
- package/dist/extraction/schema.d.ts +12 -0
- package/dist/extraction/schema.d.ts.map +1 -1
- package/dist/extraction/schema.js +135 -72
- package/dist/extraction/schema.js.map +1 -1
- package/dist/extraction/site-extractors/docs-generic.d.ts.map +1 -1
- package/dist/extraction/site-extractors/docs-generic.js +81 -91
- package/dist/extraction/site-extractors/docs-generic.js.map +1 -1
- package/dist/extraction/site-extractors/github.d.ts.map +1 -1
- package/dist/extraction/site-extractors/github.js +87 -95
- package/dist/extraction/site-extractors/github.js.map +1 -1
- package/dist/extraction/site-extractors/mdn.d.ts.map +1 -1
- package/dist/extraction/site-extractors/mdn.js +46 -54
- package/dist/extraction/site-extractors/mdn.js.map +1 -1
- package/dist/extraction/site-extractors/stackoverflow.d.ts.map +1 -1
- package/dist/extraction/site-extractors/stackoverflow.js +71 -80
- package/dist/extraction/site-extractors/stackoverflow.js.map +1 -1
- package/dist/extraction/structured-data.d.ts +4 -0
- package/dist/extraction/structured-data.d.ts.map +1 -0
- package/dist/extraction/structured-data.js +173 -0
- package/dist/extraction/structured-data.js.map +1 -0
- package/dist/extraction/structured.d.ts +4 -0
- package/dist/extraction/structured.d.ts.map +1 -0
- package/dist/extraction/structured.js +163 -0
- package/dist/extraction/structured.js.map +1 -0
- package/dist/extraction/v1/classifier.d.ts +3 -0
- package/dist/extraction/v1/classifier.d.ts.map +1 -0
- package/dist/extraction/v1/classifier.js +110 -0
- package/dist/extraction/v1/classifier.js.map +1 -0
- package/dist/extraction/v1/extract-provider.d.ts +16 -0
- package/dist/extraction/v1/extract-provider.d.ts.map +1 -0
- package/dist/extraction/v1/extract-provider.js +43 -0
- package/dist/extraction/v1/extract-provider.js.map +1 -0
- package/dist/extraction/v1/local-llm.d.ts +8 -0
- package/dist/extraction/v1/local-llm.d.ts.map +1 -0
- package/dist/extraction/v1/local-llm.js +58 -0
- package/dist/extraction/v1/local-llm.js.map +1 -0
- package/dist/extraction/v1/news.d.ts +3 -0
- package/dist/extraction/v1/news.d.ts.map +1 -0
- package/dist/extraction/v1/news.js +61 -0
- package/dist/extraction/v1/news.js.map +1 -0
- package/dist/extraction/v1/product.d.ts +3 -0
- package/dist/extraction/v1/product.d.ts.map +1 -0
- package/dist/extraction/v1/product.js +166 -0
- package/dist/extraction/v1/product.js.map +1 -0
- package/dist/extraction/v1/recipe.d.ts +3 -0
- package/dist/extraction/v1/recipe.d.ts.map +1 -0
- package/dist/extraction/v1/recipe.js +136 -0
- package/dist/extraction/v1/recipe.js.map +1 -0
- package/dist/extraction/v1/routed.d.ts +17 -0
- package/dist/extraction/v1/routed.d.ts.map +1 -0
- package/dist/extraction/v1/routed.js +68 -0
- package/dist/extraction/v1/routed.js.map +1 -0
- package/dist/extraction/v1/schemas/Article.d.ts +11 -0
- package/dist/extraction/v1/schemas/Article.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Article.js +23 -0
- package/dist/extraction/v1/schemas/Article.js.map +1 -0
- package/dist/extraction/v1/schemas/CodeSnippet.d.ts +9 -0
- package/dist/extraction/v1/schemas/CodeSnippet.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/CodeSnippet.js +90 -0
- package/dist/extraction/v1/schemas/CodeSnippet.js.map +1 -0
- package/dist/extraction/v1/schemas/EventListing.d.ts +10 -0
- package/dist/extraction/v1/schemas/EventListing.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/EventListing.js +122 -0
- package/dist/extraction/v1/schemas/EventListing.js.map +1 -0
- package/dist/extraction/v1/schemas/Paper.d.ts +10 -0
- package/dist/extraction/v1/schemas/Paper.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Paper.js +156 -0
- package/dist/extraction/v1/schemas/Paper.js.map +1 -0
- package/dist/extraction/v1/schemas/Product.d.ts +17 -0
- package/dist/extraction/v1/schemas/Product.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Product.js +149 -0
- package/dist/extraction/v1/schemas/Product.js.map +1 -0
- package/dist/extraction/v1/schemas/Recipe.d.ts +14 -0
- package/dist/extraction/v1/schemas/Recipe.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Recipe.js +160 -0
- package/dist/extraction/v1/schemas/Recipe.js.map +1 -0
- package/dist/extraction/v1/schemas/index.d.ts +13 -0
- package/dist/extraction/v1/schemas/index.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/index.js +44 -0
- package/dist/extraction/v1/schemas/index.js.map +1 -0
- package/dist/extraction/v1/site-extractors.d.ts +5 -0
- package/dist/extraction/v1/site-extractors.d.ts.map +1 -0
- package/dist/extraction/v1/site-extractors.js +31 -0
- package/dist/extraction/v1/site-extractors.js.map +1 -0
- package/dist/fetch/action-executor.d.ts +28 -0
- package/dist/fetch/action-executor.d.ts.map +1 -0
- package/dist/fetch/action-executor.js +88 -0
- package/dist/fetch/action-executor.js.map +1 -0
- package/dist/fetch/auth.d.ts +2 -1
- package/dist/fetch/auth.d.ts.map +1 -1
- package/dist/fetch/auth.js +56 -26
- package/dist/fetch/auth.js.map +1 -1
- package/dist/fetch/browser-pool.d.ts +30 -11
- package/dist/fetch/browser-pool.d.ts.map +1 -1
- package/dist/fetch/browser-pool.js +303 -127
- package/dist/fetch/browser-pool.js.map +1 -1
- package/dist/fetch/browser-selector.d.ts +17 -0
- package/dist/fetch/browser-selector.d.ts.map +1 -0
- package/dist/fetch/browser-selector.js +72 -0
- package/dist/fetch/browser-selector.js.map +1 -0
- package/dist/fetch/browser-types.d.ts +3 -0
- package/dist/fetch/browser-types.d.ts.map +1 -0
- package/dist/fetch/browser-types.js +45 -0
- package/dist/fetch/browser-types.js.map +1 -0
- package/dist/fetch/cdp-client.d.ts +9 -0
- package/dist/fetch/cdp-client.d.ts.map +1 -0
- package/dist/fetch/cdp-client.js +89 -0
- package/dist/fetch/cdp-client.js.map +1 -0
- package/dist/fetch/content-check.js +39 -46
- package/dist/fetch/content-check.js.map +1 -1
- package/dist/fetch/http-client.d.ts +4 -0
- package/dist/fetch/http-client.d.ts.map +1 -1
- package/dist/fetch/http-client.js +147 -128
- package/dist/fetch/http-client.js.map +1 -1
- package/dist/fetch/lightpanda.d.ts +28 -0
- package/dist/fetch/lightpanda.d.ts.map +1 -0
- package/dist/fetch/lightpanda.js +174 -0
- package/dist/fetch/lightpanda.js.map +1 -0
- package/dist/fetch/playwright-tier.d.ts +19 -0
- package/dist/fetch/playwright-tier.d.ts.map +1 -0
- package/dist/fetch/playwright-tier.js +76 -0
- package/dist/fetch/playwright-tier.js.map +1 -0
- package/dist/fetch/router.d.ts +49 -3
- package/dist/fetch/router.d.ts.map +1 -1
- package/dist/fetch/router.js +185 -81
- package/dist/fetch/router.js.map +1 -1
- package/dist/index.js +97 -17
- package/dist/index.js.map +1 -1
- package/dist/instructions.d.ts +31 -0
- package/dist/instructions.d.ts.map +1 -0
- package/dist/instructions.js +245 -0
- package/dist/instructions.js.map +1 -0
- package/dist/integrations/cloud/llm/anthropic.d.ts +3 -0
- package/dist/integrations/cloud/llm/anthropic.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/anthropic.js +41 -0
- package/dist/integrations/cloud/llm/anthropic.js.map +1 -0
- package/dist/integrations/cloud/llm/cache.d.ts +5 -0
- package/dist/integrations/cloud/llm/cache.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/cache.js +49 -0
- package/dist/integrations/cloud/llm/cache.js.map +1 -0
- package/dist/integrations/cloud/llm/gemini.d.ts +3 -0
- package/dist/integrations/cloud/llm/gemini.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/gemini.js +37 -0
- package/dist/integrations/cloud/llm/gemini.js.map +1 -0
- package/dist/integrations/cloud/llm/groq.d.ts +3 -0
- package/dist/integrations/cloud/llm/groq.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/groq.js +74 -0
- package/dist/integrations/cloud/llm/groq.js.map +1 -0
- package/dist/integrations/cloud/llm/hash.d.ts +3 -0
- package/dist/integrations/cloud/llm/hash.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/hash.js +26 -0
- package/dist/integrations/cloud/llm/hash.js.map +1 -0
- package/dist/integrations/cloud/llm/openai.d.ts +3 -0
- package/dist/integrations/cloud/llm/openai.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/openai.js +43 -0
- package/dist/integrations/cloud/llm/openai.js.map +1 -0
- package/dist/integrations/cloud/llm/select.d.ts +5 -0
- package/dist/integrations/cloud/llm/select.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/select.js +30 -0
- package/dist/integrations/cloud/llm/select.js.map +1 -0
- package/dist/integrations/cloud/llm/types.d.ts +24 -0
- package/dist/integrations/cloud/llm/types.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/types.js +1 -0
- package/dist/integrations/cloud/llm/types.js.map +1 -0
- package/dist/integrations/cloud/llm/validate.d.ts +6 -0
- package/dist/integrations/cloud/llm/validate.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/validate.js +63 -0
- package/dist/integrations/cloud/llm/validate.js.map +1 -0
- package/dist/logger.d.ts +4 -1
- package/dist/logger.d.ts.map +1 -1
- package/dist/logger.js +71 -30
- package/dist/logger.js.map +1 -1
- package/dist/pdf-parse.d.js +1 -0
- package/dist/pdf-parse.d.js.map +1 -0
- package/dist/plugins/loader.d.ts +20 -0
- package/dist/plugins/loader.d.ts.map +1 -0
- package/dist/plugins/loader.js +157 -0
- package/dist/plugins/loader.js.map +1 -0
- package/dist/plugins/registry.d.ts +26 -0
- package/dist/plugins/registry.d.ts.map +1 -0
- package/dist/plugins/registry.js +71 -0
- package/dist/plugins/registry.js.map +1 -0
- package/dist/plugins/validate.d.ts +9 -0
- package/dist/plugins/validate.d.ts.map +1 -0
- package/dist/plugins/validate.js +79 -0
- package/dist/plugins/validate.js.map +1 -0
- package/dist/providers/embed-provider.d.ts +11 -0
- package/dist/providers/embed-provider.d.ts.map +1 -0
- package/dist/providers/embed-provider.js +24 -0
- package/dist/providers/embed-provider.js.map +1 -0
- package/dist/providers/extract-provider.d.ts +23 -0
- package/dist/providers/extract-provider.d.ts.map +1 -0
- package/dist/providers/extract-provider.js +25 -0
- package/dist/providers/extract-provider.js.map +1 -0
- package/dist/providers/rerank-provider.d.ts +16 -0
- package/dist/providers/rerank-provider.d.ts.map +1 -0
- package/dist/providers/rerank-provider.js +28 -0
- package/dist/providers/rerank-provider.js.map +1 -0
- package/dist/providers/search-provider.d.ts +25 -0
- package/dist/providers/search-provider.d.ts.map +1 -0
- package/dist/providers/search-provider.js +44 -0
- package/dist/providers/search-provider.js.map +1 -0
- package/dist/providers/vector-store.d.ts +27 -0
- package/dist/providers/vector-store.d.ts.map +1 -0
- package/dist/providers/vector-store.js +27 -0
- package/dist/providers/vector-store.js.map +1 -0
- package/dist/python-env.d.ts +9 -0
- package/dist/python-env.d.ts.map +1 -0
- package/dist/python-env.js +13 -0
- package/dist/python-env.js.map +1 -0
- package/dist/repl/commands/agent.d.ts +5 -0
- package/dist/repl/commands/agent.d.ts.map +1 -0
- package/dist/repl/commands/agent.js +62 -0
- package/dist/repl/commands/agent.js.map +1 -0
- package/dist/repl/commands/cache.d.ts +4 -0
- package/dist/repl/commands/cache.d.ts.map +1 -0
- package/dist/repl/commands/cache.js +43 -0
- package/dist/repl/commands/cache.js.map +1 -0
- package/dist/repl/commands/crawl.d.ts +7 -0
- package/dist/repl/commands/crawl.d.ts.map +1 -0
- package/dist/repl/commands/crawl.js +44 -0
- package/dist/repl/commands/crawl.js.map +1 -0
- package/dist/repl/commands/extract.d.ts +5 -0
- package/dist/repl/commands/extract.d.ts.map +1 -0
- package/dist/repl/commands/extract.js +47 -0
- package/dist/repl/commands/extract.js.map +1 -0
- package/dist/repl/commands/fetch.d.ts +5 -0
- package/dist/repl/commands/fetch.d.ts.map +1 -0
- package/dist/repl/commands/fetch.js +67 -0
- package/dist/repl/commands/fetch.js.map +1 -0
- package/dist/repl/commands/find-similar.d.ts +5 -0
- package/dist/repl/commands/find-similar.d.ts.map +1 -0
- package/dist/repl/commands/find-similar.js +74 -0
- package/dist/repl/commands/find-similar.js.map +1 -0
- package/dist/repl/commands/research.d.ts +5 -0
- package/dist/repl/commands/research.d.ts.map +1 -0
- package/dist/repl/commands/research.js +65 -0
- package/dist/repl/commands/research.js.map +1 -0
- package/dist/repl/commands/search.d.ts +5 -0
- package/dist/repl/commands/search.d.ts.map +1 -0
- package/dist/repl/commands/search.js +74 -0
- package/dist/repl/commands/search.js.map +1 -0
- package/dist/repl/commands/types.d.ts +9 -0
- package/dist/repl/commands/types.d.ts.map +1 -0
- package/dist/repl/commands/types.js +1 -0
- package/dist/repl/commands/types.js.map +1 -0
- package/dist/repl/formatters.d.ts +13 -0
- package/dist/repl/formatters.d.ts.map +1 -0
- package/dist/repl/formatters.js +283 -0
- package/dist/repl/formatters.js.map +1 -0
- package/dist/repl/parser.d.ts +9 -0
- package/dist/repl/parser.d.ts.map +1 -0
- package/dist/repl/parser.js +86 -0
- package/dist/repl/parser.js.map +1 -0
- package/dist/repl/shell.d.ts +8 -0
- package/dist/repl/shell.d.ts.map +1 -0
- package/dist/repl/shell.js +184 -0
- package/dist/repl/shell.js.map +1 -0
- package/dist/research/branch-exploration.d.ts +14 -0
- package/dist/research/branch-exploration.d.ts.map +1 -0
- package/dist/research/branch-exploration.js +100 -0
- package/dist/research/branch-exploration.js.map +1 -0
- package/dist/research/brief.d.ts +5 -0
- package/dist/research/brief.d.ts.map +1 -0
- package/dist/research/brief.js +242 -0
- package/dist/research/brief.js.map +1 -0
- package/dist/research/citation-graph.d.ts +9 -0
- package/dist/research/citation-graph.d.ts.map +1 -0
- package/dist/research/citation-graph.js +114 -0
- package/dist/research/citation-graph.js.map +1 -0
- package/dist/research/decompose.d.ts +14 -0
- package/dist/research/decompose.d.ts.map +1 -0
- package/dist/research/decompose.js +439 -0
- package/dist/research/decompose.js.map +1 -0
- package/dist/research/pipeline.d.ts +5 -0
- package/dist/research/pipeline.d.ts.map +1 -0
- package/dist/research/pipeline.js +269 -0
- package/dist/research/pipeline.js.map +1 -0
- package/dist/research/synthesis-local.d.ts +16 -0
- package/dist/research/synthesis-local.d.ts.map +1 -0
- package/dist/research/synthesis-local.js +73 -0
- package/dist/research/synthesis-local.js.map +1 -0
- package/dist/research/synthesize.d.ts +10 -0
- package/dist/research/synthesize.d.ts.map +1 -0
- package/dist/research/synthesize.js +137 -0
- package/dist/research/synthesize.js.map +1 -0
- package/dist/search/answer-synthesis.d.ts +33 -0
- package/dist/search/answer-synthesis.d.ts.map +1 -0
- package/dist/search/answer-synthesis.js +244 -0
- package/dist/search/answer-synthesis.js.map +1 -0
- package/dist/search/context-formatter.d.ts +3 -0
- package/dist/search/context-formatter.d.ts.map +1 -0
- package/dist/search/context-formatter.js +56 -0
- package/dist/search/context-formatter.js.map +1 -0
- package/dist/search/dedup.d.ts +1 -0
- package/dist/search/dedup.d.ts.map +1 -1
- package/dist/search/dedup.js +40 -32
- package/dist/search/dedup.js.map +1 -1
- package/dist/search/engines/arxiv.d.ts +7 -0
- package/dist/search/engines/arxiv.d.ts.map +1 -0
- package/dist/search/engines/arxiv.js +70 -0
- package/dist/search/engines/arxiv.js.map +1 -0
- package/dist/search/engines/bing-news.d.ts +7 -0
- package/dist/search/engines/bing-news.d.ts.map +1 -0
- package/dist/search/engines/bing-news.js +97 -0
- package/dist/search/engines/bing-news.js.map +1 -0
- package/dist/search/engines/bing.d.ts +1 -0
- package/dist/search/engines/bing.d.ts.map +1 -1
- package/dist/search/engines/bing.js +100 -44
- package/dist/search/engines/bing.js.map +1 -1
- package/dist/search/engines/devdocs.d.ts +6 -0
- package/dist/search/engines/devdocs.d.ts.map +1 -0
- package/dist/search/engines/devdocs.js +56 -0
- package/dist/search/engines/devdocs.js.map +1 -0
- package/dist/search/engines/duckduckgo.d.ts.map +1 -1
- package/dist/search/engines/duckduckgo.js +56 -44
- package/dist/search/engines/duckduckgo.js.map +1 -1
- package/dist/search/engines/github-code.d.ts +7 -0
- package/dist/search/engines/github-code.d.ts.map +1 -0
- package/dist/search/engines/github-code.js +55 -0
- package/dist/search/engines/github-code.js.map +1 -0
- package/dist/search/engines/hn-algolia.d.ts +7 -0
- package/dist/search/engines/hn-algolia.d.ts.map +1 -0
- package/dist/search/engines/hn-algolia.js +76 -0
- package/dist/search/engines/hn-algolia.js.map +1 -0
- package/dist/search/engines/lobsters.d.ts +7 -0
- package/dist/search/engines/lobsters.d.ts.map +1 -0
- package/dist/search/engines/lobsters.js +83 -0
- package/dist/search/engines/lobsters.js.map +1 -0
- package/dist/search/engines/mdn.d.ts +7 -0
- package/dist/search/engines/mdn.d.ts.map +1 -0
- package/dist/search/engines/mdn.js +48 -0
- package/dist/search/engines/mdn.js.map +1 -0
- package/dist/search/engines/semantic-scholar.d.ts +7 -0
- package/dist/search/engines/semantic-scholar.d.ts.map +1 -0
- package/dist/search/engines/semantic-scholar.js +69 -0
- package/dist/search/engines/semantic-scholar.js.map +1 -0
- package/dist/search/engines/stackoverflow.d.ts +7 -0
- package/dist/search/engines/stackoverflow.d.ts.map +1 -0
- package/dist/search/engines/stackoverflow.js +73 -0
- package/dist/search/engines/stackoverflow.js.map +1 -0
- package/dist/search/engines/startpage.d.ts.map +1 -1
- package/dist/search/engines/startpage.js +65 -46
- package/dist/search/engines/startpage.js.map +1 -1
- package/dist/search/evidence.d.ts +25 -0
- package/dist/search/evidence.d.ts.map +1 -0
- package/dist/search/evidence.js +220 -0
- package/dist/search/evidence.js.map +1 -0
- package/dist/search/filters.js +49 -55
- package/dist/search/filters.js.map +1 -1
- package/dist/search/find-similar/crawl-rank.d.ts +9 -0
- package/dist/search/find-similar/crawl-rank.d.ts.map +1 -0
- package/dist/search/find-similar/crawl-rank.js +272 -0
- package/dist/search/find-similar/crawl-rank.js.map +1 -0
- package/dist/search/find-similar/mode.d.ts +4 -0
- package/dist/search/find-similar/mode.d.ts.map +1 -0
- package/dist/search/find-similar/mode.js +12 -0
- package/dist/search/find-similar/mode.js.map +1 -0
- package/dist/search/find-similar.d.ts +5 -0
- package/dist/search/find-similar.d.ts.map +1 -0
- package/dist/search/find-similar.js +509 -0
- package/dist/search/find-similar.js.map +1 -0
- package/dist/search/highlights.d.ts +19 -0
- package/dist/search/highlights.d.ts.map +1 -0
- package/dist/search/highlights.js +167 -0
- package/dist/search/highlights.js.map +1 -0
- package/dist/search/language-filter.d.ts +29 -0
- package/dist/search/language-filter.d.ts.map +1 -0
- package/dist/search/language-filter.js +126 -0
- package/dist/search/language-filter.js.map +1 -0
- package/dist/search/legacy/searxng-orchestrator.d.ts +4 -0
- package/dist/search/legacy/searxng-orchestrator.d.ts.map +1 -0
- package/dist/search/legacy/searxng-orchestrator.js +501 -0
- package/dist/search/legacy/searxng-orchestrator.js.map +1 -0
- package/dist/search/legacy/searxng-provider.d.ts +7 -0
- package/dist/search/legacy/searxng-provider.d.ts.map +1 -0
- package/dist/search/legacy/searxng-provider.js +11 -0
- package/dist/search/legacy/searxng-provider.js.map +1 -0
- package/dist/search/multi-query.d.ts +25 -0
- package/dist/search/multi-query.d.ts.map +1 -0
- package/dist/search/multi-query.js +228 -0
- package/dist/search/multi-query.js.map +1 -0
- package/dist/search/query.js +32 -34
- package/dist/search/query.js.map +1 -1
- package/dist/search/rerank.d.ts +3 -1
- package/dist/search/rerank.d.ts.map +1 -1
- package/dist/search/rerank.js +44 -35
- package/dist/search/rerank.js.map +1 -1
- package/dist/search/reranker/authority-boost.d.ts +3 -0
- package/dist/search/reranker/authority-boost.d.ts.map +1 -0
- package/dist/search/reranker/authority-boost.js +179 -0
- package/dist/search/reranker/authority-boost.js.map +1 -0
- package/dist/search/reranker/consensus-boost.d.ts +3 -0
- package/dist/search/reranker/consensus-boost.d.ts.map +1 -0
- package/dist/search/reranker/consensus-boost.js +27 -0
- package/dist/search/reranker/consensus-boost.js.map +1 -0
- package/dist/search/reranker/recency-boost.d.ts +3 -0
- package/dist/search/reranker/recency-boost.d.ts.map +1 -0
- package/dist/search/reranker/recency-boost.js +13 -0
- package/dist/search/reranker/recency-boost.js.map +1 -0
- package/dist/search/reranker/recency.d.ts +3 -0
- package/dist/search/reranker/recency.d.ts.map +1 -0
- package/dist/search/reranker/recency.js +23 -0
- package/dist/search/reranker/recency.js.map +1 -0
- package/dist/search/reranker/transformers-rerank-provider.d.ts +12 -0
- package/dist/search/reranker/transformers-rerank-provider.d.ts.map +1 -0
- package/dist/search/reranker/transformers-rerank-provider.js +78 -0
- package/dist/search/reranker/transformers-rerank-provider.js.map +1 -0
- package/dist/search/rrf.d.ts +17 -0
- package/dist/search/rrf.d.ts.map +1 -0
- package/dist/search/rrf.js +39 -0
- package/dist/search/rrf.js.map +1 -0
- package/dist/search/sampling.d.ts +25 -0
- package/dist/search/sampling.d.ts.map +1 -0
- package/dist/search/sampling.js +52 -0
- package/dist/search/sampling.js.map +1 -0
- package/dist/search/searxng.d.ts.map +1 -1
- package/dist/search/searxng.js +69 -79
- package/dist/search/searxng.js.map +1 -1
- package/dist/search/tokens.d.ts +3 -0
- package/dist/search/tokens.d.ts.map +1 -0
- package/dist/search/tokens.js +39 -0
- package/dist/search/tokens.js.map +1 -0
- package/dist/search/truncate.d.ts +6 -0
- package/dist/search/truncate.d.ts.map +1 -0
- package/dist/search/truncate.js +26 -0
- package/dist/search/truncate.js.map +1 -0
- package/dist/search/url-unwrap.d.ts +3 -0
- package/dist/search/url-unwrap.d.ts.map +1 -0
- package/dist/search/url-unwrap.js +43 -0
- package/dist/search/url-unwrap.js.map +1 -0
- package/dist/search/v1/context-rank.d.ts +13 -0
- package/dist/search/v1/context-rank.d.ts.map +1 -0
- package/dist/search/v1/context-rank.js +74 -0
- package/dist/search/v1/context-rank.js.map +1 -0
- package/dist/search/v1/engine-base.d.ts +27 -0
- package/dist/search/v1/engine-base.d.ts.map +1 -0
- package/dist/search/v1/engine-base.js +110 -0
- package/dist/search/v1/engine-base.js.map +1 -0
- package/dist/search/v1/intent-router.d.ts +22 -0
- package/dist/search/v1/intent-router.d.ts.map +1 -0
- package/dist/search/v1/intent-router.js +138 -0
- package/dist/search/v1/intent-router.js.map +1 -0
- package/dist/search/v1/orchestrator.d.ts +24 -0
- package/dist/search/v1/orchestrator.d.ts.map +1 -0
- package/dist/search/v1/orchestrator.js +163 -0
- package/dist/search/v1/orchestrator.js.map +1 -0
- package/dist/search/v1/recency-boost.d.ts +9 -0
- package/dist/search/v1/recency-boost.d.ts.map +1 -0
- package/dist/search/v1/recency-boost.js +37 -0
- package/dist/search/v1/recency-boost.js.map +1 -0
- package/dist/search/v1/recent-cache-dedup.d.ts +6 -0
- package/dist/search/v1/recent-cache-dedup.d.ts.map +1 -0
- package/dist/search/v1/recent-cache-dedup.js +85 -0
- package/dist/search/v1/recent-cache-dedup.js.map +1 -0
- package/dist/search/v1/rss/feed-config.d.ts +21 -0
- package/dist/search/v1/rss/feed-config.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-config.js +90 -0
- package/dist/search/v1/rss/feed-config.js.map +1 -0
- package/dist/search/v1/rss/feed-parser.d.ts +14 -0
- package/dist/search/v1/rss/feed-parser.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-parser.js +104 -0
- package/dist/search/v1/rss/feed-parser.js.map +1 -0
- package/dist/search/v1/rss/feed-poller.d.ts +22 -0
- package/dist/search/v1/rss/feed-poller.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-poller.js +102 -0
- package/dist/search/v1/rss/feed-poller.js.map +1 -0
- package/dist/search/v1/rss/feed-store.d.ts +30 -0
- package/dist/search/v1/rss/feed-store.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-store.js +134 -0
- package/dist/search/v1/rss/feed-store.js.map +1 -0
- package/dist/search/v1/rss/rss-engine.d.ts +6 -0
- package/dist/search/v1/rss/rss-engine.d.ts.map +1 -0
- package/dist/search/v1/rss/rss-engine.js +28 -0
- package/dist/search/v1/rss/rss-engine.js.map +1 -0
- package/dist/search/v1/v1-provider.d.ts +7 -0
- package/dist/search/v1/v1-provider.d.ts.map +1 -0
- package/dist/search/v1/v1-provider.js +68 -0
- package/dist/search/v1/v1-provider.js.map +1 -0
- package/dist/search/v1/verticals/code.d.ts +4 -0
- package/dist/search/v1/verticals/code.d.ts.map +1 -0
- package/dist/search/v1/verticals/code.js +20 -0
- package/dist/search/v1/verticals/code.js.map +1 -0
- package/dist/search/v1/verticals/docs.d.ts +4 -0
- package/dist/search/v1/verticals/docs.d.ts.map +1 -0
- package/dist/search/v1/verticals/docs.js +20 -0
- package/dist/search/v1/verticals/docs.js.map +1 -0
- package/dist/search/v1/verticals/general.d.ts +4 -0
- package/dist/search/v1/verticals/general.d.ts.map +1 -0
- package/dist/search/v1/verticals/general.js +22 -0
- package/dist/search/v1/verticals/general.js.map +1 -0
- package/dist/search/v1/verticals/news.d.ts +10 -0
- package/dist/search/v1/verticals/news.d.ts.map +1 -0
- package/dist/search/v1/verticals/news.js +52 -0
- package/dist/search/v1/verticals/news.js.map +1 -0
- package/dist/search/v1/verticals/papers.d.ts +4 -0
- package/dist/search/v1/verticals/papers.d.ts.map +1 -0
- package/dist/search/v1/verticals/papers.js +23 -0
- package/dist/search/v1/verticals/papers.js.map +1 -0
- package/dist/search/validator.js +31 -31
- package/dist/search/validator.js.map +1 -1
- package/dist/searxng/bootstrap.d.ts +30 -0
- package/dist/searxng/bootstrap.d.ts.map +1 -1
- package/dist/searxng/bootstrap.js +223 -85
- package/dist/searxng/bootstrap.js.map +1 -1
- package/dist/searxng/docker.d.ts.map +1 -1
- package/dist/searxng/docker.js +69 -60
- package/dist/searxng/docker.js.map +1 -1
- package/dist/searxng/process.d.ts +13 -1
- package/dist/searxng/process.d.ts.map +1 -1
- package/dist/searxng/process.js +231 -164
- package/dist/searxng/process.js.map +1 -1
- package/dist/server/backend-status.d.ts +13 -0
- package/dist/server/backend-status.d.ts.map +1 -0
- package/dist/server/backend-status.js +40 -0
- package/dist/server/backend-status.js.map +1 -0
- package/dist/server/tool-schemas.d.ts +549 -0
- package/dist/server/tool-schemas.d.ts.map +1 -0
- package/dist/server/tool-schemas.js +464 -0
- package/dist/server/tool-schemas.js.map +1 -0
- package/dist/server/warmup-on-start.d.ts +9 -0
- package/dist/server/warmup-on-start.d.ts.map +1 -0
- package/dist/server/warmup-on-start.js +55 -0
- package/dist/server/warmup-on-start.js.map +1 -0
- package/dist/server.d.ts +17 -0
- package/dist/server.d.ts.map +1 -1
- package/dist/server.js +454 -297
- package/dist/server.js.map +1 -1
- package/dist/tools/agent.d.ts +5 -0
- package/dist/tools/agent.d.ts.map +1 -0
- package/dist/tools/agent.js +128 -0
- package/dist/tools/agent.js.map +1 -0
- package/dist/tools/cache.d.ts +2 -1
- package/dist/tools/cache.d.ts.map +1 -1
- package/dist/tools/cache.js +175 -44
- package/dist/tools/cache.js.map +1 -1
- package/dist/tools/crawl.d.ts.map +1 -1
- package/dist/tools/crawl.js +171 -88
- package/dist/tools/crawl.js.map +1 -1
- package/dist/tools/extract.d.ts +2 -2
- package/dist/tools/extract.d.ts.map +1 -1
- package/dist/tools/extract.js +175 -59
- package/dist/tools/extract.js.map +1 -1
- package/dist/tools/fetch.d.ts +2 -2
- package/dist/tools/fetch.d.ts.map +1 -1
- package/dist/tools/fetch.js +161 -68
- package/dist/tools/fetch.js.map +1 -1
- package/dist/tools/find-similar.d.ts +5 -0
- package/dist/tools/find-similar.d.ts.map +1 -0
- package/dist/tools/find-similar.js +127 -0
- package/dist/tools/find-similar.js.map +1 -0
- package/dist/tools/research.d.ts +5 -0
- package/dist/tools/research.d.ts.map +1 -0
- package/dist/tools/research.js +107 -0
- package/dist/tools/research.js.map +1 -0
- package/dist/tools/search.d.ts +10 -2
- package/dist/tools/search.d.ts.map +1 -1
- package/dist/tools/search.js +13 -158
- package/dist/tools/search.js.map +1 -1
- package/dist/types.d.ts +350 -7
- package/dist/types.d.ts.map +1 -1
- package/dist/types.js +6 -1
- package/dist/types.js.map +1 -1
- package/dist/util/mode.d.ts +4 -0
- package/dist/util/mode.d.ts.map +1 -0
- package/dist/util/mode.js +34 -0
- package/dist/util/mode.js.map +1 -0
- package/package.json +78 -8
- package/dist/extraction/trafilatura.d.ts +0 -6
- package/dist/extraction/trafilatura.d.ts.map +0 -1
- package/dist/extraction/trafilatura.js +0 -105
- package/dist/extraction/trafilatura.js.map +0 -1
- package/dist/search/flashrank.d.ts +0 -12
- package/dist/search/flashrank.d.ts.map +0 -1
- package/dist/search/flashrank.js +0 -63
- package/dist/search/flashrank.js.map +0 -1
|
@@ -0,0 +1,90 @@
|
|
|
1
|
+
import { readFileSync, existsSync } from "node:fs";
|
|
2
|
+
import { join } from "node:path";
|
|
3
|
+
import { getConfig } from "../../../config.js";
|
|
4
|
+
import { createLogger } from "../../../logger.js";
|
|
5
|
+
// Module-level logger shared by the feed-config loaders; created with the label "search".
const log = createLogger("search");
|
|
6
|
+
/**
 * Report whether `raw` parses as an absolute URL whose scheme is http or https.
 *
 * @param raw Candidate URL string.
 * @returns `true` for parseable http/https URLs; `false` for any other scheme
 *   or when the URL constructor rejects the input.
 */
function isValidUrl(raw) {
  let parsed;
  try {
    parsed = new URL(raw);
  } catch {
    // The URL constructor throws on unparseable input; treat that as "invalid".
    return false;
  }
  return ["http:", "https:"].includes(parsed.protocol);
}
|
|
14
|
+
/**
 * Build feed configs from the `WIGOLO_RSS_FEEDS` environment variable, which is
 * read as a comma-separated list of URLs.
 *
 * Blank pieces are skipped silently. Pieces that fail `isValidUrl` are skipped
 * after a warning is logged.
 *
 * @returns One `{ url }` object per valid piece, in the order they appear;
 *   an empty array when the variable is unset or empty.
 */
function loadEnvFeeds() {
  const raw = process.env.WIGOLO_RSS_FEEDS;
  if (!raw) return [];

  const feeds = [];
  const candidates = raw
    .split(",")
    .map((piece) => piece.trim())
    .filter((piece) => piece.length > 0);

  for (const candidate of candidates) {
    if (isValidUrl(candidate)) {
      feeds.push({ url: candidate });
    } else {
      log.warn("invalid RSS feed URL in env", { url: candidate });
    }
  }
  return feeds;
}
|
|
29
|
+
/**
 * Load feed configs from `<dataDir>/rss-feeds.json`.
 *
 * The file is expected to contain a JSON array of objects. Every failure mode
 * (missing file, unreadable file, malformed JSON, non-array root) yields an
 * empty array; all but the missing-file case also log a warning.
 *
 * Per entry:
 * - non-object entries are skipped silently;
 * - `url` must be a string that, once trimmed, passes `isValidUrl`; otherwise
 *   the entry is skipped with a warning;
 * - `category` is copied only when it is a non-empty string;
 * - `intervalSec` is copied only when it is a finite number greater than zero.
 *
 * @param dataDir Directory that may contain `rss-feeds.json`.
 * @returns The accepted feed entries, in file order.
 */
function loadFileFeeds(dataDir) {
  const filePath = join(dataDir, "rss-feeds.json");
  if (!existsSync(filePath)) return [];

  // Normalise anything thrown into a loggable message.
  const describe = (err) => (err instanceof Error ? err.message : String(err));

  let text;
  try {
    text = readFileSync(filePath, "utf8");
  } catch (err) {
    log.warn("could not read rss-feeds.json", { path: filePath, error: describe(err) });
    return [];
  }

  let data;
  try {
    data = JSON.parse(text);
  } catch (err) {
    log.warn("malformed rss-feeds.json \u2014 ignoring", { path: filePath, error: describe(err) });
    return [];
  }

  if (!Array.isArray(data)) {
    log.warn("rss-feeds.json must be an array \u2014 ignoring", { path: filePath });
    return [];
  }

  const feeds = [];
  for (const entry of data) {
    if (entry === null || typeof entry !== "object") continue;

    const url = typeof entry.url === "string" ? entry.url.trim() : "";
    if (url === "" || !isValidUrl(url)) {
      log.warn("invalid RSS feed URL in rss-feeds.json", { url });
      continue;
    }

    const { category, intervalSec } = entry;
    const feed = { url };
    if (typeof category === "string" && category !== "") {
      feed.category = category;
    }
    if (typeof intervalSec === "number" && isFinite(intervalSec) && intervalSec > 0) {
      feed.intervalSec = intervalSec;
    }
    feeds.push(feed);
  }
  return feeds;
}
|
|
75
|
+
/**
 * Load RSS feed configs from the environment and from `<dataDir>/rss-feeds.json`,
 * de-duplicated by URL.
 *
 * File feeds are inserted first and env feeds second, so on a URL collision the
 * env entry replaces the file entry.
 *
 * @param opts Optional overrides; `opts.dataDir` replaces `getConfig().dataDir`.
 * @returns `feeds` (the merged list) and `sources`, which lists "env" and/or
 *   "file" for each origin that contributed at least one feed.
 */
function loadFeedConfig(opts) {
  const dataDir = opts?.dataDir ?? getConfig().dataDir;
  const fromEnv = loadEnvFeeds();
  const fromFile = loadFileFeeds(dataDir);

  // Later insertions overwrite earlier ones, so env entries come last.
  const merged = new Map();
  for (const feed of [...fromFile, ...fromEnv]) {
    merged.set(feed.url, feed);
  }

  const sources = [];
  if (fromEnv.length > 0) sources.push("env");
  if (fromFile.length > 0) sources.push("file");

  return { feeds: [...merged.values()], sources };
}
|
|
87
|
+
export {
|
|
88
|
+
loadFeedConfig
|
|
89
|
+
};
|
|
90
|
+
//# sourceMappingURL=feed-config.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../../../src/search/v1/rss/feed-config.ts"],"sourcesContent":["import { readFileSync, existsSync } from 'node:fs';\nimport { join } from 'node:path';\nimport { getConfig } from '../../../config.js';\nimport { createLogger } from '../../../logger.js';\n\nconst log = createLogger('search');\n\nexport interface FeedConfig {\n url: string;\n /** Optional category override; defaults to 'news'. */\n category?: string;\n /** Override poll interval per feed in seconds. */\n intervalSec?: number;\n}\n\nexport interface LoadFeedConfigResult {\n feeds: FeedConfig[];\n /** Where feeds came from. */\n sources: Array<'env' | 'file'>;\n}\n\nfunction isValidUrl(raw: string): boolean {\n try {\n const u = new URL(raw);\n return u.protocol === 'http:' || u.protocol === 'https:';\n } catch {\n return false;\n }\n}\n\nfunction loadEnvFeeds(): FeedConfig[] {\n const raw = process.env.WIGOLO_RSS_FEEDS;\n if (!raw) return [];\n const out: FeedConfig[] = [];\n for (const piece of raw.split(',')) {\n const url = piece.trim();\n if (!url) continue;\n if (!isValidUrl(url)) {\n log.warn('invalid RSS feed URL in env', { url });\n continue;\n }\n out.push({ url });\n }\n return out;\n}\n\ninterface FileEntry {\n url?: unknown;\n category?: unknown;\n intervalSec?: unknown;\n}\n\nfunction loadFileFeeds(dataDir: string): FeedConfig[] {\n const path = join(dataDir, 'rss-feeds.json');\n if (!existsSync(path)) return [];\n let raw: string;\n try {\n raw = readFileSync(path, 'utf8');\n } catch (err) {\n log.warn('could not read rss-feeds.json', {\n path,\n error: err instanceof Error ? err.message : String(err),\n });\n return [];\n }\n\n let parsed: unknown;\n try {\n parsed = JSON.parse(raw);\n } catch (err) {\n log.warn('malformed rss-feeds.json — ignoring', {\n path,\n error: err instanceof Error ? 
err.message : String(err),\n });\n return [];\n }\n\n if (!Array.isArray(parsed)) {\n log.warn('rss-feeds.json must be an array — ignoring', { path });\n return [];\n }\n\n const out: FeedConfig[] = [];\n for (const entry of parsed as FileEntry[]) {\n if (!entry || typeof entry !== 'object') continue;\n const url = typeof entry.url === 'string' ? entry.url.trim() : '';\n if (!url || !isValidUrl(url)) {\n log.warn('invalid RSS feed URL in rss-feeds.json', { url });\n continue;\n }\n const feed: FeedConfig = { url };\n if (typeof entry.category === 'string' && entry.category.length > 0) {\n feed.category = entry.category;\n }\n if (typeof entry.intervalSec === 'number' && isFinite(entry.intervalSec) && entry.intervalSec > 0) {\n feed.intervalSec = entry.intervalSec;\n }\n out.push(feed);\n }\n return out;\n}\n\n/**\n * Load feeds from env (`WIGOLO_RSS_FEEDS` — comma-separated URLs) and\n * JSON file (`<dataDir>/rss-feeds.json`). Env entries win on URL collision.\n * Dedup by URL.\n */\nexport function loadFeedConfig(opts?: { dataDir?: string }): LoadFeedConfigResult {\n const dataDir = opts?.dataDir ?? 
getConfig().dataDir;\n const envFeeds = loadEnvFeeds();\n const fileFeeds = loadFileFeeds(dataDir);\n\n const sources: Array<'env' | 'file'> = [];\n if (envFeeds.length > 0) sources.push('env');\n if (fileFeeds.length > 0) sources.push('file');\n\n const byUrl = new Map<string, FeedConfig>();\n for (const f of fileFeeds) byUrl.set(f.url, f);\n for (const f of envFeeds) byUrl.set(f.url, f); // env wins\n\n return { feeds: Array.from(byUrl.values()), sources };\n}\n"],"mappings":"AAAA,SAAS,cAAc,kBAAkB;AACzC,SAAS,YAAY;AACrB,SAAS,iBAAiB;AAC1B,SAAS,oBAAoB;AAE7B,MAAM,MAAM,aAAa,QAAQ;AAgBjC,SAAS,WAAW,KAAsB;AACxC,MAAI;AACF,UAAM,IAAI,IAAI,IAAI,GAAG;AACrB,WAAO,EAAE,aAAa,WAAW,EAAE,aAAa;AAAA,EAClD,QAAQ;AACN,WAAO;AAAA,EACT;AACF;AAEA,SAAS,eAA6B;AACpC,QAAM,MAAM,QAAQ,IAAI;AACxB,MAAI,CAAC,IAAK,QAAO,CAAC;AAClB,QAAM,MAAoB,CAAC;AAC3B,aAAW,SAAS,IAAI,MAAM,GAAG,GAAG;AAClC,UAAM,MAAM,MAAM,KAAK;AACvB,QAAI,CAAC,IAAK;AACV,QAAI,CAAC,WAAW,GAAG,GAAG;AACpB,UAAI,KAAK,+BAA+B,EAAE,IAAI,CAAC;AAC/C;AAAA,IACF;AACA,QAAI,KAAK,EAAE,IAAI,CAAC;AAAA,EAClB;AACA,SAAO;AACT;AAQA,SAAS,cAAc,SAA+B;AACpD,QAAM,OAAO,KAAK,SAAS,gBAAgB;AAC3C,MAAI,CAAC,WAAW,IAAI,EAAG,QAAO,CAAC;AAC/B,MAAI;AACJ,MAAI;AACF,UAAM,aAAa,MAAM,MAAM;AAAA,EACjC,SAAS,KAAK;AACZ,QAAI,KAAK,iCAAiC;AAAA,MACxC;AAAA,MACA,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,IACxD,CAAC;AACD,WAAO,CAAC;AAAA,EACV;AAEA,MAAI;AACJ,MAAI;AACF,aAAS,KAAK,MAAM,GAAG;AAAA,EACzB,SAAS,KAAK;AACZ,QAAI,KAAK,4CAAuC;AAAA,MAC9C;AAAA,MACA,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,IACxD,CAAC;AACD,WAAO,CAAC;AAAA,EACV;AAEA,MAAI,CAAC,MAAM,QAAQ,MAAM,GAAG;AAC1B,QAAI,KAAK,mDAA8C,EAAE,KAAK,CAAC;AAC/D,WAAO,CAAC;AAAA,EACV;AAEA,QAAM,MAAoB,CAAC;AAC3B,aAAW,SAAS,QAAuB;AACzC,QAAI,CAAC,SAAS,OAAO,UAAU,SAAU;AACzC,UAAM,MAAM,OAAO,MAAM,QAAQ,WAAW,MAAM,IAAI,KAAK,IAAI;AAC/D,QAAI,CAAC,OAAO,CAAC,WAAW,GAAG,GAAG;AAC5B,UAAI,KAAK,0CAA0C,EAAE,IAAI,CAAC;AAC1D;AAAA,IACF;AACA,UAAM,OAAmB,EAAE,IAAI;AAC/B,QAAI,OAAO,MAAM,aAAa,YAAY,MAAM,SAAS,SAAS,GAAG;AACnE,WAAK,WAAW,MAAM;AAAA,IACxB;AACA,QAAI,OAAO,MAAM,gBAAgB,YAAY,SAAS,MAAM,WAAW,KAAK,MA
AM,cAAc,GAAG;AACjG,WAAK,cAAc,MAAM;AAAA,IAC3B;AACA,QAAI,KAAK,IAAI;AAAA,EACf;AACA,SAAO;AACT;AAOO,SAAS,eAAe,MAAmD;AAChF,QAAM,UAAU,MAAM,WAAW,UAAU,EAAE;AAC7C,QAAM,WAAW,aAAa;AAC9B,QAAM,YAAY,cAAc,OAAO;AAEvC,QAAM,UAAiC,CAAC;AACxC,MAAI,SAAS,SAAS,EAAG,SAAQ,KAAK,KAAK;AAC3C,MAAI,UAAU,SAAS,EAAG,SAAQ,KAAK,MAAM;AAE7C,QAAM,QAAQ,oBAAI,IAAwB;AAC1C,aAAW,KAAK,UAAW,OAAM,IAAI,EAAE,KAAK,CAAC;AAC7C,aAAW,KAAK,SAAU,OAAM,IAAI,EAAE,KAAK,CAAC;AAE5C,SAAO,EAAE,OAAO,MAAM,KAAK,MAAM,OAAO,CAAC,GAAG,QAAQ;AACtD;","names":[]}
|
|
@@ -0,0 +1,14 @@
|
|
|
1
|
+
/** One entry extracted from an RSS `<item>` or an Atom `<entry>`. */
export interface ParsedFeedItem {
  /** Text of the item's `guid` (RSS) or `id` (Atom); falls back to `link` when absent. */
  guid: string;
  /** Trimmed title text; items without a title are not emitted. */
  title: string;
  /** Item URL; items without a link are not emitted. */
  link: string;
  /** RSS `description` text, or Atom `summary` (falling back to `content`); may be empty. */
  summary: string;
  /** ISO 8601 timestamp; present only when the feed's date text could be parsed. */
  publishedDate?: string;
}
|
|
8
|
+
/** Result of parsing one feed document. */
export interface ParsedFeed {
  /** The feed URL that was passed to the parser, echoed back unchanged. */
  feedUrl: string;
  /** Feed-level title text; falls back to `feedUrl` when the feed has no title. */
  feedTitle: string;
  /** Items that had both a title and a link; may be empty. */
  items: Array<ParsedFeedItem>;
}
|
|
13
|
+
/**
 * Parse RSS or Atom feed text into a `ParsedFeed`.
 *
 * @param xml Raw feed document text.
 * @param feedUrl URL the feed was obtained from; echoed back in the result and
 *   used as the title fallback.
 * @returns The parsed feed, a feed with an empty `items` array when a feed
 *   root element is present but no items were found, or `null` when the input
 *   is blank, fails to parse, or contains no recognizable feed element.
 */
export declare function parseFeed(xml: string, feedUrl: string): ParsedFeed | null;
|
|
14
|
+
//# sourceMappingURL=feed-parser.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"feed-parser.d.ts","sourceRoot":"","sources":["../../../../src/search/v1/rss/feed-parser.ts"],"names":[],"mappings":"AAKA,MAAM,WAAW,cAAc;IAC7B,IAAI,EAAE,MAAM,CAAC;IACb,KAAK,EAAE,MAAM,CAAC;IACd,IAAI,EAAE,MAAM,CAAC;IACb,OAAO,EAAE,MAAM,CAAC;IAChB,aAAa,CAAC,EAAE,MAAM,CAAC;CACxB;AAED,MAAM,WAAW,UAAU;IACzB,OAAO,EAAE,MAAM,CAAC;IAChB,SAAS,EAAE,MAAM,CAAC;IAClB,KAAK,EAAE,cAAc,EAAE,CAAC;CACzB;AAgGD,wBAAgB,SAAS,CAAC,GAAG,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,GAAG,UAAU,GAAG,IAAI,CAgCzE"}
|
|
@@ -0,0 +1,104 @@
|
|
|
1
|
+
import { parseHTML } from "linkedom";
|
|
2
|
+
import { createLogger } from "../../../logger.js";
|
|
3
|
+
// Module-level logger used for feed parse warnings; created with the label "search".
const log = createLogger("search");
|
|
4
|
+
/**
 * Return an element's trimmed text content.
 *
 * @param el Element to read; may be null or undefined.
 * @returns The trimmed `textContent`, or "" when the element or its text is missing.
 */
function textOf(el) {
  return (el?.textContent ?? "").trim();
}
|
|
8
|
+
/**
 * Convert a date string to ISO 8601 form.
 *
 * @param raw Date text as found in the feed; may be empty, null or undefined.
 * @returns The `Date#toISOString()` form, or `undefined` when `raw` is empty
 *   or `Date` cannot parse it.
 */
function toIso(raw) {
  const timestamp = raw ? new Date(raw).getTime() : Number.NaN;
  return Number.isNaN(timestamp) ? undefined : new Date(timestamp).toISOString();
}
|
|
14
|
+
/**
 * Extract an RSS feed from a parsed document.
 *
 * Item links are read from `<rsslink>` elements, so the input is expected to
 * have had its RSS `<link>` tags renamed before parsing.
 *
 * @param doc Parsed document to search.
 * @param feedUrl Feed URL; echoed in the result and used when the channel has no title.
 * @returns The parsed feed, or `null` when there is no channel or the channel
 *   has no `<item>` elements. Items lacking a title or link are dropped, so
 *   `items` may still be empty.
 */
function parseRss(doc, feedUrl) {
  const channel = doc.querySelector("rss > channel") ?? doc.querySelector("channel");
  if (!channel) return null;

  const itemEls = Array.from(channel.querySelectorAll("item"));
  if (itemEls.length === 0) return null;

  const childText = (parent, selector) => textOf(parent.querySelector(selector));
  const feedTitle = childText(channel, "title") || feedUrl;

  const items = itemEls.flatMap((itemEl) => {
    const title = childText(itemEl, "title");
    const link = childText(itemEl, "rsslink");
    const summary = childText(itemEl, "description");
    const guidText = childText(itemEl, "guid");
    const pubDate = childText(itemEl, "pubDate");

    if (title === "" || link === "") return [];

    const publishedDate = toIso(pubDate);
    return [
      {
        guid: guidText || link,
        title,
        link,
        summary,
        // Only attach the date when it parsed.
        ...(publishedDate ? { publishedDate } : {}),
      },
    ];
  });

  return { feedUrl, feedTitle, items };
}
|
|
40
|
+
/**
 * Extract an Atom feed from a parsed document.
 *
 * For each entry the link is the `href` of the first `<link>` whose `rel` is
 * "alternate" or absent, else the first `<link>` of any kind. The date comes
 * from `<published>`, falling back to `<updated>`.
 *
 * @param doc Parsed document to search.
 * @param feedUrl Feed URL; echoed in the result and used when the feed has no title.
 * @returns The parsed feed, or `null` when there is no `<feed>` element or it
 *   has no `<entry>` elements. Entries lacking a title or link are dropped.
 */
function parseAtom(doc, feedUrl) {
  const feed = doc.querySelector("feed");
  if (!feed) return null;

  const entryEls = Array.from(feed.querySelectorAll("entry"));
  if (entryEls.length === 0) return null;

  const feedTitle = textOf(feed.querySelector("title")) || feedUrl;
  // A <link> with no rel attribute counts as rel="alternate".
  const isAlternate = (linkEl) => (linkEl.getAttribute("rel") ?? "alternate") === "alternate";

  const items = entryEls.flatMap((entryEl) => {
    const title = textOf(entryEl.querySelector("title"));
    const preferredLink =
      Array.from(entryEl.querySelectorAll("link")).find(isAlternate) ??
      entryEl.querySelector("link");
    const link = preferredLink?.getAttribute("href") ?? "";
    const summary =
      textOf(entryEl.querySelector("summary")) || textOf(entryEl.querySelector("content"));
    const idText = textOf(entryEl.querySelector("id"));
    const dateText =
      textOf(entryEl.querySelector("published")) || textOf(entryEl.querySelector("updated"));

    if (!title || !link) return [];

    const publishedDate = toIso(dateText);
    return [
      {
        guid: idText || link,
        title,
        link,
        summary,
        ...(publishedDate ? { publishedDate } : {}),
      },
    ];
  });

  return { feedUrl, feedTitle, items };
}
|
|
71
|
+
/**
 * Rename every attribute-less `<link>…</link>` pair to `<rsslink>…</rsslink>`,
 * keeping the enclosed text. `<link>` tags that carry attributes (the Atom
 * form) do not match the pattern and are left as they are.
 *
 * @param xml Raw feed text.
 * @returns The feed text with RSS-style links renamed.
 */
function rewriteRssLinks(xml) {
  return xml.replace(
    /<link>([\s\S]*?)<\/link>/g,
    (_match, inner) => "<rsslink>" + inner + "</rsslink>",
  );
}
|
|
74
|
+
/**
 * Parse RSS or Atom feed text.
 *
 * The RSS shape is tried first, then Atom. When neither yields a result but a
 * feed root element (`rss`, `channel` or `feed`) is present, a feed with an
 * empty `items` array is returned.
 *
 * @param xml Raw feed document text.
 * @param feedUrl Feed URL; echoed in the result and used as the title fallback.
 * @returns The parsed feed, or `null` when the input is blank, the parser
 *   throws (a warning is logged), or no feed root element is found.
 */
function parseFeed(xml, feedUrl) {
  if (!xml || xml.trim().length === 0) return null;

  // RSS <link> tags are renamed before parsing; parseRss reads <rsslink>.
  const prepared = rewriteRssLinks(xml);

  let doc;
  try {
    doc = parseHTML(prepared).document;
  } catch (err) {
    log.warn("feed XML parse failed", {
      feedUrl,
      error: err instanceof Error ? err.message : String(err),
    });
    return null;
  }

  const populated = parseRss(doc, feedUrl) ?? parseAtom(doc, feedUrl);
  if (populated) return populated;

  const hasFeedRoot =
    doc.querySelector("rss") || doc.querySelector("channel") || doc.querySelector("feed");
  if (!hasFeedRoot) return null;

  // A feed root exists but produced no result above: report an empty feed.
  const titleSelector = doc.querySelector("feed") ? "feed > title" : "channel > title";
  return {
    feedUrl,
    feedTitle: textOf(doc.querySelector(titleSelector)) || feedUrl,
    items: [],
  };
}
|
|
101
|
+
export {
|
|
102
|
+
parseFeed
|
|
103
|
+
};
|
|
104
|
+
//# sourceMappingURL=feed-parser.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../../../src/search/v1/rss/feed-parser.ts"],"sourcesContent":["import { parseHTML } from 'linkedom';\nimport { createLogger } from '../../../logger.js';\n\nconst log = createLogger('search');\n\nexport interface ParsedFeedItem {\n guid: string;\n title: string;\n link: string;\n summary: string;\n publishedDate?: string;\n}\n\nexport interface ParsedFeed {\n feedUrl: string;\n feedTitle: string;\n items: ParsedFeedItem[];\n}\n\nfunction textOf(el: Element | null | undefined): string {\n if (!el) return '';\n return (el.textContent ?? '').trim();\n}\n\nfunction toIso(raw: string | undefined | null): string | undefined {\n if (!raw) return undefined;\n const d = new Date(raw);\n if (isNaN(d.getTime())) return undefined;\n return d.toISOString();\n}\n\nfunction parseRss(doc: Document, feedUrl: string): ParsedFeed | null {\n const channel = doc.querySelector('rss > channel') ?? doc.querySelector('channel');\n if (!channel) return null;\n const items = Array.from(channel.querySelectorAll('item'));\n if (items.length === 0) return null;\n\n const feedTitle = textOf(channel.querySelector('title')) || feedUrl;\n const parsed: ParsedFeedItem[] = [];\n\n for (const item of items) {\n const title = textOf(item.querySelector('title'));\n const link = textOf(item.querySelector('rsslink'));\n const description = textOf(item.querySelector('description'));\n const guid = textOf(item.querySelector('guid')) || link;\n const pubDate = textOf(item.querySelector('pubDate'));\n\n if (!title || !link) continue;\n\n const entry: ParsedFeedItem = {\n guid: guid || link,\n title,\n link,\n summary: description,\n };\n const iso = toIso(pubDate);\n if (iso) entry.publishedDate = iso;\n parsed.push(entry);\n }\n\n return { feedUrl, feedTitle, items: parsed };\n}\n\nfunction parseAtom(doc: Document, feedUrl: string): ParsedFeed | null {\n const feed = doc.querySelector('feed');\n if (!feed) return null;\n const entries = Array.from(feed.querySelectorAll('entry'));\n 
if (entries.length === 0) return null;\n\n const feedTitle = textOf(feed.querySelector('title')) || feedUrl;\n const parsed: ParsedFeedItem[] = [];\n\n for (const entry of entries) {\n const title = textOf(entry.querySelector('title'));\n // Atom: <link rel=\"alternate\" href=\"...\"/> — prefer alternate, else first link\n const linkEl = Array.from(entry.querySelectorAll('link')).find(\n (l) => (l.getAttribute('rel') ?? 'alternate') === 'alternate',\n ) ?? entry.querySelector('link');\n const link = linkEl?.getAttribute('href') ?? '';\n const summaryEl = entry.querySelector('summary');\n const contentEl = entry.querySelector('content');\n const summary = textOf(summaryEl) || textOf(contentEl);\n const id = textOf(entry.querySelector('id')) || link;\n const published = textOf(entry.querySelector('published')) || textOf(entry.querySelector('updated'));\n\n if (!title || !link) continue;\n\n const item: ParsedFeedItem = {\n guid: id || link,\n title,\n link,\n summary,\n };\n const iso = toIso(published);\n if (iso) item.publishedDate = iso;\n parsed.push(item);\n }\n\n return { feedUrl, feedTitle, items: parsed };\n}\n\n/**\n * linkedom treats <link> as an HTML void element (self-closing), so RSS\n * <link>https://...</link> ends up with the URL as a text node sibling\n * rather than the link's textContent. Atom uses <link href=\"...\" /> which\n * is fine. We rewrite RSS-style <link>URL</link> → <rsslink>URL</rsslink>\n * so the URL becomes the element's textContent. 
Atom <link rel=\"...\" href=\"...\"/>\n * is left untouched.\n */\nfunction rewriteRssLinks(xml: string): string {\n return xml.replace(/<link>([\\s\\S]*?)<\\/link>/g, '<rsslink>$1</rsslink>');\n}\n\nexport function parseFeed(xml: string, feedUrl: string): ParsedFeed | null {\n if (!xml || xml.trim().length === 0) return null;\n const prepared = rewriteRssLinks(xml);\n let doc: Document;\n try {\n ({ document: doc } = parseHTML(prepared));\n } catch (err) {\n log.warn('feed XML parse failed', {\n feedUrl,\n error: err instanceof Error ? err.message : String(err),\n });\n return null;\n }\n\n // Prefer RSS shape — if a channel + items exist, use them.\n const rss = parseRss(doc, feedUrl);\n if (rss) return rss;\n\n const atom = parseAtom(doc, feedUrl);\n if (atom) return atom;\n\n // Distinguish \"empty but valid feed\" vs \"not a feed at all\".\n if (doc.querySelector('rss') || doc.querySelector('channel') || doc.querySelector('feed')) {\n const isAtom = !!doc.querySelector('feed');\n return {\n feedUrl,\n feedTitle: textOf(doc.querySelector(isAtom ? 
'feed > title' : 'channel > title')) || feedUrl,\n items: [],\n };\n }\n\n return null;\n}\n"],"mappings":"AAAA,SAAS,iBAAiB;AAC1B,SAAS,oBAAoB;AAE7B,MAAM,MAAM,aAAa,QAAQ;AAgBjC,SAAS,OAAO,IAAwC;AACtD,MAAI,CAAC,GAAI,QAAO;AAChB,UAAQ,GAAG,eAAe,IAAI,KAAK;AACrC;AAEA,SAAS,MAAM,KAAoD;AACjE,MAAI,CAAC,IAAK,QAAO;AACjB,QAAM,IAAI,IAAI,KAAK,GAAG;AACtB,MAAI,MAAM,EAAE,QAAQ,CAAC,EAAG,QAAO;AAC/B,SAAO,EAAE,YAAY;AACvB;AAEA,SAAS,SAAS,KAAe,SAAoC;AACnE,QAAM,UAAU,IAAI,cAAc,eAAe,KAAK,IAAI,cAAc,SAAS;AACjF,MAAI,CAAC,QAAS,QAAO;AACrB,QAAM,QAAQ,MAAM,KAAK,QAAQ,iBAAiB,MAAM,CAAC;AACzD,MAAI,MAAM,WAAW,EAAG,QAAO;AAE/B,QAAM,YAAY,OAAO,QAAQ,cAAc,OAAO,CAAC,KAAK;AAC5D,QAAM,SAA2B,CAAC;AAElC,aAAW,QAAQ,OAAO;AACxB,UAAM,QAAQ,OAAO,KAAK,cAAc,OAAO,CAAC;AAChD,UAAM,OAAO,OAAO,KAAK,cAAc,SAAS,CAAC;AACjD,UAAM,cAAc,OAAO,KAAK,cAAc,aAAa,CAAC;AAC5D,UAAM,OAAO,OAAO,KAAK,cAAc,MAAM,CAAC,KAAK;AACnD,UAAM,UAAU,OAAO,KAAK,cAAc,SAAS,CAAC;AAEpD,QAAI,CAAC,SAAS,CAAC,KAAM;AAErB,UAAM,QAAwB;AAAA,MAC5B,MAAM,QAAQ;AAAA,MACd;AAAA,MACA;AAAA,MACA,SAAS;AAAA,IACX;AACA,UAAM,MAAM,MAAM,OAAO;AACzB,QAAI,IAAK,OAAM,gBAAgB;AAC/B,WAAO,KAAK,KAAK;AAAA,EACnB;AAEA,SAAO,EAAE,SAAS,WAAW,OAAO,OAAO;AAC7C;AAEA,SAAS,UAAU,KAAe,SAAoC;AACpE,QAAM,OAAO,IAAI,cAAc,MAAM;AACrC,MAAI,CAAC,KAAM,QAAO;AAClB,QAAM,UAAU,MAAM,KAAK,KAAK,iBAAiB,OAAO,CAAC;AACzD,MAAI,QAAQ,WAAW,EAAG,QAAO;AAEjC,QAAM,YAAY,OAAO,KAAK,cAAc,OAAO,CAAC,KAAK;AACzD,QAAM,SAA2B,CAAC;AAElC,aAAW,SAAS,SAAS;AAC3B,UAAM,QAAQ,OAAO,MAAM,cAAc,OAAO,CAAC;AAEjD,UAAM,SAAS,MAAM,KAAK,MAAM,iBAAiB,MAAM,CAAC,EAAE;AAAA,MACxD,CAAC,OAAO,EAAE,aAAa,KAAK,KAAK,iBAAiB;AAAA,IACpD,KAAK,MAAM,cAAc,MAAM;AAC/B,UAAM,OAAO,QAAQ,aAAa,MAAM,KAAK;AAC7C,UAAM,YAAY,MAAM,cAAc,SAAS;AAC/C,UAAM,YAAY,MAAM,cAAc,SAAS;AAC/C,UAAM,UAAU,OAAO,SAAS,KAAK,OAAO,SAAS;AACrD,UAAM,KAAK,OAAO,MAAM,cAAc,IAAI,CAAC,KAAK;AAChD,UAAM,YAAY,OAAO,MAAM,cAAc,WAAW,CAAC,KAAK,OAAO,MAAM,cAAc,SAAS,CAAC;AAEnG,QAAI,CAAC,SAAS,CAAC,KAAM;AAErB,UAAM,OAAuB;AAAA,MAC3B,MAAM,MAAM;AAAA,MACZ;AAAA,MACA;AAAA,MACA;AAAA,IACF;AACA,UAAM,MAAM,MAAM,SAAS;AAC3B,QAAI,IAAK,MAAK,gBAAgB;AAC9B,WAAO,KAAK,IAAI;AAAA,EAClB;AAEA,
SAAO,EAAE,SAAS,WAAW,OAAO,OAAO;AAC7C;AAUA,SAAS,gBAAgB,KAAqB;AAC5C,SAAO,IAAI,QAAQ,6BAA6B,uBAAuB;AACzE;AAEO,SAAS,UAAU,KAAa,SAAoC;AACzE,MAAI,CAAC,OAAO,IAAI,KAAK,EAAE,WAAW,EAAG,QAAO;AAC5C,QAAM,WAAW,gBAAgB,GAAG;AACpC,MAAI;AACJ,MAAI;AACF,KAAC,EAAE,UAAU,IAAI,IAAI,UAAU,QAAQ;AAAA,EACzC,SAAS,KAAK;AACZ,QAAI,KAAK,yBAAyB;AAAA,MAChC;AAAA,MACA,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,IACxD,CAAC;AACD,WAAO;AAAA,EACT;AAGA,QAAM,MAAM,SAAS,KAAK,OAAO;AACjC,MAAI,IAAK,QAAO;AAEhB,QAAM,OAAO,UAAU,KAAK,OAAO;AACnC,MAAI,KAAM,QAAO;AAGjB,MAAI,IAAI,cAAc,KAAK,KAAK,IAAI,cAAc,SAAS,KAAK,IAAI,cAAc,MAAM,GAAG;AACzF,UAAM,SAAS,CAAC,CAAC,IAAI,cAAc,MAAM;AACzC,WAAO;AAAA,MACL;AAAA,MACA,WAAW,OAAO,IAAI,cAAc,SAAS,iBAAiB,iBAAiB,CAAC,KAAK;AAAA,MACrF,OAAO,CAAC;AAAA,IACV;AAAA,EACF;AAEA,SAAO;AACT;","names":[]}
|
|
@@ -0,0 +1,22 @@
|
|
|
1
|
+
import { type FeedConfig } from './feed-config.js';
|
|
2
|
+
/**
 * Outcome of polling one feed.
 *
 * - `feedUrl`: the URL of the feed that was polled.
 * - `ok`: true when the feed was fetched, parsed and stored; false on an HTTP
 *   error status, a parse failure, or a thrown error.
 * - `itemsAdded`: number of items newly inserted into the store (0 on failure).
 * - `error`: short failure description (e.g. `HTTP 503`, `parse failed`, or an
 *   exception message); only set when `ok` is false.
 */
export interface PollResult {
|
|
3
|
+
feedUrl: string;
|
|
4
|
+
ok: boolean;
|
|
5
|
+
itemsAdded: number;
|
|
6
|
+
error?: string;
|
|
7
|
+
}
|
|
8
|
+
/**
 * Handle returned by `pollFeedsForever`.
 *
 * - `stop()`: cancels the repeating poll timer and flips `running` to false.
 * - `running`: true from creation until `stop()` has been called.
 */
export interface PollerHandle {
|
|
9
|
+
stop(): void;
|
|
10
|
+
readonly running: boolean;
|
|
11
|
+
}
|
|
12
|
+
/**
 * Polls every configured feed once, concurrently, and stores new items.
 *
 * @param opts.feeds - Feeds to poll; defaults to the feeds from `loadFeedConfig()`.
 * @param opts.fetchImpl - Fetch implementation to use; defaults to the global `fetch`.
 * @param opts.timeoutMs - Per-feed request timeout in milliseconds; defaults to 10000.
 * @returns One `PollResult` per feed, in the same order as the feeds; an empty
 *   array when there are no feeds. Per-feed failures are reported in the
 *   results rather than thrown.
 */
export declare function pollFeedsOnce(opts?: {
|
|
13
|
+
feeds?: FeedConfig[];
|
|
14
|
+
fetchImpl?: typeof fetch;
|
|
15
|
+
timeoutMs?: number;
|
|
16
|
+
}): Promise<PollResult[]>;
|
|
17
|
+
/**
 * Starts a repeating timer that runs `pollFeedsOnce` on every tick.
 *
 * The first poll happens after one interval has elapsed, not immediately.
 *
 * @param opts.intervalSec - Seconds between polls; defaults to 300.
 * @param opts.feeds - Forwarded to `pollFeedsOnce` when provided.
 * @param opts.fetchImpl - Forwarded to `pollFeedsOnce` when provided.
 * @returns A handle whose `stop()` cancels the timer.
 */
export declare function pollFeedsForever(opts?: {
|
|
18
|
+
intervalSec?: number;
|
|
19
|
+
feeds?: FeedConfig[];
|
|
20
|
+
fetchImpl?: typeof fetch;
|
|
21
|
+
}): PollerHandle;
|
|
22
|
+
//# sourceMappingURL=feed-poller.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"feed-poller.d.ts","sourceRoot":"","sources":["../../../../src/search/v1/rss/feed-poller.ts"],"names":[],"mappings":"AAAA,OAAO,EAAkB,KAAK,UAAU,EAAE,MAAM,kBAAkB,CAAC;AAOnE,MAAM,WAAW,UAAU;IACzB,OAAO,EAAE,MAAM,CAAC;IAChB,EAAE,EAAE,OAAO,CAAC;IACZ,UAAU,EAAE,MAAM,CAAC;IACnB,KAAK,CAAC,EAAE,MAAM,CAAC;CAChB;AAED,MAAM,WAAW,YAAY;IAC3B,IAAI,IAAI,IAAI,CAAC;IACb,QAAQ,CAAC,OAAO,EAAE,OAAO,CAAC;CAC3B;AA+CD,wBAAsB,aAAa,CAAC,IAAI,GAAE;IACxC,KAAK,CAAC,EAAE,UAAU,EAAE,CAAC;IACrB,SAAS,CAAC,EAAE,OAAO,KAAK,CAAC;IACzB,SAAS,CAAC,EAAE,MAAM,CAAC;CACf,GAAG,OAAO,CAAC,UAAU,EAAE,CAAC,CAiC7B;AAED,wBAAgB,gBAAgB,CAAC,IAAI,GAAE;IACrC,WAAW,CAAC,EAAE,MAAM,CAAC;IACrB,KAAK,CAAC,EAAE,UAAU,EAAE,CAAC;IACrB,SAAS,CAAC,EAAE,OAAO,KAAK,CAAC;CACrB,GAAG,YAAY,CAyBpB"}
|
|
@@ -0,0 +1,102 @@
|
|
|
1
|
+
import { loadFeedConfig } from "./feed-config.js";
|
|
2
|
+
import { parseFeed } from "./feed-parser.js";
|
|
3
|
+
import { upsertFeedItems } from "./feed-store.js";
|
|
4
|
+
import { createLogger } from "../../../logger.js";
|
|
5
|
+
// Module logger plus polling defaults: DEFAULT_TIMEOUT_MS is the per-feed
// request timeout in milliseconds (10 s); DEFAULT_INTERVAL_SEC is the number
// of seconds between scheduled polls (5 min).
const log = createLogger("search");
|
|
6
|
+
const DEFAULT_TIMEOUT_MS = 1e4;
|
|
7
|
+
const DEFAULT_INTERVAL_SEC = 300;
|
|
8
|
+
/**
 * Fetch one feed, parse it, and store its items.
 *
 * Never rejects: every failure (HTTP error status, unparseable body, network
 * error, timeout, storage error) is reported through the returned result.
 *
 * @param feed - Feed descriptor; `feed.url` is fetched and `feed.category`
 *   (default "news") is attached to every stored item.
 * @param fetchImpl - Fetch-compatible function used to perform the request.
 * @param timeoutMs - Abort the request after this many milliseconds.
 * @returns `{ feedUrl, ok, itemsAdded, error? }` for this feed.
 */
async function pollOne(feed, fetchImpl, timeoutMs) {
  try {
    const res = await fetchImpl(feed.url, {
      signal: AbortSignal.timeout(timeoutMs),
      headers: { Accept: "application/rss+xml, application/atom+xml, application/xml, text/xml" }
    });
    if (!res.ok) {
      // The error body is never read. Cancel it so the underlying connection
      // is released right away instead of lingering until garbage collection.
      try {
        await res.body?.cancel();
      } catch {
        // Best-effort cleanup; the HTTP status is what gets reported.
      }
      return { feedUrl: feed.url, ok: false, itemsAdded: 0, error: `HTTP ${res.status}` };
    }
    const xml = await res.text();
    const parsed = parseFeed(xml, feed.url);
    if (!parsed) {
      return { feedUrl: feed.url, ok: false, itemsAdded: 0, error: "parse failed" };
    }
    const category = feed.category ?? "news";
    const itemsAdded = upsertFeedItems(
      parsed.items.map((it) => ({
        feedUrl: feed.url,
        guid: it.guid,
        title: it.title,
        link: it.link,
        summary: it.summary,
        // Only carry the date over when the parser produced one.
        ...it.publishedDate ? { publishedDate: it.publishedDate } : {},
        category
      }))
    );
    return { feedUrl: feed.url, ok: true, itemsAdded };
  } catch (err) {
    return {
      feedUrl: feed.url,
      ok: false,
      itemsAdded: 0,
      error: err instanceof Error ? err.message : String(err)
    };
  }
}
|
|
44
|
+
/**
 * Poll every feed once, in parallel, and summarise the outcome.
 *
 * @param opts.feeds - Feeds to poll (default: `loadFeedConfig().feeds`).
 * @param opts.fetchImpl - Fetch implementation (default: global `fetch`).
 * @param opts.timeoutMs - Per-feed timeout in ms (default: DEFAULT_TIMEOUT_MS).
 * @returns One result per feed, in feed order; `[]` when there are no feeds.
 */
async function pollFeedsOnce(opts = {}) {
  const feeds = opts.feeds ?? loadFeedConfig().feeds;
  if (feeds.length === 0) {
    return [];
  }
  const fetchImpl = opts.fetchImpl ?? fetch;
  const timeoutMs = opts.timeoutMs ?? DEFAULT_TIMEOUT_MS;

  const outcomes = await Promise.allSettled(
    feeds.map((feed) => pollOne(feed, fetchImpl, timeoutMs))
  );

  // Convert any rejection into the same result shape as a normal failure.
  const results = outcomes.map((outcome, index) => {
    if (outcome.status === "fulfilled") {
      return outcome.value;
    }
    return {
      feedUrl: feeds[index].url,
      ok: false,
      itemsAdded: 0,
      error: outcome.reason instanceof Error ? outcome.reason.message : String(outcome.reason)
    };
  });

  let okCount = 0;
  let totalAdded = 0;
  for (const result of results) {
    if (result.ok) okCount += 1;
    totalAdded = totalAdded + result.itemsAdded;
  }
  log.info("feed poll complete", {
    feeds: feeds.length,
    ok: okCount,
    itemsAdded: totalAdded
  });
  return results;
}
|
|
74
|
+
/**
 * Start polling all feeds on a fixed interval.
 *
 * The first poll runs after one interval has elapsed. Errors escaping a
 * scheduled poll are logged and do not stop the schedule.
 *
 * @param opts.intervalSec - Seconds between polls (default:
 *   DEFAULT_INTERVAL_SEC). Fractions are allowed; the resulting delay is
 *   clamped to the range Node timers support (1 ms to 2^31-1 ms). A value
 *   that is not a number falls back to the default.
 * @param opts.feeds - Forwarded to `pollFeedsOnce` when provided.
 * @param opts.fetchImpl - Forwarded to `pollFeedsOnce` when provided.
 * @returns Handle with `stop()` (cancels the timer) and a `running` flag.
 */
function pollFeedsForever(opts = {}) {
  // Node coerces a timer delay that is NaN, below 1, or above 2^31-1 ms to
  // 1 ms. Without clamping, a very large or invalid interval would turn into
  // a poll every millisecond.
  const MAX_TIMER_DELAY_MS = 2147483647;
  const intervalSec = opts.intervalSec ?? DEFAULT_INTERVAL_SEC;
  const requestedMs = Math.floor(intervalSec * 1e3);
  const intervalMs = Number.isNaN(requestedMs)
    ? DEFAULT_INTERVAL_SEC * 1e3
    : Math.min(MAX_TIMER_DELAY_MS, Math.max(1, requestedMs));
  const state = { running: true };
  const handle = setInterval(() => {
    // Fire-and-forget: a failed poll must not break the schedule.
    void pollFeedsOnce({
      ...opts.feeds ? { feeds: opts.feeds } : {},
      ...opts.fetchImpl ? { fetchImpl: opts.fetchImpl } : {}
    }).catch((err) => {
      log.warn("scheduled poll threw", {
        error: err instanceof Error ? err.message : String(err)
      });
    });
  }, intervalMs);
  return {
    stop() {
      clearInterval(handle);
      state.running = false;
    },
    get running() {
      return state.running;
    }
  };
}
|
|
98
|
+
export {
|
|
99
|
+
pollFeedsForever,
|
|
100
|
+
pollFeedsOnce
|
|
101
|
+
};
|
|
102
|
+
//# sourceMappingURL=feed-poller.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../../../src/search/v1/rss/feed-poller.ts"],"sourcesContent":["import { loadFeedConfig, type FeedConfig } from './feed-config.js';\nimport { parseFeed } from './feed-parser.js';\nimport { upsertFeedItems } from './feed-store.js';\nimport { createLogger } from '../../../logger.js';\n\nconst log = createLogger('search');\n\nexport interface PollResult {\n feedUrl: string;\n ok: boolean;\n itemsAdded: number;\n error?: string;\n}\n\nexport interface PollerHandle {\n stop(): void;\n readonly running: boolean;\n}\n\nconst DEFAULT_TIMEOUT_MS = 10_000;\nconst DEFAULT_INTERVAL_SEC = 300;\n\nasync function pollOne(\n feed: FeedConfig,\n fetchImpl: typeof fetch,\n timeoutMs: number,\n): Promise<PollResult> {\n try {\n const res = await fetchImpl(feed.url, {\n signal: AbortSignal.timeout(timeoutMs),\n headers: { Accept: 'application/rss+xml, application/atom+xml, application/xml, text/xml' },\n });\n if (!res.ok) {\n return { feedUrl: feed.url, ok: false, itemsAdded: 0, error: `HTTP ${res.status}` };\n }\n const xml = await res.text();\n const parsed = parseFeed(xml, feed.url);\n if (!parsed) {\n return { feedUrl: feed.url, ok: false, itemsAdded: 0, error: 'parse failed' };\n }\n\n const category = feed.category ?? 'news';\n const itemsAdded = upsertFeedItems(\n parsed.items.map((it) => ({\n feedUrl: feed.url,\n guid: it.guid,\n title: it.title,\n link: it.link,\n summary: it.summary,\n ...(it.publishedDate ? { publishedDate: it.publishedDate } : {}),\n category,\n })),\n );\n return { feedUrl: feed.url, ok: true, itemsAdded };\n } catch (err) {\n return {\n feedUrl: feed.url,\n ok: false,\n itemsAdded: 0,\n error: err instanceof Error ? err.message : String(err),\n };\n }\n}\n\nexport async function pollFeedsOnce(opts: {\n feeds?: FeedConfig[];\n fetchImpl?: typeof fetch;\n timeoutMs?: number;\n} = {}): Promise<PollResult[]> {\n const feeds = opts.feeds ?? 
loadFeedConfig().feeds;\n if (feeds.length === 0) return [];\n\n const fetchImpl = opts.fetchImpl ?? fetch;\n const timeoutMs = opts.timeoutMs ?? DEFAULT_TIMEOUT_MS;\n\n const settled = await Promise.allSettled(\n feeds.map((f) => pollOne(f, fetchImpl, timeoutMs)),\n );\n\n const results: PollResult[] = [];\n for (let i = 0; i < settled.length; i++) {\n const r = settled[i];\n if (r.status === 'fulfilled') {\n results.push(r.value);\n } else {\n results.push({\n feedUrl: feeds[i].url,\n ok: false,\n itemsAdded: 0,\n error: r.reason instanceof Error ? r.reason.message : String(r.reason),\n });\n }\n }\n\n const totalAdded = results.reduce((acc, r) => acc + r.itemsAdded, 0);\n log.info('feed poll complete', {\n feeds: feeds.length,\n ok: results.filter((r) => r.ok).length,\n itemsAdded: totalAdded,\n });\n return results;\n}\n\nexport function pollFeedsForever(opts: {\n intervalSec?: number;\n feeds?: FeedConfig[];\n fetchImpl?: typeof fetch;\n} = {}): PollerHandle {\n const intervalSec = opts.intervalSec ?? DEFAULT_INTERVAL_SEC;\n const intervalMs = Math.max(1, Math.floor(intervalSec * 1000));\n\n const state = { running: true };\n const handle = setInterval(() => {\n void pollFeedsOnce({\n ...(opts.feeds ? { feeds: opts.feeds } : {}),\n ...(opts.fetchImpl ? { fetchImpl: opts.fetchImpl } : {}),\n }).catch((err) => {\n log.warn('scheduled poll threw', {\n error: err instanceof Error ? 
err.message : String(err),\n });\n });\n }, intervalMs);\n\n return {\n stop() {\n clearInterval(handle);\n state.running = false;\n },\n get running() {\n return state.running;\n },\n };\n}\n"],"mappings":"AAAA,SAAS,sBAAuC;AAChD,SAAS,iBAAiB;AAC1B,SAAS,uBAAuB;AAChC,SAAS,oBAAoB;AAE7B,MAAM,MAAM,aAAa,QAAQ;AAcjC,MAAM,qBAAqB;AAC3B,MAAM,uBAAuB;AAE7B,eAAe,QACb,MACA,WACA,WACqB;AACrB,MAAI;AACF,UAAM,MAAM,MAAM,UAAU,KAAK,KAAK;AAAA,MACpC,QAAQ,YAAY,QAAQ,SAAS;AAAA,MACrC,SAAS,EAAE,QAAQ,uEAAuE;AAAA,IAC5F,CAAC;AACD,QAAI,CAAC,IAAI,IAAI;AACX,aAAO,EAAE,SAAS,KAAK,KAAK,IAAI,OAAO,YAAY,GAAG,OAAO,QAAQ,IAAI,MAAM,GAAG;AAAA,IACpF;AACA,UAAM,MAAM,MAAM,IAAI,KAAK;AAC3B,UAAM,SAAS,UAAU,KAAK,KAAK,GAAG;AACtC,QAAI,CAAC,QAAQ;AACX,aAAO,EAAE,SAAS,KAAK,KAAK,IAAI,OAAO,YAAY,GAAG,OAAO,eAAe;AAAA,IAC9E;AAEA,UAAM,WAAW,KAAK,YAAY;AAClC,UAAM,aAAa;AAAA,MACjB,OAAO,MAAM,IAAI,CAAC,QAAQ;AAAA,QACxB,SAAS,KAAK;AAAA,QACd,MAAM,GAAG;AAAA,QACT,OAAO,GAAG;AAAA,QACV,MAAM,GAAG;AAAA,QACT,SAAS,GAAG;AAAA,QACZ,GAAI,GAAG,gBAAgB,EAAE,eAAe,GAAG,cAAc,IAAI,CAAC;AAAA,QAC9D;AAAA,MACF,EAAE;AAAA,IACJ;AACA,WAAO,EAAE,SAAS,KAAK,KAAK,IAAI,MAAM,WAAW;AAAA,EACnD,SAAS,KAAK;AACZ,WAAO;AAAA,MACL,SAAS,KAAK;AAAA,MACd,IAAI;AAAA,MACJ,YAAY;AAAA,MACZ,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,IACxD;AAAA,EACF;AACF;AAEA,eAAsB,cAAc,OAIhC,CAAC,GAA0B;AAC7B,QAAM,QAAQ,KAAK,SAAS,eAAe,EAAE;AAC7C,MAAI,MAAM,WAAW,EAAG,QAAO,CAAC;AAEhC,QAAM,YAAY,KAAK,aAAa;AACpC,QAAM,YAAY,KAAK,aAAa;AAEpC,QAAM,UAAU,MAAM,QAAQ;AAAA,IAC5B,MAAM,IAAI,CAAC,MAAM,QAAQ,GAAG,WAAW,SAAS,CAAC;AAAA,EACnD;AAEA,QAAM,UAAwB,CAAC;AAC/B,WAAS,IAAI,GAAG,IAAI,QAAQ,QAAQ,KAAK;AACvC,UAAM,IAAI,QAAQ,CAAC;AACnB,QAAI,EAAE,WAAW,aAAa;AAC5B,cAAQ,KAAK,EAAE,KAAK;AAAA,IACtB,OAAO;AACL,cAAQ,KAAK;AAAA,QACX,SAAS,MAAM,CAAC,EAAE;AAAA,QAClB,IAAI;AAAA,QACJ,YAAY;AAAA,QACZ,OAAO,EAAE,kBAAkB,QAAQ,EAAE,OAAO,UAAU,OAAO,EAAE,MAAM;AAAA,MACvE,CAAC;AAAA,IACH;AAAA,EACF;AAEA,QAAM,aAAa,QAAQ,OAAO,CAAC,KAAK,MAAM,MAAM,EAAE,YAAY,CAAC;AACnE,MAAI,KAAK,sBAAsB;AAAA,IAC7B,OAAO,MAAM;AAAA,IACb,IAAI,QAAQ,OAAO,CAAC,MAAM,EAAE,EAAE,EAAE;AAAA,IAChC,YAAY;AAAA,EACd,CAAC;
AACD,SAAO;AACT;AAEO,SAAS,iBAAiB,OAI7B,CAAC,GAAiB;AACpB,QAAM,cAAc,KAAK,eAAe;AACxC,QAAM,aAAa,KAAK,IAAI,GAAG,KAAK,MAAM,cAAc,GAAI,CAAC;AAE7D,QAAM,QAAQ,EAAE,SAAS,KAAK;AAC9B,QAAM,SAAS,YAAY,MAAM;AAC/B,SAAK,cAAc;AAAA,MACjB,GAAI,KAAK,QAAQ,EAAE,OAAO,KAAK,MAAM,IAAI,CAAC;AAAA,MAC1C,GAAI,KAAK,YAAY,EAAE,WAAW,KAAK,UAAU,IAAI,CAAC;AAAA,IACxD,CAAC,EAAE,MAAM,CAAC,QAAQ;AAChB,UAAI,KAAK,wBAAwB;AAAA,QAC/B,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,MACxD,CAAC;AAAA,IACH,CAAC;AAAA,EACH,GAAG,UAAU;AAEb,SAAO;AAAA,IACL,OAAO;AACL,oBAAc,MAAM;AACpB,YAAM,UAAU;AAAA,IAClB;AAAA,IACA,IAAI,UAAU;AACZ,aAAO,MAAM;AAAA,IACf;AAAA,EACF;AACF;","names":[]}
|
|
@@ -0,0 +1,30 @@
|
|
|
1
|
+
/**
 * A feed item as read back from the `feed_items` table.
 *
 * - `id`: row id in `feed_items`.
 * - `feedUrl`: URL of the feed the item came from.
 * - `guid`, `title`, `link`, `summary`: values stored for the item.
 * - `publishedDate`: publication date string; omitted when the stored value
 *   is null or empty.
 * - `category`: category recorded at insert time ("news" when none was given).
 * - `fetchedAt`: ISO-8601 timestamp taken when the item was inserted.
 */
export interface FeedStoreItem {
|
|
2
|
+
id: number;
|
|
3
|
+
feedUrl: string;
|
|
4
|
+
guid: string;
|
|
5
|
+
title: string;
|
|
6
|
+
link: string;
|
|
7
|
+
summary: string;
|
|
8
|
+
publishedDate?: string;
|
|
9
|
+
category: string;
|
|
10
|
+
fetchedAt: string;
|
|
11
|
+
}
|
|
12
|
+
/**
 * Optional filters for `queryFeedStore`.
 *
 * - `maxResults`: row limit; defaults to 10.
 * - `fromDate` / `toDate`: inclusive lower / upper bound compared against the
 *   stored `published_date` value.
 * - `category`: exact-match filter on the item's category.
 */
export interface FeedStoreQueryOptions {
|
|
13
|
+
maxResults?: number;
|
|
14
|
+
fromDate?: string;
|
|
15
|
+
toDate?: string;
|
|
16
|
+
category?: string;
|
|
17
|
+
}
|
|
18
|
+
/**
 * Inserts feed items into `feed_items` inside a single transaction.
 *
 * Uses `INSERT OR IGNORE`, so rows the database ignores (presumably
 * duplicates under a uniqueness constraint defined elsewhere; confirm against
 * the schema) are left untouched rather than updated. `category` defaults to
 * "news".
 *
 * @returns The number of rows actually inserted; 0 for an empty input.
 * @throws Rethrows any database error after logging it.
 */
export declare function upsertFeedItems(items: Array<{
|
|
19
|
+
feedUrl: string;
|
|
20
|
+
guid: string;
|
|
21
|
+
title: string;
|
|
22
|
+
link: string;
|
|
23
|
+
summary: string;
|
|
24
|
+
publishedDate?: string;
|
|
25
|
+
category?: string;
|
|
26
|
+
}>): number;
|
|
27
|
+
/**
 * Full-text searches stored feed items (FTS `MATCH`, ordered by `bm25`).
 * Returns an empty array when the query has no usable tokens or the query fails.
 */
export declare function queryFeedStore(query: string, options?: FeedStoreQueryOptions): FeedStoreItem[];
|
|
28
|
+
/** Returns the number of rows in `feed_items`, or 0 if the count cannot be read. */
export declare function countFeedItems(): number;
|
|
29
|
+
/** Test helper: deletes all rows from `feed_items` and rebuilds the FTS index; errors are ignored. */
export declare function _clearFeedStoreForTest(): void;
|
|
30
|
+
//# sourceMappingURL=feed-store.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"feed-store.d.ts","sourceRoot":"","sources":["../../../../src/search/v1/rss/feed-store.ts"],"names":[],"mappings":"AAMA,MAAM,WAAW,aAAa;IAC5B,EAAE,EAAE,MAAM,CAAC;IACX,OAAO,EAAE,MAAM,CAAC;IAChB,IAAI,EAAE,MAAM,CAAC;IACb,KAAK,EAAE,MAAM,CAAC;IACd,IAAI,EAAE,MAAM,CAAC;IACb,OAAO,EAAE,MAAM,CAAC;IAChB,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,QAAQ,EAAE,MAAM,CAAC;IACjB,SAAS,EAAE,MAAM,CAAC;CACnB;AAED,MAAM,WAAW,qBAAqB;IACpC,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,QAAQ,CAAC,EAAE,MAAM,CAAC;CACnB;AA0CD,wBAAgB,eAAe,CAAC,KAAK,EAAE,KAAK,CAAC;IAC3C,OAAO,EAAE,MAAM,CAAC;IAAC,IAAI,EAAE,MAAM,CAAC;IAAC,KAAK,EAAE,MAAM,CAAC;IAAC,IAAI,EAAE,MAAM,CAAC;IAC3D,OAAO,EAAE,MAAM,CAAC;IAAC,aAAa,CAAC,EAAE,MAAM,CAAC;IAAC,QAAQ,CAAC,EAAE,MAAM,CAAC;CAC5D,CAAC,GAAG,MAAM,CA6BV;AA6BD,wBAAgB,cAAc,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,GAAE,qBAA0B,GAAG,aAAa,EAAE,CA2ClG;AAED,wBAAgB,cAAc,IAAI,MAAM,CASvC;AAED,wBAAgB,sBAAsB,IAAI,IAAI,CAQ7C"}
|
|
@@ -0,0 +1,134 @@
|
|
|
1
|
+
import { getDatabase } from "../../../cache/db.js";
|
|
2
|
+
import { createLogger } from "../../../logger.js";
|
|
3
|
+
// Module logger plus a one-entry cache: the database handle the prepared
// statements belong to (cachedDb) and the statements themselves (cachedStmts).
const log = createLogger("search");
|
|
4
|
+
let cachedDb = null;
|
|
5
|
+
let cachedStmts = null;
|
|
6
|
+
/**
 * Return the current database handle together with prepared statements for it.
 *
 * Statements are prepared once per database handle and re-prepared whenever
 * `getDatabase()` returns a different handle.
 *
 * @returns `{ db, s }` where `s` holds the `insert`, `count`, `clear` and
 *   `clearFts` prepared statements.
 * @throws Whatever `db.prepare` throws (e.g. when a table is missing). The
 *   cache is left untouched in that case, so the next call tries again.
 */
function stmts() {
  const db = getDatabase();
  if (cachedDb !== db) {
    // Prepare everything first and only then commit to the cache. If a
    // prepare throws, cachedDb must not already point at this handle, or
    // later calls would skip preparation and hand back null/stale statements.
    const prepared = {
      insert: db.prepare(
        `INSERT OR IGNORE INTO feed_items
(feed_url, guid, title, link, summary, published_date, category, fetched_at)
VALUES (?, ?, ?, ?, ?, ?, ?, ?)`
      ),
      count: db.prepare("SELECT COUNT(*) AS n FROM feed_items"),
      clear: db.prepare("DELETE FROM feed_items"),
      clearFts: db.prepare("INSERT INTO feed_items_fts(feed_items_fts) VALUES('rebuild')")
    };
    cachedStmts = prepared;
    cachedDb = db;
  }
  return { db, s: cachedStmts };
}
|
|
23
|
+
/**
 * Turn free-form user text into a safe FTS match expression.
 *
 * The text is split on whitespace, double quotes are stripped from every
 * token, empty tokens are dropped, and each remaining token is wrapped in
 * double quotes so FTS operator characters are treated literally.
 *
 * @param query - Raw user query.
 * @returns Space-separated quoted tokens, or "" when nothing usable remains.
 */
function sanitizeFtsQuery(query) {
  const quoted = [];
  for (const piece of query.split(/\s+/)) {
    const bare = piece.trim().replace(/"/g, "");
    if (bare.length === 0) {
      continue;
    }
    quoted.push(`"${bare}"`);
  }
  return quoted.join(" ");
}
|
|
27
|
+
/**
 * Insert feed items in one transaction and report how many were new.
 *
 * @param items - Items to store; `publishedDate` defaults to null and
 *   `category` to "news".
 * @returns Number of rows the insert statement actually changed.
 * @throws Rethrows any error raised by the transaction after logging it.
 */
function upsertFeedItems(items) {
  if (items.length === 0) {
    return 0;
  }
  const { db, s: prepared } = stmts();
  // One timestamp for the whole batch.
  const fetchedAt = (/* @__PURE__ */ new Date()).toISOString();
  let insertedCount = 0;
  const insertAll = db.transaction(() => {
    for (const item of items) {
      const outcome = prepared.insert.run(
        item.feedUrl,
        item.guid,
        item.title,
        item.link,
        item.summary,
        item.publishedDate ?? null,
        item.category ?? "news",
        fetchedAt
      );
      // INSERT OR IGNORE reports zero changes for a row it skipped.
      if (outcome.changes > 0) {
        insertedCount += 1;
      }
    }
  });
  try {
    insertAll();
  } catch (err) {
    log.error("feed_items upsert failed", {
      error: err instanceof Error ? err.message : String(err)
    });
    throw err;
  }
  return insertedCount;
}
|
|
57
|
+
/**
 * Convert a raw `feed_items` row (snake_case columns) into the camelCase
 * item shape returned to callers.
 *
 * @param r - Row as returned by the database driver.
 * @returns The item; `publishedDate` is present only when the row has a
 *   non-empty `published_date`.
 */
function rowToItem(r) {
  const base = {
    id: r.id,
    feedUrl: r.feed_url,
    guid: r.guid,
    title: r.title,
    link: r.link,
    summary: r.summary,
    category: r.category,
    fetchedAt: r.fetched_at
  };
  return r.published_date ? { ...base, publishedDate: r.published_date } : base;
}
|
|
71
|
+
/**
 * Full-text search over stored feed items.
 *
 * @param query - Free-form text; sanitized into quoted FTS tokens.
 * @param options.maxResults - Row limit (default 10).
 * @param options.fromDate - Keep items with `published_date >=` this value.
 * @param options.toDate - Keep items with `published_date <=` this value.
 * @param options.category - Keep items whose category equals this value.
 * @returns Matching items ordered by `bm25`; `[]` when the sanitized query is
 *   empty or the database query fails (the failure is logged).
 */
function queryFeedStore(query, options = {}) {
  const { db } = stmts();
  const limit = options.maxResults ?? 10;
  const matchExpr = sanitizeFtsQuery(query);
  if (!matchExpr) {
    return [];
  }

  // Each active filter contributes one SQL clause and one bound value.
  const activeFilters = [
    ["feed_items.published_date >= ?", options.fromDate],
    ["feed_items.published_date <= ?", options.toDate],
    ["feed_items.category = ?", options.category]
  ].filter((entry) => entry[1]);
  const where = activeFilters.map((entry) => " AND " + entry[0]).join("");
  const params = [matchExpr, ...activeFilters.map((entry) => entry[1]), limit];

  const sql = `
SELECT feed_items.*
FROM feed_items_fts
JOIN feed_items ON feed_items.id = feed_items_fts.rowid
WHERE feed_items_fts MATCH ?${where}
ORDER BY bm25(feed_items_fts)
LIMIT ?
`;
  try {
    return db.prepare(sql).all(...params).map(rowToItem);
  } catch (err) {
    log.warn("feed_items_fts query failed", {
      query,
      error: err instanceof Error ? err.message : String(err)
    });
    return [];
  }
}
|
|
111
|
+
/**
 * Count the rows currently stored in `feed_items`.
 *
 * @returns The row count, or 0 when the count cannot be obtained (any error
 *   is swallowed and treated as an empty store).
 */
function countFeedItems() {
  let row;
  try {
    const prepared = stmts().s;
    row = prepared.count.get();
  } catch {
    return 0;
  }
  return row?.n ?? 0;
}
|
|
120
|
+
/**
 * Test helper: delete every stored feed item, then rebuild the FTS index.
 * Any error is deliberately ignored.
 */
function _clearFeedStoreForTest() {
  try {
    const prepared = stmts().s;
    prepared.clear.run();
    prepared.clearFts.run();
  } catch {
    // Intentionally ignored.
  }
}
|
|
128
|
+
export {
|
|
129
|
+
_clearFeedStoreForTest,
|
|
130
|
+
countFeedItems,
|
|
131
|
+
queryFeedStore,
|
|
132
|
+
upsertFeedItems
|
|
133
|
+
};
|
|
134
|
+
//# sourceMappingURL=feed-store.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../../../src/search/v1/rss/feed-store.ts"],"sourcesContent":["import type Database from 'better-sqlite3';\nimport { getDatabase } from '../../../cache/db.js';\nimport { createLogger } from '../../../logger.js';\n\nconst log = createLogger('search');\n\nexport interface FeedStoreItem {\n id: number;\n feedUrl: string;\n guid: string;\n title: string;\n link: string;\n summary: string;\n publishedDate?: string;\n category: string;\n fetchedAt: string;\n}\n\nexport interface FeedStoreQueryOptions {\n maxResults?: number;\n fromDate?: string;\n toDate?: string;\n category?: string;\n}\n\ninterface Stmts {\n insert: Database.Statement;\n count: Database.Statement;\n clear: Database.Statement;\n clearFts: Database.Statement;\n}\n\nlet cachedDb: Database.Database | null = null;\nlet cachedStmts: Stmts | null = null;\n\nfunction stmts(): { db: Database.Database; s: Stmts } {\n const db = getDatabase();\n if (cachedDb !== db) {\n cachedDb = db;\n cachedStmts = {\n insert: db.prepare(\n `INSERT OR IGNORE INTO feed_items\n (feed_url, guid, title, link, summary, published_date, category, fetched_at)\n VALUES (?, ?, ?, ?, ?, ?, ?, ?)`,\n ),\n count: db.prepare('SELECT COUNT(*) AS n FROM feed_items'),\n clear: db.prepare('DELETE FROM feed_items'),\n clearFts: db.prepare(\"INSERT INTO feed_items_fts(feed_items_fts) VALUES('rebuild')\"),\n };\n }\n return { db, s: cachedStmts! 
};\n}\n\n// FTS5 reserves characters; quote each token to be safe.\nfunction sanitizeFtsQuery(query: string): string {\n const tokens = query\n .split(/\\s+/)\n .map((t) => t.trim())\n .filter((t) => t.length > 0)\n .map((t) => t.replace(/\"/g, ''))\n .filter((t) => t.length > 0)\n .map((t) => `\"${t}\"`);\n return tokens.join(' ');\n}\n\nexport function upsertFeedItems(items: Array<{\n feedUrl: string; guid: string; title: string; link: string;\n summary: string; publishedDate?: string; category?: string;\n}>): number {\n if (items.length === 0) return 0;\n const { db, s } = stmts();\n const now = new Date().toISOString();\n let added = 0;\n const tx = db.transaction(() => {\n for (const it of items) {\n const res = s.insert.run(\n it.feedUrl,\n it.guid,\n it.title,\n it.link,\n it.summary,\n it.publishedDate ?? null,\n it.category ?? 'news',\n now,\n );\n if (res.changes > 0) added += 1;\n }\n });\n try {\n tx();\n } catch (err) {\n log.error('feed_items upsert failed', {\n error: err instanceof Error ? err.message : String(err),\n });\n throw err;\n }\n return added;\n}\n\ninterface RawRow {\n id: number;\n feed_url: string;\n guid: string;\n title: string;\n link: string;\n summary: string;\n published_date: string | null;\n category: string;\n fetched_at: string;\n}\n\nfunction rowToItem(r: RawRow): FeedStoreItem {\n const item: FeedStoreItem = {\n id: r.id,\n feedUrl: r.feed_url,\n guid: r.guid,\n title: r.title,\n link: r.link,\n summary: r.summary,\n category: r.category,\n fetchedAt: r.fetched_at,\n };\n if (r.published_date) item.publishedDate = r.published_date;\n return item;\n}\n\nexport function queryFeedStore(query: string, options: FeedStoreQueryOptions = {}): FeedStoreItem[] {\n const { db } = stmts();\n const max = options.maxResults ?? 
10;\n const safe = sanitizeFtsQuery(query);\n if (!safe) return [];\n\n const clauses: string[] = [];\n const params: Array<string | number> = [safe];\n\n if (options.fromDate) {\n clauses.push('feed_items.published_date >= ?');\n params.push(options.fromDate);\n }\n if (options.toDate) {\n clauses.push('feed_items.published_date <= ?');\n params.push(options.toDate);\n }\n if (options.category) {\n clauses.push('feed_items.category = ?');\n params.push(options.category);\n }\n\n const where = clauses.length > 0 ? ' AND ' + clauses.join(' AND ') : '';\n params.push(max);\n\n const sql = `\n SELECT feed_items.*\n FROM feed_items_fts\n JOIN feed_items ON feed_items.id = feed_items_fts.rowid\n WHERE feed_items_fts MATCH ?${where}\n ORDER BY bm25(feed_items_fts)\n LIMIT ?\n `;\n try {\n const rows = db.prepare(sql).all(...params) as RawRow[];\n return rows.map(rowToItem);\n } catch (err) {\n log.warn('feed_items_fts query failed', {\n query,\n error: err instanceof Error ? err.message : String(err),\n });\n return [];\n }\n}\n\nexport function countFeedItems(): number {\n try {\n const { s } = stmts();\n const row = s.count.get() as { n: number } | undefined;\n return row?.n ?? 
0;\n } catch {\n // Table missing — treat as empty.\n return 0;\n }\n}\n\nexport function _clearFeedStoreForTest(): void {\n try {\n const { s } = stmts();\n s.clear.run();\n s.clearFts.run();\n } catch {\n // ignore — store may not be initialized in this test\n }\n}\n"],"mappings":"AACA,SAAS,mBAAmB;AAC5B,SAAS,oBAAoB;AAE7B,MAAM,MAAM,aAAa,QAAQ;AA4BjC,IAAI,WAAqC;AACzC,IAAI,cAA4B;AAEhC,SAAS,QAA6C;AACpD,QAAM,KAAK,YAAY;AACvB,MAAI,aAAa,IAAI;AACnB,eAAW;AACX,kBAAc;AAAA,MACZ,QAAQ,GAAG;AAAA,QACT;AAAA;AAAA;AAAA,MAGF;AAAA,MACA,OAAO,GAAG,QAAQ,sCAAsC;AAAA,MACxD,OAAO,GAAG,QAAQ,wBAAwB;AAAA,MAC1C,UAAU,GAAG,QAAQ,8DAA8D;AAAA,IACrF;AAAA,EACF;AACA,SAAO,EAAE,IAAI,GAAG,YAAa;AAC/B;AAGA,SAAS,iBAAiB,OAAuB;AAC/C,QAAM,SAAS,MACZ,MAAM,KAAK,EACX,IAAI,CAAC,MAAM,EAAE,KAAK,CAAC,EACnB,OAAO,CAAC,MAAM,EAAE,SAAS,CAAC,EAC1B,IAAI,CAAC,MAAM,EAAE,QAAQ,MAAM,EAAE,CAAC,EAC9B,OAAO,CAAC,MAAM,EAAE,SAAS,CAAC,EAC1B,IAAI,CAAC,MAAM,IAAI,CAAC,GAAG;AACtB,SAAO,OAAO,KAAK,GAAG;AACxB;AAEO,SAAS,gBAAgB,OAGpB;AACV,MAAI,MAAM,WAAW,EAAG,QAAO;AAC/B,QAAM,EAAE,IAAI,EAAE,IAAI,MAAM;AACxB,QAAM,OAAM,oBAAI,KAAK,GAAE,YAAY;AACnC,MAAI,QAAQ;AACZ,QAAM,KAAK,GAAG,YAAY,MAAM;AAC9B,eAAW,MAAM,OAAO;AACtB,YAAM,MAAM,EAAE,OAAO;AAAA,QACnB,GAAG;AAAA,QACH,GAAG;AAAA,QACH,GAAG;AAAA,QACH,GAAG;AAAA,QACH,GAAG;AAAA,QACH,GAAG,iBAAiB;AAAA,QACpB,GAAG,YAAY;AAAA,QACf;AAAA,MACF;AACA,UAAI,IAAI,UAAU,EAAG,UAAS;AAAA,IAChC;AAAA,EACF,CAAC;AACD,MAAI;AACF,OAAG;AAAA,EACL,SAAS,KAAK;AACZ,QAAI,MAAM,4BAA4B;AAAA,MACpC,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,IACxD,CAAC;AACD,UAAM;AAAA,EACR;AACA,SAAO;AACT;AAcA,SAAS,UAAU,GAA0B;AAC3C,QAAM,OAAsB;AAAA,IAC1B,IAAI,EAAE;AAAA,IACN,SAAS,EAAE;AAAA,IACX,MAAM,EAAE;AAAA,IACR,OAAO,EAAE;AAAA,IACT,MAAM,EAAE;AAAA,IACR,SAAS,EAAE;AAAA,IACX,UAAU,EAAE;AAAA,IACZ,WAAW,EAAE;AAAA,EACf;AACA,MAAI,EAAE,eAAgB,MAAK,gBAAgB,EAAE;AAC7C,SAAO;AACT;AAEO,SAAS,eAAe,OAAe,UAAiC,CAAC,GAAoB;AAClG,QAAM,EAAE,GAAG,IAAI,MAAM;AACrB,QAAM,MAAM,QAAQ,cAAc;AAClC,QAAM,OAAO,iBAAiB,KAAK;AACnC,MAAI,CAAC,KAAM,QAAO,CAAC;AAEnB,QAAM,UAAoB,CAAC;AAC3B,QAAM,SAAiC,CAAC,IAAI;AAE5C,MAAI,QAAQ,UAAU;
AACpB,YAAQ,KAAK,gCAAgC;AAC7C,WAAO,KAAK,QAAQ,QAAQ;AAAA,EAC9B;AACA,MAAI,QAAQ,QAAQ;AAClB,YAAQ,KAAK,gCAAgC;AAC7C,WAAO,KAAK,QAAQ,MAAM;AAAA,EAC5B;AACA,MAAI,QAAQ,UAAU;AACpB,YAAQ,KAAK,yBAAyB;AACtC,WAAO,KAAK,QAAQ,QAAQ;AAAA,EAC9B;AAEA,QAAM,QAAQ,QAAQ,SAAS,IAAI,UAAU,QAAQ,KAAK,OAAO,IAAI;AACrE,SAAO,KAAK,GAAG;AAEf,QAAM,MAAM;AAAA;AAAA;AAAA;AAAA,kCAIoB,KAAK;AAAA;AAAA;AAAA;AAIrC,MAAI;AACF,UAAM,OAAO,GAAG,QAAQ,GAAG,EAAE,IAAI,GAAG,MAAM;AAC1C,WAAO,KAAK,IAAI,SAAS;AAAA,EAC3B,SAAS,KAAK;AACZ,QAAI,KAAK,+BAA+B;AAAA,MACtC;AAAA,MACA,OAAO,eAAe,QAAQ,IAAI,UAAU,OAAO,GAAG;AAAA,IACxD,CAAC;AACD,WAAO,CAAC;AAAA,EACV;AACF;AAEO,SAAS,iBAAyB;AACvC,MAAI;AACF,UAAM,EAAE,EAAE,IAAI,MAAM;AACpB,UAAM,MAAM,EAAE,MAAM,IAAI;AACxB,WAAO,KAAK,KAAK;AAAA,EACnB,QAAQ;AAEN,WAAO;AAAA,EACT;AACF;AAEO,SAAS,yBAA+B;AAC7C,MAAI;AACF,UAAM,EAAE,EAAE,IAAI,MAAM;AACpB,MAAE,MAAM,IAAI;AACZ,MAAE,SAAS,IAAI;AAAA,EACjB,QAAQ;AAAA,EAER;AACF;","names":[]}
|
|
@@ -0,0 +1,6 @@
|
|
|
1
|
+
import type { SearchEngine, SearchEngineOptions, RawSearchResult } from '../../../types.js';
|
|
2
|
+
/**
 * Search engine backed by the locally stored feed items.
 *
 * `search` queries the feed store and maps each hit to a raw search result.
 */
export declare class RssFeedEngine implements SearchEngine {
|
|
3
|
+
name: string;
|
|
4
|
+
search(query: string, options?: SearchEngineOptions): Promise<RawSearchResult[]>;
|
|
5
|
+
}
|
|
6
|
+
//# sourceMappingURL=rss-engine.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"rss-engine.d.ts","sourceRoot":"","sources":["../../../../src/search/v1/rss/rss-engine.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,YAAY,EAAE,mBAAmB,EAAE,eAAe,EAAE,MAAM,mBAAmB,CAAC;AAK5F,qBAAa,aAAc,YAAW,YAAY;IAChD,IAAI,SAAc;IAEZ,MAAM,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,GAAE,mBAAwB,GAAG,OAAO,CAAC,eAAe,EAAE,CAAC;CAmB3F"}
|
|
@@ -0,0 +1,28 @@
|
|
|
1
|
+
import { queryFeedStore } from "./feed-store.js";
|
|
2
|
+
// Maximum length of the summary excerpt used as a result snippet.
const SNIPPET_LIMIT = 200;
|
|
3
|
+
/**
 * Search engine that answers queries from the local feed store.
 */
class RssFeedEngine {
  name = "rss-feed";

  /**
   * Look up stored feed items matching `query`.
   *
   * @param query - Free-form search text.
   * @param options - `maxResults` (default 10), `fromDate` and `toDate` are
   *   forwarded to the feed store.
   * @returns Results in store order. `relevance_score` starts at 1 for the
   *   first hit and decreases linearly with rank; `snippet` is the first
   *   SNIPPET_LIMIT characters of the summary.
   */
  async search(query, options = {}) {
    const storeOptions = Object.assign(
      { maxResults: options.maxResults ?? 10 },
      options.fromDate ? { fromDate: options.fromDate } : null,
      options.toDate ? { toDate: options.toDate } : null
    );
    const hits = queryFeedStore(query, storeOptions);
    const total = hits.length;
    return hits.map((hit, rank) => ({
      title: hit.title,
      url: hit.link,
      snippet: hit.summary.slice(0, SNIPPET_LIMIT),
      relevance_score: 1 - rank / Math.max(total, 1),
      engine: "rss-feed",
      ...hit.publishedDate ? { published_date: hit.publishedDate } : {}
    }));
  }
}
|
|
25
|
+
export {
|
|
26
|
+
RssFeedEngine
|
|
27
|
+
};
|
|
28
|
+
//# sourceMappingURL=rss-engine.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../../../src/search/v1/rss/rss-engine.ts"],"sourcesContent":["import type { SearchEngine, SearchEngineOptions, RawSearchResult } from '../../../types.js';\nimport { queryFeedStore } from './feed-store.js';\n\nconst SNIPPET_LIMIT = 200;\n\nexport class RssFeedEngine implements SearchEngine {\n name = 'rss-feed';\n\n async search(query: string, options: SearchEngineOptions = {}): Promise<RawSearchResult[]> {\n const items = queryFeedStore(query, {\n maxResults: options.maxResults ?? 10,\n ...(options.fromDate ? { fromDate: options.fromDate } : {}),\n ...(options.toDate ? { toDate: options.toDate } : {}),\n });\n const total = items.length;\n return items.map((it, i) => {\n const result: RawSearchResult = {\n title: it.title,\n url: it.link,\n snippet: it.summary.slice(0, SNIPPET_LIMIT),\n relevance_score: 1 - i / Math.max(total, 1),\n engine: 'rss-feed',\n };\n if (it.publishedDate) result.published_date = it.publishedDate;\n return result;\n });\n }\n}\n"],"mappings":"AACA,SAAS,sBAAsB;AAE/B,MAAM,gBAAgB;AAEf,MAAM,cAAsC;AAAA,EACjD,OAAO;AAAA,EAEP,MAAM,OAAO,OAAe,UAA+B,CAAC,GAA+B;AACzF,UAAM,QAAQ,eAAe,OAAO;AAAA,MAClC,YAAY,QAAQ,cAAc;AAAA,MAClC,GAAI,QAAQ,WAAW,EAAE,UAAU,QAAQ,SAAS,IAAI,CAAC;AAAA,MACzD,GAAI,QAAQ,SAAS,EAAE,QAAQ,QAAQ,OAAO,IAAI,CAAC;AAAA,IACrD,CAAC;AACD,UAAM,QAAQ,MAAM;AACpB,WAAO,MAAM,IAAI,CAAC,IAAI,MAAM;AAC1B,YAAM,SAA0B;AAAA,QAC9B,OAAO,GAAG;AAAA,QACV,KAAK,GAAG;AAAA,QACR,SAAS,GAAG,QAAQ,MAAM,GAAG,aAAa;AAAA,QAC1C,iBAAiB,IAAI,IAAI,KAAK,IAAI,OAAO,CAAC;AAAA,QAC1C,QAAQ;AAAA,MACV;AACA,UAAI,GAAG,cAAe,QAAO,iBAAiB,GAAG;AACjD,aAAO;AAAA,IACT,CAAC;AAAA,EACH;AACF;","names":[]}
|
|
@@ -0,0 +1,7 @@
|
|
|
1
|
+
import type { SearchProvider, SearchContext } from '../../providers/search-provider.js';
|
|
2
|
+
import type { SearchInput, SearchOutput, StageResult } from '../../types.js';
|
|
3
|
+
/**
 * Public type surface of the "v1" search provider.
 *
 * Declared as an implementation of the project's `SearchProvider` contract.
 * The implementation itself is not part of this declaration file.
 */
export declare class V1SearchProvider implements SearchProvider {
    /** Provider identifier, fixed to the literal `"v1"`. */
    readonly name: "v1";

    /**
     * Executes a search for the given input.
     *
     * @param input - The search request.
     * @param _ctx - Search context supplied by the caller.
     *   NOTE(review): the leading underscore suggests it is unused by the
     *   implementation — confirm against `v1-provider.js`.
     * @returns A promise of a `StageResult` wrapping the `SearchOutput`.
     */
    search(input: SearchInput, _ctx: SearchContext): Promise<StageResult<SearchOutput>>;
}
|
|
7
|
+
//# sourceMappingURL=v1-provider.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"v1-provider.d.ts","sourceRoot":"","sources":["../../../src/search/v1/v1-provider.ts"],"names":[],"mappings":"AAQA,OAAO,KAAK,EAAE,cAAc,EAAE,aAAa,EAAE,MAAM,oCAAoC,CAAC;AACxF,OAAO,KAAK,EACV,WAAW,EACX,YAAY,EAEZ,WAAW,EACZ,MAAM,gBAAgB,CAAC;AAKxB,qBAAa,gBAAiB,YAAW,cAAc;IACrD,QAAQ,CAAC,IAAI,EAAG,IAAI,CAAU;IAExB,MAAM,CAAC,KAAK,EAAE,WAAW,EAAE,IAAI,EAAE,aAAa,GAAG,OAAO,CAAC,WAAW,CAAC,YAAY,CAAC,CAAC;CAuE1F"}
|