@staticn0va/wigolo 0.1.0 → 0.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +1 -1
- package/README.md +195 -73
- package/SKILL.md +382 -0
- package/assets/blocks/claude-code/CLAUDE.md.block +20 -0
- package/assets/blocks/claude-code/wigolo-command.md +40 -0
- package/assets/blocks/cursor/wigolo.mdc +46 -0
- package/assets/blocks/gemini-cli/GEMINI.md.block +18 -0
- package/assets/blocks/vscode/copilot-instructions.md.block +18 -0
- package/assets/skills/wigolo/SKILL.md +50 -0
- package/assets/skills/wigolo/rules/cache-first.md +30 -0
- package/assets/skills/wigolo/rules/synthesis.md +43 -0
- package/assets/skills/wigolo-agent/SKILL.md +73 -0
- package/assets/skills/wigolo-crawl/SKILL.md +60 -0
- package/assets/skills/wigolo-extract/SKILL.md +59 -0
- package/assets/skills/wigolo-fetch/SKILL.md +65 -0
- package/assets/skills/wigolo-find-similar/SKILL.md +72 -0
- package/assets/skills/wigolo-research/SKILL.md +77 -0
- package/assets/skills/wigolo-search/SKILL.md +78 -0
- package/dist/agent/executor.d.ts +33 -0
- package/dist/agent/executor.d.ts.map +1 -0
- package/dist/agent/executor.js +233 -0
- package/dist/agent/executor.js.map +1 -0
- package/dist/agent/pipeline.d.ts +5 -0
- package/dist/agent/pipeline.d.ts.map +1 -0
- package/dist/agent/pipeline.js +208 -0
- package/dist/agent/pipeline.js.map +1 -0
- package/dist/agent/planner.d.ts +13 -0
- package/dist/agent/planner.d.ts.map +1 -0
- package/dist/agent/planner.js +271 -0
- package/dist/agent/planner.js.map +1 -0
- package/dist/agent/relevance.d.ts +15 -0
- package/dist/agent/relevance.d.ts.map +1 -0
- package/dist/agent/relevance.js +60 -0
- package/dist/agent/relevance.js.map +1 -0
- package/dist/cache/backfill-embeddings.d.ts +23 -0
- package/dist/cache/backfill-embeddings.d.ts.map +1 -0
- package/dist/cache/backfill-embeddings.js +105 -0
- package/dist/cache/backfill-embeddings.js.map +1 -0
- package/dist/cache/change-detector.d.ts +7 -0
- package/dist/cache/change-detector.d.ts.map +1 -0
- package/dist/cache/change-detector.js +43 -0
- package/dist/cache/change-detector.js.map +1 -0
- package/dist/cache/db.d.ts +1 -0
- package/dist/cache/db.d.ts.map +1 -1
- package/dist/cache/db.js +94 -22
- package/dist/cache/db.js.map +1 -1
- package/dist/cache/diff-summary.d.ts +2 -0
- package/dist/cache/diff-summary.d.ts.map +1 -0
- package/dist/cache/diff-summary.js +82 -0
- package/dist/cache/diff-summary.js.map +1 -0
- package/dist/cache/migrations/runner.d.ts +29 -0
- package/dist/cache/migrations/runner.d.ts.map +1 -0
- package/dist/cache/migrations/runner.js +147 -0
- package/dist/cache/migrations/runner.js.map +1 -0
- package/dist/cache/sqlite-vec-store.d.ts +42 -0
- package/dist/cache/sqlite-vec-store.d.ts.map +1 -0
- package/dist/cache/sqlite-vec-store.js +176 -0
- package/dist/cache/sqlite-vec-store.js.map +1 -0
- package/dist/cache/store.d.ts +46 -1
- package/dist/cache/store.d.ts.map +1 -1
- package/dist/cache/store.js +362 -168
- package/dist/cache/store.js.map +1 -1
- package/dist/cli/agents/antigravity.d.ts +20 -0
- package/dist/cli/agents/antigravity.d.ts.map +1 -0
- package/dist/cli/agents/antigravity.js +49 -0
- package/dist/cli/agents/antigravity.js.map +1 -0
- package/dist/cli/agents/claude-code.d.ts +25 -0
- package/dist/cli/agents/claude-code.d.ts.map +1 -0
- package/dist/cli/agents/claude-code.js +111 -0
- package/dist/cli/agents/claude-code.js.map +1 -0
- package/dist/cli/agents/cursor.d.ts +21 -0
- package/dist/cli/agents/cursor.d.ts.map +1 -0
- package/dist/cli/agents/cursor.js +58 -0
- package/dist/cli/agents/cursor.js.map +1 -0
- package/dist/cli/agents/gemini-cli.d.ts +21 -0
- package/dist/cli/agents/gemini-cli.d.ts.map +1 -0
- package/dist/cli/agents/gemini-cli.js +55 -0
- package/dist/cli/agents/gemini-cli.js.map +1 -0
- package/dist/cli/agents/registry.d.ts +21 -0
- package/dist/cli/agents/registry.d.ts.map +1 -0
- package/dist/cli/agents/registry.js +27 -0
- package/dist/cli/agents/registry.js.map +1 -0
- package/dist/cli/agents/utils.d.ts +26 -0
- package/dist/cli/agents/utils.d.ts.map +1 -0
- package/dist/cli/agents/utils.js +136 -0
- package/dist/cli/agents/utils.js.map +1 -0
- package/dist/cli/agents/vscode.d.ts +21 -0
- package/dist/cli/agents/vscode.d.ts.map +1 -0
- package/dist/cli/agents/vscode.js +62 -0
- package/dist/cli/agents/vscode.js.map +1 -0
- package/dist/cli/auth.d.ts +2 -0
- package/dist/cli/auth.d.ts.map +1 -0
- package/dist/cli/auth.js +94 -0
- package/dist/cli/auth.js.map +1 -0
- package/dist/cli/backfill.d.ts +2 -0
- package/dist/cli/backfill.d.ts.map +1 -0
- package/dist/cli/backfill.js +58 -0
- package/dist/cli/backfill.js.map +1 -0
- package/dist/cli/daemon.d.ts +6 -1
- package/dist/cli/daemon.d.ts.map +1 -1
- package/dist/cli/daemon.js +61 -3
- package/dist/cli/daemon.js.map +1 -1
- package/dist/cli/doctor.d.ts +8 -0
- package/dist/cli/doctor.d.ts.map +1 -0
- package/dist/cli/doctor.js +318 -0
- package/dist/cli/doctor.js.map +1 -0
- package/dist/cli/health.d.ts +1 -1
- package/dist/cli/health.d.ts.map +1 -1
- package/dist/cli/health.js +42 -3
- package/dist/cli/health.js.map +1 -1
- package/dist/cli/help.d.ts +6 -0
- package/dist/cli/help.d.ts.map +1 -0
- package/dist/cli/help.js +63 -0
- package/dist/cli/help.js.map +1 -0
- package/dist/cli/index.d.ts +1 -1
- package/dist/cli/index.d.ts.map +1 -1
- package/dist/cli/index.js +35 -7
- package/dist/cli/index.js.map +1 -1
- package/dist/cli/init.d.ts +2 -0
- package/dist/cli/init.d.ts.map +1 -0
- package/dist/cli/init.js +201 -0
- package/dist/cli/init.js.map +1 -0
- package/dist/cli/plugin.d.ts +5 -0
- package/dist/cli/plugin.d.ts.map +1 -0
- package/dist/cli/plugin.js +185 -0
- package/dist/cli/plugin.js.map +1 -0
- package/dist/cli/setup-mcp.d.ts +2 -0
- package/dist/cli/setup-mcp.d.ts.map +1 -0
- package/dist/cli/setup-mcp.js +114 -0
- package/dist/cli/setup-mcp.js.map +1 -0
- package/dist/cli/shell.d.ts +2 -0
- package/dist/cli/shell.d.ts.map +1 -0
- package/dist/cli/shell.js +86 -0
- package/dist/cli/shell.js.map +1 -0
- package/dist/cli/status.d.ts +2 -0
- package/dist/cli/status.d.ts.map +1 -0
- package/dist/cli/status.js +31 -0
- package/dist/cli/status.js.map +1 -0
- package/dist/cli/telemetry.d.ts +10 -0
- package/dist/cli/telemetry.d.ts.map +1 -0
- package/dist/cli/telemetry.js +56 -0
- package/dist/cli/telemetry.js.map +1 -0
- package/dist/cli/tui/agents-types.d.ts +28 -0
- package/dist/cli/tui/agents-types.d.ts.map +1 -0
- package/dist/cli/tui/agents-types.js +1 -0
- package/dist/cli/tui/agents-types.js.map +1 -0
- package/dist/cli/tui/agents.d.ts +11 -0
- package/dist/cli/tui/agents.d.ts.map +1 -0
- package/dist/cli/tui/agents.js +93 -0
- package/dist/cli/tui/agents.js.map +1 -0
- package/dist/cli/tui/banner.d.ts +3 -0
- package/dist/cli/tui/banner.d.ts.map +1 -0
- package/dist/cli/tui/banner.js +30 -0
- package/dist/cli/tui/banner.js.map +1 -0
- package/dist/cli/tui/components/AgentSelect.d.ts +13 -0
- package/dist/cli/tui/components/AgentSelect.d.ts.map +1 -0
- package/dist/cli/tui/components/AgentSelect.js +116 -0
- package/dist/cli/tui/components/AgentSelect.js.map +1 -0
- package/dist/cli/tui/components/Banner.d.ts +6 -0
- package/dist/cli/tui/components/Banner.d.ts.map +1 -0
- package/dist/cli/tui/components/Banner.js +25 -0
- package/dist/cli/tui/components/Banner.js.map +1 -0
- package/dist/cli/tui/components/BrowserSelect.d.ts +7 -0
- package/dist/cli/tui/components/BrowserSelect.d.ts.map +1 -0
- package/dist/cli/tui/components/BrowserSelect.js +19 -0
- package/dist/cli/tui/components/BrowserSelect.js.map +1 -0
- package/dist/cli/tui/components/InstallProgress.d.ts +9 -0
- package/dist/cli/tui/components/InstallProgress.d.ts.map +1 -0
- package/dist/cli/tui/components/InstallProgress.js +67 -0
- package/dist/cli/tui/components/InstallProgress.js.map +1 -0
- package/dist/cli/tui/components/SkillInstall.d.ts +14 -0
- package/dist/cli/tui/components/SkillInstall.d.ts.map +1 -0
- package/dist/cli/tui/components/SkillInstall.js +94 -0
- package/dist/cli/tui/components/SkillInstall.js.map +1 -0
- package/dist/cli/tui/components/Summary.d.ts +22 -0
- package/dist/cli/tui/components/Summary.d.ts.map +1 -0
- package/dist/cli/tui/components/Summary.js +135 -0
- package/dist/cli/tui/components/Summary.js.map +1 -0
- package/dist/cli/tui/components/SystemCheck.d.ts +8 -0
- package/dist/cli/tui/components/SystemCheck.d.ts.map +1 -0
- package/dist/cli/tui/components/SystemCheck.js +71 -0
- package/dist/cli/tui/components/SystemCheck.js.map +1 -0
- package/dist/cli/tui/components/Verification.d.ts +8 -0
- package/dist/cli/tui/components/Verification.d.ts.map +1 -0
- package/dist/cli/tui/components/Verification.js +63 -0
- package/dist/cli/tui/components/Verification.js.map +1 -0
- package/dist/cli/tui/config-writer-cli.d.ts +12 -0
- package/dist/cli/tui/config-writer-cli.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-cli.js +39 -0
- package/dist/cli/tui/config-writer-cli.js.map +1 -0
- package/dist/cli/tui/config-writer-json.d.ts +16 -0
- package/dist/cli/tui/config-writer-json.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-json.js +86 -0
- package/dist/cli/tui/config-writer-json.js.map +1 -0
- package/dist/cli/tui/config-writer-toml.d.ts +16 -0
- package/dist/cli/tui/config-writer-toml.d.ts.map +1 -0
- package/dist/cli/tui/config-writer-toml.js +83 -0
- package/dist/cli/tui/config-writer-toml.js.map +1 -0
- package/dist/cli/tui/config-writer.d.ts +25 -0
- package/dist/cli/tui/config-writer.d.ts.map +1 -0
- package/dist/cli/tui/config-writer.js +101 -0
- package/dist/cli/tui/config-writer.js.map +1 -0
- package/dist/cli/tui/detect-helpers.d.ts +6 -0
- package/dist/cli/tui/detect-helpers.d.ts.map +1 -0
- package/dist/cli/tui/detect-helpers.js +45 -0
- package/dist/cli/tui/detect-helpers.js.map +1 -0
- package/dist/cli/tui/extras-prompt.d.ts +7 -0
- package/dist/cli/tui/extras-prompt.d.ts.map +1 -0
- package/dist/cli/tui/extras-prompt.js +42 -0
- package/dist/cli/tui/extras-prompt.js.map +1 -0
- package/dist/cli/tui/flags-types.d.ts +19 -0
- package/dist/cli/tui/flags-types.d.ts.map +1 -0
- package/dist/cli/tui/flags-types.js +23 -0
- package/dist/cli/tui/flags-types.js.map +1 -0
- package/dist/cli/tui/flags.d.ts +5 -0
- package/dist/cli/tui/flags.d.ts.map +1 -0
- package/dist/cli/tui/flags.js +132 -0
- package/dist/cli/tui/flags.js.map +1 -0
- package/dist/cli/tui/format.d.ts +14 -0
- package/dist/cli/tui/format.d.ts.map +1 -0
- package/dist/cli/tui/format.js +37 -0
- package/dist/cli/tui/format.js.map +1 -0
- package/dist/cli/tui/hooks/useAgentDetect.d.ts +6 -0
- package/dist/cli/tui/hooks/useAgentDetect.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useAgentDetect.js +19 -0
- package/dist/cli/tui/hooks/useAgentDetect.js.map +1 -0
- package/dist/cli/tui/hooks/useInstall.d.ts +14 -0
- package/dist/cli/tui/hooks/useInstall.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useInstall.js +90 -0
- package/dist/cli/tui/hooks/useInstall.js.map +1 -0
- package/dist/cli/tui/hooks/useSystemCheck.d.ts +13 -0
- package/dist/cli/tui/hooks/useSystemCheck.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useSystemCheck.js +95 -0
- package/dist/cli/tui/hooks/useSystemCheck.js.map +1 -0
- package/dist/cli/tui/hooks/useVerify.d.ts +14 -0
- package/dist/cli/tui/hooks/useVerify.d.ts.map +1 -0
- package/dist/cli/tui/hooks/useVerify.js +71 -0
- package/dist/cli/tui/hooks/useVerify.js.map +1 -0
- package/dist/cli/tui/ink-init.d.ts +2 -0
- package/dist/cli/tui/ink-init.d.ts.map +1 -0
- package/dist/cli/tui/ink-init.js +198 -0
- package/dist/cli/tui/ink-init.js.map +1 -0
- package/dist/cli/tui/reporter-auto.d.ts +7 -0
- package/dist/cli/tui/reporter-auto.d.ts.map +1 -0
- package/dist/cli/tui/reporter-auto.js +15 -0
- package/dist/cli/tui/reporter-auto.js.map +1 -0
- package/dist/cli/tui/reporter.d.ts +26 -0
- package/dist/cli/tui/reporter.d.ts.map +1 -0
- package/dist/cli/tui/reporter.js +32 -0
- package/dist/cli/tui/reporter.js.map +1 -0
- package/dist/cli/tui/run-command.d.ts +14 -0
- package/dist/cli/tui/run-command.d.ts.map +1 -0
- package/dist/cli/tui/run-command.js +72 -0
- package/dist/cli/tui/run-command.js.map +1 -0
- package/dist/cli/tui/select-agents.d.ts +6 -0
- package/dist/cli/tui/select-agents.d.ts.map +1 -0
- package/dist/cli/tui/select-agents.js +32 -0
- package/dist/cli/tui/select-agents.js.map +1 -0
- package/dist/cli/tui/status-agents.d.ts +11 -0
- package/dist/cli/tui/status-agents.d.ts.map +1 -0
- package/dist/cli/tui/status-agents.js +53 -0
- package/dist/cli/tui/status-agents.js.map +1 -0
- package/dist/cli/tui/status-cache.d.ts +6 -0
- package/dist/cli/tui/status-cache.d.ts.map +1 -0
- package/dist/cli/tui/status-cache.js +39 -0
- package/dist/cli/tui/status-cache.js.map +1 -0
- package/dist/cli/tui/status-format.d.ts +14 -0
- package/dist/cli/tui/status-format.d.ts.map +1 -0
- package/dist/cli/tui/status-format.js +41 -0
- package/dist/cli/tui/status-format.js.map +1 -0
- package/dist/cli/tui/status-python.d.ts +6 -0
- package/dist/cli/tui/status-python.d.ts.map +1 -0
- package/dist/cli/tui/status-python.js +30 -0
- package/dist/cli/tui/status-python.js.map +1 -0
- package/dist/cli/tui/system-check.d.ts +24 -0
- package/dist/cli/tui/system-check.d.ts.map +1 -0
- package/dist/cli/tui/system-check.js +103 -0
- package/dist/cli/tui/system-check.js.map +1 -0
- package/dist/cli/tui/tui-reporter.d.ts +19 -0
- package/dist/cli/tui/tui-reporter.d.ts.map +1 -0
- package/dist/cli/tui/tui-reporter.js +95 -0
- package/dist/cli/tui/tui-reporter.js.map +1 -0
- package/dist/cli/tui/utils/config-writer.d.ts +3 -0
- package/dist/cli/tui/utils/config-writer.d.ts.map +1 -0
- package/dist/cli/tui/utils/config-writer.js +22 -0
- package/dist/cli/tui/utils/config-writer.js.map +1 -0
- package/dist/cli/tui/utils/suppress-logs.d.ts +3 -0
- package/dist/cli/tui/utils/suppress-logs.d.ts.map +1 -0
- package/dist/cli/tui/utils/suppress-logs.js +11 -0
- package/dist/cli/tui/utils/suppress-logs.js.map +1 -0
- package/dist/cli/tui/verify-suggestions.d.ts +5 -0
- package/dist/cli/tui/verify-suggestions.d.ts.map +1 -0
- package/dist/cli/tui/verify-suggestions.js +20 -0
- package/dist/cli/tui/verify-suggestions.js.map +1 -0
- package/dist/cli/tui/verify.d.ts +14 -0
- package/dist/cli/tui/verify.d.ts.map +1 -0
- package/dist/cli/tui/verify.js +101 -0
- package/dist/cli/tui/verify.js.map +1 -0
- package/dist/cli/tui/version.d.ts +2 -0
- package/dist/cli/tui/version.d.ts.map +1 -0
- package/dist/cli/tui/version.js +14 -0
- package/dist/cli/tui/version.js.map +1 -0
- package/dist/cli/uninstall.d.ts +2 -0
- package/dist/cli/uninstall.d.ts.map +1 -0
- package/dist/cli/uninstall.js +57 -0
- package/dist/cli/uninstall.js.map +1 -0
- package/dist/cli/warmup.d.ts +10 -2
- package/dist/cli/warmup.d.ts.map +1 -1
- package/dist/cli/warmup.js +226 -93
- package/dist/cli/warmup.js.map +1 -1
- package/dist/config.d.ts +28 -2
- package/dist/config.d.ts.map +1 -1
- package/dist/config.js +106 -56
- package/dist/config.js.map +1 -1
- package/dist/crawl/crawler.d.ts +6 -0
- package/dist/crawl/crawler.d.ts.map +1 -1
- package/dist/crawl/crawler.js +210 -209
- package/dist/crawl/crawler.js.map +1 -1
- package/dist/crawl/dedup.d.ts +1 -0
- package/dist/crawl/dedup.d.ts.map +1 -1
- package/dist/crawl/dedup.js +124 -81
- package/dist/crawl/dedup.js.map +1 -1
- package/dist/crawl/etag-incremental.d.ts +43 -0
- package/dist/crawl/etag-incremental.d.ts.map +1 -0
- package/dist/crawl/etag-incremental.js +94 -0
- package/dist/crawl/etag-incremental.js.map +1 -0
- package/dist/crawl/index-to-vec.d.ts +10 -0
- package/dist/crawl/index-to-vec.d.ts.map +1 -0
- package/dist/crawl/index-to-vec.js +44 -0
- package/dist/crawl/index-to-vec.js.map +1 -0
- package/dist/crawl/mapper.js +136 -164
- package/dist/crawl/mapper.js.map +1 -1
- package/dist/crawl/rate-limiter.js +63 -66
- package/dist/crawl/rate-limiter.js.map +1 -1
- package/dist/crawl/robots.js +58 -57
- package/dist/crawl/robots.js.map +1 -1
- package/dist/crawl/sitemap-first.d.ts +12 -0
- package/dist/crawl/sitemap-first.d.ts.map +1 -0
- package/dist/crawl/sitemap-first.js +47 -0
- package/dist/crawl/sitemap-first.js.map +1 -0
- package/dist/crawl/sitemap.js +33 -32
- package/dist/crawl/sitemap.js.map +1 -1
- package/dist/crawl/url-utils.d.ts +1 -0
- package/dist/crawl/url-utils.d.ts.map +1 -1
- package/dist/crawl/url-utils.js +49 -37
- package/dist/crawl/url-utils.js.map +1 -1
- package/dist/daemon/health-check.d.ts +16 -0
- package/dist/daemon/health-check.d.ts.map +1 -0
- package/dist/daemon/health-check.js +33 -0
- package/dist/daemon/health-check.js.map +1 -0
- package/dist/daemon/http-server.d.ts +26 -0
- package/dist/daemon/http-server.d.ts.map +1 -0
- package/dist/daemon/http-server.js +275 -0
- package/dist/daemon/http-server.js.map +1 -0
- package/dist/daemon/proxy.d.ts +10 -0
- package/dist/daemon/proxy.d.ts.map +1 -0
- package/dist/daemon/proxy.js +93 -0
- package/dist/daemon/proxy.js.map +1 -0
- package/dist/embedding/embed.d.ts +59 -0
- package/dist/embedding/embed.d.ts.map +1 -0
- package/dist/embedding/embed.js +233 -0
- package/dist/embedding/embed.js.map +1 -0
- package/dist/embedding/fastembed-provider.d.ts +19 -0
- package/dist/embedding/fastembed-provider.d.ts.map +1 -0
- package/dist/embedding/fastembed-provider.js +51 -0
- package/dist/embedding/fastembed-provider.js.map +1 -0
- package/dist/embedding/key-terms.d.ts +12 -0
- package/dist/embedding/key-terms.d.ts.map +1 -0
- package/dist/embedding/key-terms.js +234 -0
- package/dist/embedding/key-terms.js.map +1 -0
- package/dist/extraction/boilerplate.d.ts +15 -0
- package/dist/extraction/boilerplate.d.ts.map +1 -0
- package/dist/extraction/boilerplate.js +52 -0
- package/dist/extraction/boilerplate.js.map +1 -0
- package/dist/extraction/defuddle.d.ts.map +1 -1
- package/dist/extraction/defuddle.js +27 -23
- package/dist/extraction/defuddle.js.map +1 -1
- package/dist/extraction/extract.d.ts.map +1 -1
- package/dist/extraction/extract.js +76 -76
- package/dist/extraction/extract.js.map +1 -1
- package/dist/extraction/jsonld.js +50 -54
- package/dist/extraction/jsonld.js.map +1 -1
- package/dist/extraction/lang-hints.d.ts +2 -0
- package/dist/extraction/lang-hints.d.ts.map +1 -0
- package/dist/extraction/lang-hints.js +30 -0
- package/dist/extraction/lang-hints.js.map +1 -0
- package/dist/extraction/llm-fallback.d.ts +17 -0
- package/dist/extraction/llm-fallback.d.ts.map +1 -0
- package/dist/extraction/llm-fallback.js +130 -0
- package/dist/extraction/llm-fallback.js.map +1 -0
- package/dist/extraction/markdown-sanitize.d.ts +2 -0
- package/dist/extraction/markdown-sanitize.d.ts.map +1 -0
- package/dist/extraction/markdown-sanitize.js +151 -0
- package/dist/extraction/markdown-sanitize.js.map +1 -0
- package/dist/extraction/markdown.d.ts +11 -0
- package/dist/extraction/markdown.d.ts.map +1 -1
- package/dist/extraction/markdown.js +195 -91
- package/dist/extraction/markdown.js.map +1 -1
- package/dist/extraction/pipeline.d.ts +8 -0
- package/dist/extraction/pipeline.d.ts.map +1 -1
- package/dist/extraction/pipeline.js +57 -91
- package/dist/extraction/pipeline.js.map +1 -1
- package/dist/extraction/readability.d.ts +1 -1
- package/dist/extraction/readability.d.ts.map +1 -1
- package/dist/extraction/readability.js +28 -29
- package/dist/extraction/readability.js.map +1 -1
- package/dist/extraction/schema.d.ts +12 -0
- package/dist/extraction/schema.d.ts.map +1 -1
- package/dist/extraction/schema.js +135 -72
- package/dist/extraction/schema.js.map +1 -1
- package/dist/extraction/site-extractors/docs-generic.d.ts.map +1 -1
- package/dist/extraction/site-extractors/docs-generic.js +81 -91
- package/dist/extraction/site-extractors/docs-generic.js.map +1 -1
- package/dist/extraction/site-extractors/github.d.ts.map +1 -1
- package/dist/extraction/site-extractors/github.js +87 -95
- package/dist/extraction/site-extractors/github.js.map +1 -1
- package/dist/extraction/site-extractors/mdn.d.ts.map +1 -1
- package/dist/extraction/site-extractors/mdn.js +46 -54
- package/dist/extraction/site-extractors/mdn.js.map +1 -1
- package/dist/extraction/site-extractors/stackoverflow.d.ts.map +1 -1
- package/dist/extraction/site-extractors/stackoverflow.js +71 -80
- package/dist/extraction/site-extractors/stackoverflow.js.map +1 -1
- package/dist/extraction/structured-data.d.ts +4 -0
- package/dist/extraction/structured-data.d.ts.map +1 -0
- package/dist/extraction/structured-data.js +173 -0
- package/dist/extraction/structured-data.js.map +1 -0
- package/dist/extraction/structured.d.ts +4 -0
- package/dist/extraction/structured.d.ts.map +1 -0
- package/dist/extraction/structured.js +163 -0
- package/dist/extraction/structured.js.map +1 -0
- package/dist/extraction/v1/classifier.d.ts +3 -0
- package/dist/extraction/v1/classifier.d.ts.map +1 -0
- package/dist/extraction/v1/classifier.js +110 -0
- package/dist/extraction/v1/classifier.js.map +1 -0
- package/dist/extraction/v1/extract-provider.d.ts +16 -0
- package/dist/extraction/v1/extract-provider.d.ts.map +1 -0
- package/dist/extraction/v1/extract-provider.js +43 -0
- package/dist/extraction/v1/extract-provider.js.map +1 -0
- package/dist/extraction/v1/local-llm.d.ts +8 -0
- package/dist/extraction/v1/local-llm.d.ts.map +1 -0
- package/dist/extraction/v1/local-llm.js +58 -0
- package/dist/extraction/v1/local-llm.js.map +1 -0
- package/dist/extraction/v1/news.d.ts +3 -0
- package/dist/extraction/v1/news.d.ts.map +1 -0
- package/dist/extraction/v1/news.js +61 -0
- package/dist/extraction/v1/news.js.map +1 -0
- package/dist/extraction/v1/product.d.ts +3 -0
- package/dist/extraction/v1/product.d.ts.map +1 -0
- package/dist/extraction/v1/product.js +166 -0
- package/dist/extraction/v1/product.js.map +1 -0
- package/dist/extraction/v1/recipe.d.ts +3 -0
- package/dist/extraction/v1/recipe.d.ts.map +1 -0
- package/dist/extraction/v1/recipe.js +136 -0
- package/dist/extraction/v1/recipe.js.map +1 -0
- package/dist/extraction/v1/routed.d.ts +17 -0
- package/dist/extraction/v1/routed.d.ts.map +1 -0
- package/dist/extraction/v1/routed.js +68 -0
- package/dist/extraction/v1/routed.js.map +1 -0
- package/dist/extraction/v1/schemas/Article.d.ts +11 -0
- package/dist/extraction/v1/schemas/Article.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Article.js +23 -0
- package/dist/extraction/v1/schemas/Article.js.map +1 -0
- package/dist/extraction/v1/schemas/CodeSnippet.d.ts +9 -0
- package/dist/extraction/v1/schemas/CodeSnippet.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/CodeSnippet.js +90 -0
- package/dist/extraction/v1/schemas/CodeSnippet.js.map +1 -0
- package/dist/extraction/v1/schemas/EventListing.d.ts +10 -0
- package/dist/extraction/v1/schemas/EventListing.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/EventListing.js +122 -0
- package/dist/extraction/v1/schemas/EventListing.js.map +1 -0
- package/dist/extraction/v1/schemas/Paper.d.ts +10 -0
- package/dist/extraction/v1/schemas/Paper.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Paper.js +156 -0
- package/dist/extraction/v1/schemas/Paper.js.map +1 -0
- package/dist/extraction/v1/schemas/Product.d.ts +17 -0
- package/dist/extraction/v1/schemas/Product.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Product.js +149 -0
- package/dist/extraction/v1/schemas/Product.js.map +1 -0
- package/dist/extraction/v1/schemas/Recipe.d.ts +14 -0
- package/dist/extraction/v1/schemas/Recipe.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/Recipe.js +160 -0
- package/dist/extraction/v1/schemas/Recipe.js.map +1 -0
- package/dist/extraction/v1/schemas/index.d.ts +13 -0
- package/dist/extraction/v1/schemas/index.d.ts.map +1 -0
- package/dist/extraction/v1/schemas/index.js +44 -0
- package/dist/extraction/v1/schemas/index.js.map +1 -0
- package/dist/extraction/v1/site-extractors.d.ts +5 -0
- package/dist/extraction/v1/site-extractors.d.ts.map +1 -0
- package/dist/extraction/v1/site-extractors.js +31 -0
- package/dist/extraction/v1/site-extractors.js.map +1 -0
- package/dist/fetch/action-executor.d.ts +28 -0
- package/dist/fetch/action-executor.d.ts.map +1 -0
- package/dist/fetch/action-executor.js +88 -0
- package/dist/fetch/action-executor.js.map +1 -0
- package/dist/fetch/auth.d.ts +2 -1
- package/dist/fetch/auth.d.ts.map +1 -1
- package/dist/fetch/auth.js +56 -26
- package/dist/fetch/auth.js.map +1 -1
- package/dist/fetch/browser-pool.d.ts +30 -11
- package/dist/fetch/browser-pool.d.ts.map +1 -1
- package/dist/fetch/browser-pool.js +303 -127
- package/dist/fetch/browser-pool.js.map +1 -1
- package/dist/fetch/browser-selector.d.ts +17 -0
- package/dist/fetch/browser-selector.d.ts.map +1 -0
- package/dist/fetch/browser-selector.js +72 -0
- package/dist/fetch/browser-selector.js.map +1 -0
- package/dist/fetch/browser-types.d.ts +3 -0
- package/dist/fetch/browser-types.d.ts.map +1 -0
- package/dist/fetch/browser-types.js +45 -0
- package/dist/fetch/browser-types.js.map +1 -0
- package/dist/fetch/cdp-client.d.ts +9 -0
- package/dist/fetch/cdp-client.d.ts.map +1 -0
- package/dist/fetch/cdp-client.js +89 -0
- package/dist/fetch/cdp-client.js.map +1 -0
- package/dist/fetch/content-check.js +39 -46
- package/dist/fetch/content-check.js.map +1 -1
- package/dist/fetch/http-client.d.ts +4 -0
- package/dist/fetch/http-client.d.ts.map +1 -1
- package/dist/fetch/http-client.js +147 -128
- package/dist/fetch/http-client.js.map +1 -1
- package/dist/fetch/lightpanda.d.ts +28 -0
- package/dist/fetch/lightpanda.d.ts.map +1 -0
- package/dist/fetch/lightpanda.js +174 -0
- package/dist/fetch/lightpanda.js.map +1 -0
- package/dist/fetch/playwright-tier.d.ts +19 -0
- package/dist/fetch/playwright-tier.d.ts.map +1 -0
- package/dist/fetch/playwright-tier.js +76 -0
- package/dist/fetch/playwright-tier.js.map +1 -0
- package/dist/fetch/router.d.ts +49 -3
- package/dist/fetch/router.d.ts.map +1 -1
- package/dist/fetch/router.js +185 -81
- package/dist/fetch/router.js.map +1 -1
- package/dist/index.js +97 -17
- package/dist/index.js.map +1 -1
- package/dist/instructions.d.ts +31 -0
- package/dist/instructions.d.ts.map +1 -0
- package/dist/instructions.js +245 -0
- package/dist/instructions.js.map +1 -0
- package/dist/integrations/cloud/llm/anthropic.d.ts +3 -0
- package/dist/integrations/cloud/llm/anthropic.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/anthropic.js +41 -0
- package/dist/integrations/cloud/llm/anthropic.js.map +1 -0
- package/dist/integrations/cloud/llm/cache.d.ts +5 -0
- package/dist/integrations/cloud/llm/cache.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/cache.js +49 -0
- package/dist/integrations/cloud/llm/cache.js.map +1 -0
- package/dist/integrations/cloud/llm/gemini.d.ts +3 -0
- package/dist/integrations/cloud/llm/gemini.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/gemini.js +37 -0
- package/dist/integrations/cloud/llm/gemini.js.map +1 -0
- package/dist/integrations/cloud/llm/groq.d.ts +3 -0
- package/dist/integrations/cloud/llm/groq.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/groq.js +74 -0
- package/dist/integrations/cloud/llm/groq.js.map +1 -0
- package/dist/integrations/cloud/llm/hash.d.ts +3 -0
- package/dist/integrations/cloud/llm/hash.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/hash.js +26 -0
- package/dist/integrations/cloud/llm/hash.js.map +1 -0
- package/dist/integrations/cloud/llm/openai.d.ts +3 -0
- package/dist/integrations/cloud/llm/openai.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/openai.js +43 -0
- package/dist/integrations/cloud/llm/openai.js.map +1 -0
- package/dist/integrations/cloud/llm/select.d.ts +5 -0
- package/dist/integrations/cloud/llm/select.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/select.js +30 -0
- package/dist/integrations/cloud/llm/select.js.map +1 -0
- package/dist/integrations/cloud/llm/types.d.ts +24 -0
- package/dist/integrations/cloud/llm/types.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/types.js +1 -0
- package/dist/integrations/cloud/llm/types.js.map +1 -0
- package/dist/integrations/cloud/llm/validate.d.ts +6 -0
- package/dist/integrations/cloud/llm/validate.d.ts.map +1 -0
- package/dist/integrations/cloud/llm/validate.js +63 -0
- package/dist/integrations/cloud/llm/validate.js.map +1 -0
- package/dist/logger.d.ts +4 -1
- package/dist/logger.d.ts.map +1 -1
- package/dist/logger.js +71 -30
- package/dist/logger.js.map +1 -1
- package/dist/pdf-parse.d.js +1 -0
- package/dist/pdf-parse.d.js.map +1 -0
- package/dist/plugins/loader.d.ts +20 -0
- package/dist/plugins/loader.d.ts.map +1 -0
- package/dist/plugins/loader.js +157 -0
- package/dist/plugins/loader.js.map +1 -0
- package/dist/plugins/registry.d.ts +26 -0
- package/dist/plugins/registry.d.ts.map +1 -0
- package/dist/plugins/registry.js +71 -0
- package/dist/plugins/registry.js.map +1 -0
- package/dist/plugins/validate.d.ts +9 -0
- package/dist/plugins/validate.d.ts.map +1 -0
- package/dist/plugins/validate.js +79 -0
- package/dist/plugins/validate.js.map +1 -0
- package/dist/providers/embed-provider.d.ts +11 -0
- package/dist/providers/embed-provider.d.ts.map +1 -0
- package/dist/providers/embed-provider.js +24 -0
- package/dist/providers/embed-provider.js.map +1 -0
- package/dist/providers/extract-provider.d.ts +23 -0
- package/dist/providers/extract-provider.d.ts.map +1 -0
- package/dist/providers/extract-provider.js +25 -0
- package/dist/providers/extract-provider.js.map +1 -0
- package/dist/providers/rerank-provider.d.ts +16 -0
- package/dist/providers/rerank-provider.d.ts.map +1 -0
- package/dist/providers/rerank-provider.js +28 -0
- package/dist/providers/rerank-provider.js.map +1 -0
- package/dist/providers/search-provider.d.ts +25 -0
- package/dist/providers/search-provider.d.ts.map +1 -0
- package/dist/providers/search-provider.js +44 -0
- package/dist/providers/search-provider.js.map +1 -0
- package/dist/providers/vector-store.d.ts +27 -0
- package/dist/providers/vector-store.d.ts.map +1 -0
- package/dist/providers/vector-store.js +27 -0
- package/dist/providers/vector-store.js.map +1 -0
- package/dist/python-env.d.ts +9 -0
- package/dist/python-env.d.ts.map +1 -0
- package/dist/python-env.js +13 -0
- package/dist/python-env.js.map +1 -0
- package/dist/repl/commands/agent.d.ts +5 -0
- package/dist/repl/commands/agent.d.ts.map +1 -0
- package/dist/repl/commands/agent.js +62 -0
- package/dist/repl/commands/agent.js.map +1 -0
- package/dist/repl/commands/cache.d.ts +4 -0
- package/dist/repl/commands/cache.d.ts.map +1 -0
- package/dist/repl/commands/cache.js +43 -0
- package/dist/repl/commands/cache.js.map +1 -0
- package/dist/repl/commands/crawl.d.ts +7 -0
- package/dist/repl/commands/crawl.d.ts.map +1 -0
- package/dist/repl/commands/crawl.js +44 -0
- package/dist/repl/commands/crawl.js.map +1 -0
- package/dist/repl/commands/extract.d.ts +5 -0
- package/dist/repl/commands/extract.d.ts.map +1 -0
- package/dist/repl/commands/extract.js +47 -0
- package/dist/repl/commands/extract.js.map +1 -0
- package/dist/repl/commands/fetch.d.ts +5 -0
- package/dist/repl/commands/fetch.d.ts.map +1 -0
- package/dist/repl/commands/fetch.js +67 -0
- package/dist/repl/commands/fetch.js.map +1 -0
- package/dist/repl/commands/find-similar.d.ts +5 -0
- package/dist/repl/commands/find-similar.d.ts.map +1 -0
- package/dist/repl/commands/find-similar.js +74 -0
- package/dist/repl/commands/find-similar.js.map +1 -0
- package/dist/repl/commands/research.d.ts +5 -0
- package/dist/repl/commands/research.d.ts.map +1 -0
- package/dist/repl/commands/research.js +65 -0
- package/dist/repl/commands/research.js.map +1 -0
- package/dist/repl/commands/search.d.ts +5 -0
- package/dist/repl/commands/search.d.ts.map +1 -0
- package/dist/repl/commands/search.js +74 -0
- package/dist/repl/commands/search.js.map +1 -0
- package/dist/repl/commands/types.d.ts +9 -0
- package/dist/repl/commands/types.d.ts.map +1 -0
- package/dist/repl/commands/types.js +1 -0
- package/dist/repl/commands/types.js.map +1 -0
- package/dist/repl/formatters.d.ts +13 -0
- package/dist/repl/formatters.d.ts.map +1 -0
- package/dist/repl/formatters.js +283 -0
- package/dist/repl/formatters.js.map +1 -0
- package/dist/repl/parser.d.ts +9 -0
- package/dist/repl/parser.d.ts.map +1 -0
- package/dist/repl/parser.js +86 -0
- package/dist/repl/parser.js.map +1 -0
- package/dist/repl/shell.d.ts +8 -0
- package/dist/repl/shell.d.ts.map +1 -0
- package/dist/repl/shell.js +184 -0
- package/dist/repl/shell.js.map +1 -0
- package/dist/research/branch-exploration.d.ts +14 -0
- package/dist/research/branch-exploration.d.ts.map +1 -0
- package/dist/research/branch-exploration.js +100 -0
- package/dist/research/branch-exploration.js.map +1 -0
- package/dist/research/brief.d.ts +5 -0
- package/dist/research/brief.d.ts.map +1 -0
- package/dist/research/brief.js +242 -0
- package/dist/research/brief.js.map +1 -0
- package/dist/research/citation-graph.d.ts +9 -0
- package/dist/research/citation-graph.d.ts.map +1 -0
- package/dist/research/citation-graph.js +114 -0
- package/dist/research/citation-graph.js.map +1 -0
- package/dist/research/decompose.d.ts +14 -0
- package/dist/research/decompose.d.ts.map +1 -0
- package/dist/research/decompose.js +439 -0
- package/dist/research/decompose.js.map +1 -0
- package/dist/research/pipeline.d.ts +5 -0
- package/dist/research/pipeline.d.ts.map +1 -0
- package/dist/research/pipeline.js +269 -0
- package/dist/research/pipeline.js.map +1 -0
- package/dist/research/synthesis-local.d.ts +16 -0
- package/dist/research/synthesis-local.d.ts.map +1 -0
- package/dist/research/synthesis-local.js +73 -0
- package/dist/research/synthesis-local.js.map +1 -0
- package/dist/research/synthesize.d.ts +10 -0
- package/dist/research/synthesize.d.ts.map +1 -0
- package/dist/research/synthesize.js +137 -0
- package/dist/research/synthesize.js.map +1 -0
- package/dist/search/answer-synthesis.d.ts +33 -0
- package/dist/search/answer-synthesis.d.ts.map +1 -0
- package/dist/search/answer-synthesis.js +244 -0
- package/dist/search/answer-synthesis.js.map +1 -0
- package/dist/search/context-formatter.d.ts +3 -0
- package/dist/search/context-formatter.d.ts.map +1 -0
- package/dist/search/context-formatter.js +56 -0
- package/dist/search/context-formatter.js.map +1 -0
- package/dist/search/dedup.d.ts +1 -0
- package/dist/search/dedup.d.ts.map +1 -1
- package/dist/search/dedup.js +40 -32
- package/dist/search/dedup.js.map +1 -1
- package/dist/search/engines/arxiv.d.ts +7 -0
- package/dist/search/engines/arxiv.d.ts.map +1 -0
- package/dist/search/engines/arxiv.js +70 -0
- package/dist/search/engines/arxiv.js.map +1 -0
- package/dist/search/engines/bing-news.d.ts +7 -0
- package/dist/search/engines/bing-news.d.ts.map +1 -0
- package/dist/search/engines/bing-news.js +97 -0
- package/dist/search/engines/bing-news.js.map +1 -0
- package/dist/search/engines/bing.d.ts +1 -0
- package/dist/search/engines/bing.d.ts.map +1 -1
- package/dist/search/engines/bing.js +100 -44
- package/dist/search/engines/bing.js.map +1 -1
- package/dist/search/engines/devdocs.d.ts +6 -0
- package/dist/search/engines/devdocs.d.ts.map +1 -0
- package/dist/search/engines/devdocs.js +56 -0
- package/dist/search/engines/devdocs.js.map +1 -0
- package/dist/search/engines/duckduckgo.d.ts.map +1 -1
- package/dist/search/engines/duckduckgo.js +56 -44
- package/dist/search/engines/duckduckgo.js.map +1 -1
- package/dist/search/engines/github-code.d.ts +7 -0
- package/dist/search/engines/github-code.d.ts.map +1 -0
- package/dist/search/engines/github-code.js +55 -0
- package/dist/search/engines/github-code.js.map +1 -0
- package/dist/search/engines/hn-algolia.d.ts +7 -0
- package/dist/search/engines/hn-algolia.d.ts.map +1 -0
- package/dist/search/engines/hn-algolia.js +76 -0
- package/dist/search/engines/hn-algolia.js.map +1 -0
- package/dist/search/engines/lobsters.d.ts +7 -0
- package/dist/search/engines/lobsters.d.ts.map +1 -0
- package/dist/search/engines/lobsters.js +83 -0
- package/dist/search/engines/lobsters.js.map +1 -0
- package/dist/search/engines/mdn.d.ts +7 -0
- package/dist/search/engines/mdn.d.ts.map +1 -0
- package/dist/search/engines/mdn.js +48 -0
- package/dist/search/engines/mdn.js.map +1 -0
- package/dist/search/engines/semantic-scholar.d.ts +7 -0
- package/dist/search/engines/semantic-scholar.d.ts.map +1 -0
- package/dist/search/engines/semantic-scholar.js +69 -0
- package/dist/search/engines/semantic-scholar.js.map +1 -0
- package/dist/search/engines/stackoverflow.d.ts +7 -0
- package/dist/search/engines/stackoverflow.d.ts.map +1 -0
- package/dist/search/engines/stackoverflow.js +73 -0
- package/dist/search/engines/stackoverflow.js.map +1 -0
- package/dist/search/engines/startpage.d.ts.map +1 -1
- package/dist/search/engines/startpage.js +65 -46
- package/dist/search/engines/startpage.js.map +1 -1
- package/dist/search/evidence.d.ts +25 -0
- package/dist/search/evidence.d.ts.map +1 -0
- package/dist/search/evidence.js +220 -0
- package/dist/search/evidence.js.map +1 -0
- package/dist/search/filters.js +49 -55
- package/dist/search/filters.js.map +1 -1
- package/dist/search/find-similar/crawl-rank.d.ts +9 -0
- package/dist/search/find-similar/crawl-rank.d.ts.map +1 -0
- package/dist/search/find-similar/crawl-rank.js +272 -0
- package/dist/search/find-similar/crawl-rank.js.map +1 -0
- package/dist/search/find-similar/mode.d.ts +4 -0
- package/dist/search/find-similar/mode.d.ts.map +1 -0
- package/dist/search/find-similar/mode.js +12 -0
- package/dist/search/find-similar/mode.js.map +1 -0
- package/dist/search/find-similar.d.ts +5 -0
- package/dist/search/find-similar.d.ts.map +1 -0
- package/dist/search/find-similar.js +509 -0
- package/dist/search/find-similar.js.map +1 -0
- package/dist/search/highlights.d.ts +19 -0
- package/dist/search/highlights.d.ts.map +1 -0
- package/dist/search/highlights.js +167 -0
- package/dist/search/highlights.js.map +1 -0
- package/dist/search/language-filter.d.ts +29 -0
- package/dist/search/language-filter.d.ts.map +1 -0
- package/dist/search/language-filter.js +126 -0
- package/dist/search/language-filter.js.map +1 -0
- package/dist/search/legacy/searxng-orchestrator.d.ts +4 -0
- package/dist/search/legacy/searxng-orchestrator.d.ts.map +1 -0
- package/dist/search/legacy/searxng-orchestrator.js +501 -0
- package/dist/search/legacy/searxng-orchestrator.js.map +1 -0
- package/dist/search/legacy/searxng-provider.d.ts +7 -0
- package/dist/search/legacy/searxng-provider.d.ts.map +1 -0
- package/dist/search/legacy/searxng-provider.js +11 -0
- package/dist/search/legacy/searxng-provider.js.map +1 -0
- package/dist/search/multi-query.d.ts +25 -0
- package/dist/search/multi-query.d.ts.map +1 -0
- package/dist/search/multi-query.js +228 -0
- package/dist/search/multi-query.js.map +1 -0
- package/dist/search/query.js +32 -34
- package/dist/search/query.js.map +1 -1
- package/dist/search/rerank.d.ts +3 -1
- package/dist/search/rerank.d.ts.map +1 -1
- package/dist/search/rerank.js +44 -35
- package/dist/search/rerank.js.map +1 -1
- package/dist/search/reranker/authority-boost.d.ts +3 -0
- package/dist/search/reranker/authority-boost.d.ts.map +1 -0
- package/dist/search/reranker/authority-boost.js +179 -0
- package/dist/search/reranker/authority-boost.js.map +1 -0
- package/dist/search/reranker/consensus-boost.d.ts +3 -0
- package/dist/search/reranker/consensus-boost.d.ts.map +1 -0
- package/dist/search/reranker/consensus-boost.js +27 -0
- package/dist/search/reranker/consensus-boost.js.map +1 -0
- package/dist/search/reranker/recency-boost.d.ts +3 -0
- package/dist/search/reranker/recency-boost.d.ts.map +1 -0
- package/dist/search/reranker/recency-boost.js +13 -0
- package/dist/search/reranker/recency-boost.js.map +1 -0
- package/dist/search/reranker/recency.d.ts +3 -0
- package/dist/search/reranker/recency.d.ts.map +1 -0
- package/dist/search/reranker/recency.js +23 -0
- package/dist/search/reranker/recency.js.map +1 -0
- package/dist/search/reranker/transformers-rerank-provider.d.ts +12 -0
- package/dist/search/reranker/transformers-rerank-provider.d.ts.map +1 -0
- package/dist/search/reranker/transformers-rerank-provider.js +78 -0
- package/dist/search/reranker/transformers-rerank-provider.js.map +1 -0
- package/dist/search/rrf.d.ts +17 -0
- package/dist/search/rrf.d.ts.map +1 -0
- package/dist/search/rrf.js +39 -0
- package/dist/search/rrf.js.map +1 -0
- package/dist/search/sampling.d.ts +25 -0
- package/dist/search/sampling.d.ts.map +1 -0
- package/dist/search/sampling.js +52 -0
- package/dist/search/sampling.js.map +1 -0
- package/dist/search/searxng.d.ts.map +1 -1
- package/dist/search/searxng.js +69 -79
- package/dist/search/searxng.js.map +1 -1
- package/dist/search/tokens.d.ts +3 -0
- package/dist/search/tokens.d.ts.map +1 -0
- package/dist/search/tokens.js +39 -0
- package/dist/search/tokens.js.map +1 -0
- package/dist/search/truncate.d.ts +6 -0
- package/dist/search/truncate.d.ts.map +1 -0
- package/dist/search/truncate.js +26 -0
- package/dist/search/truncate.js.map +1 -0
- package/dist/search/url-unwrap.d.ts +3 -0
- package/dist/search/url-unwrap.d.ts.map +1 -0
- package/dist/search/url-unwrap.js +43 -0
- package/dist/search/url-unwrap.js.map +1 -0
- package/dist/search/v1/context-rank.d.ts +13 -0
- package/dist/search/v1/context-rank.d.ts.map +1 -0
- package/dist/search/v1/context-rank.js +74 -0
- package/dist/search/v1/context-rank.js.map +1 -0
- package/dist/search/v1/engine-base.d.ts +27 -0
- package/dist/search/v1/engine-base.d.ts.map +1 -0
- package/dist/search/v1/engine-base.js +110 -0
- package/dist/search/v1/engine-base.js.map +1 -0
- package/dist/search/v1/intent-router.d.ts +22 -0
- package/dist/search/v1/intent-router.d.ts.map +1 -0
- package/dist/search/v1/intent-router.js +138 -0
- package/dist/search/v1/intent-router.js.map +1 -0
- package/dist/search/v1/orchestrator.d.ts +24 -0
- package/dist/search/v1/orchestrator.d.ts.map +1 -0
- package/dist/search/v1/orchestrator.js +163 -0
- package/dist/search/v1/orchestrator.js.map +1 -0
- package/dist/search/v1/recency-boost.d.ts +9 -0
- package/dist/search/v1/recency-boost.d.ts.map +1 -0
- package/dist/search/v1/recency-boost.js +37 -0
- package/dist/search/v1/recency-boost.js.map +1 -0
- package/dist/search/v1/recent-cache-dedup.d.ts +6 -0
- package/dist/search/v1/recent-cache-dedup.d.ts.map +1 -0
- package/dist/search/v1/recent-cache-dedup.js +85 -0
- package/dist/search/v1/recent-cache-dedup.js.map +1 -0
- package/dist/search/v1/rss/feed-config.d.ts +21 -0
- package/dist/search/v1/rss/feed-config.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-config.js +90 -0
- package/dist/search/v1/rss/feed-config.js.map +1 -0
- package/dist/search/v1/rss/feed-parser.d.ts +14 -0
- package/dist/search/v1/rss/feed-parser.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-parser.js +104 -0
- package/dist/search/v1/rss/feed-parser.js.map +1 -0
- package/dist/search/v1/rss/feed-poller.d.ts +22 -0
- package/dist/search/v1/rss/feed-poller.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-poller.js +102 -0
- package/dist/search/v1/rss/feed-poller.js.map +1 -0
- package/dist/search/v1/rss/feed-store.d.ts +30 -0
- package/dist/search/v1/rss/feed-store.d.ts.map +1 -0
- package/dist/search/v1/rss/feed-store.js +134 -0
- package/dist/search/v1/rss/feed-store.js.map +1 -0
- package/dist/search/v1/rss/rss-engine.d.ts +6 -0
- package/dist/search/v1/rss/rss-engine.d.ts.map +1 -0
- package/dist/search/v1/rss/rss-engine.js +28 -0
- package/dist/search/v1/rss/rss-engine.js.map +1 -0
- package/dist/search/v1/v1-provider.d.ts +7 -0
- package/dist/search/v1/v1-provider.d.ts.map +1 -0
- package/dist/search/v1/v1-provider.js +68 -0
- package/dist/search/v1/v1-provider.js.map +1 -0
- package/dist/search/v1/verticals/code.d.ts +4 -0
- package/dist/search/v1/verticals/code.d.ts.map +1 -0
- package/dist/search/v1/verticals/code.js +20 -0
- package/dist/search/v1/verticals/code.js.map +1 -0
- package/dist/search/v1/verticals/docs.d.ts +4 -0
- package/dist/search/v1/verticals/docs.d.ts.map +1 -0
- package/dist/search/v1/verticals/docs.js +20 -0
- package/dist/search/v1/verticals/docs.js.map +1 -0
- package/dist/search/v1/verticals/general.d.ts +4 -0
- package/dist/search/v1/verticals/general.d.ts.map +1 -0
- package/dist/search/v1/verticals/general.js +22 -0
- package/dist/search/v1/verticals/general.js.map +1 -0
- package/dist/search/v1/verticals/news.d.ts +10 -0
- package/dist/search/v1/verticals/news.d.ts.map +1 -0
- package/dist/search/v1/verticals/news.js +52 -0
- package/dist/search/v1/verticals/news.js.map +1 -0
- package/dist/search/v1/verticals/papers.d.ts +4 -0
- package/dist/search/v1/verticals/papers.d.ts.map +1 -0
- package/dist/search/v1/verticals/papers.js +23 -0
- package/dist/search/v1/verticals/papers.js.map +1 -0
- package/dist/search/validator.js +31 -31
- package/dist/search/validator.js.map +1 -1
- package/dist/searxng/bootstrap.d.ts +30 -0
- package/dist/searxng/bootstrap.d.ts.map +1 -1
- package/dist/searxng/bootstrap.js +223 -85
- package/dist/searxng/bootstrap.js.map +1 -1
- package/dist/searxng/docker.d.ts.map +1 -1
- package/dist/searxng/docker.js +69 -60
- package/dist/searxng/docker.js.map +1 -1
- package/dist/searxng/process.d.ts +13 -1
- package/dist/searxng/process.d.ts.map +1 -1
- package/dist/searxng/process.js +231 -164
- package/dist/searxng/process.js.map +1 -1
- package/dist/server/backend-status.d.ts +13 -0
- package/dist/server/backend-status.d.ts.map +1 -0
- package/dist/server/backend-status.js +40 -0
- package/dist/server/backend-status.js.map +1 -0
- package/dist/server/tool-schemas.d.ts +549 -0
- package/dist/server/tool-schemas.d.ts.map +1 -0
- package/dist/server/tool-schemas.js +464 -0
- package/dist/server/tool-schemas.js.map +1 -0
- package/dist/server/warmup-on-start.d.ts +9 -0
- package/dist/server/warmup-on-start.d.ts.map +1 -0
- package/dist/server/warmup-on-start.js +55 -0
- package/dist/server/warmup-on-start.js.map +1 -0
- package/dist/server.d.ts +17 -0
- package/dist/server.d.ts.map +1 -1
- package/dist/server.js +454 -297
- package/dist/server.js.map +1 -1
- package/dist/tools/agent.d.ts +5 -0
- package/dist/tools/agent.d.ts.map +1 -0
- package/dist/tools/agent.js +128 -0
- package/dist/tools/agent.js.map +1 -0
- package/dist/tools/cache.d.ts +2 -1
- package/dist/tools/cache.d.ts.map +1 -1
- package/dist/tools/cache.js +175 -44
- package/dist/tools/cache.js.map +1 -1
- package/dist/tools/crawl.d.ts.map +1 -1
- package/dist/tools/crawl.js +171 -88
- package/dist/tools/crawl.js.map +1 -1
- package/dist/tools/extract.d.ts +2 -2
- package/dist/tools/extract.d.ts.map +1 -1
- package/dist/tools/extract.js +175 -59
- package/dist/tools/extract.js.map +1 -1
- package/dist/tools/fetch.d.ts +2 -2
- package/dist/tools/fetch.d.ts.map +1 -1
- package/dist/tools/fetch.js +161 -68
- package/dist/tools/fetch.js.map +1 -1
- package/dist/tools/find-similar.d.ts +5 -0
- package/dist/tools/find-similar.d.ts.map +1 -0
- package/dist/tools/find-similar.js +127 -0
- package/dist/tools/find-similar.js.map +1 -0
- package/dist/tools/research.d.ts +5 -0
- package/dist/tools/research.d.ts.map +1 -0
- package/dist/tools/research.js +107 -0
- package/dist/tools/research.js.map +1 -0
- package/dist/tools/search.d.ts +10 -2
- package/dist/tools/search.d.ts.map +1 -1
- package/dist/tools/search.js +13 -158
- package/dist/tools/search.js.map +1 -1
- package/dist/types.d.ts +350 -7
- package/dist/types.d.ts.map +1 -1
- package/dist/types.js +6 -1
- package/dist/types.js.map +1 -1
- package/dist/util/mode.d.ts +4 -0
- package/dist/util/mode.d.ts.map +1 -0
- package/dist/util/mode.js +34 -0
- package/dist/util/mode.js.map +1 -0
- package/package.json +78 -8
- package/dist/extraction/trafilatura.d.ts +0 -6
- package/dist/extraction/trafilatura.d.ts.map +0 -1
- package/dist/extraction/trafilatura.js +0 -105
- package/dist/extraction/trafilatura.js.map +0 -1
- package/dist/search/flashrank.d.ts +0 -12
- package/dist/search/flashrank.d.ts.map +0 -1
- package/dist/search/flashrank.js +0 -63
- package/dist/search/flashrank.js.map +0 -1
|
@@ -0,0 +1,110 @@
|
|
|
1
|
+
import { parseHTML } from "linkedom";
|
|
2
|
+
import { extractJsonLd } from "../jsonld.js";
|
|
3
|
+
const JSONLD_TYPE_MAP = {
|
|
4
|
+
recipe: "recipe",
|
|
5
|
+
product: "product",
|
|
6
|
+
newsarticle: "news",
|
|
7
|
+
article: "news",
|
|
8
|
+
blogposting: "news",
|
|
9
|
+
question: "code",
|
|
10
|
+
answer: "code",
|
|
11
|
+
qapage: "code",
|
|
12
|
+
techarticle: "docs",
|
|
13
|
+
apireference: "docs"
|
|
14
|
+
};
|
|
15
|
+
const OG_TYPE_MAP = {
|
|
16
|
+
article: "news",
|
|
17
|
+
product: "product",
|
|
18
|
+
recipe: "recipe"
|
|
19
|
+
};
|
|
20
|
+
const DOCS_PATH_PREFIXES = ["/docs/", "/documentation/", "/reference/", "/api/"];
|
|
21
|
+
function classifyContent(url, html) {
|
|
22
|
+
const fromJsonLd = classifyByJsonLd(html);
|
|
23
|
+
if (fromJsonLd) return fromJsonLd;
|
|
24
|
+
const { document } = parseHTML(html || "<html></html>");
|
|
25
|
+
const fromOg = classifyByOgType(document);
|
|
26
|
+
if (fromOg) return fromOg;
|
|
27
|
+
const fromHost = classifyByUrl(url);
|
|
28
|
+
if (fromHost) return fromHost;
|
|
29
|
+
const fromBody = classifyByBody(document);
|
|
30
|
+
if (fromBody) return fromBody;
|
|
31
|
+
return "generic";
|
|
32
|
+
}
|
|
33
|
+
function classifyByJsonLd(html) {
|
|
34
|
+
if (!html) return null;
|
|
35
|
+
const blocks = extractJsonLd(html);
|
|
36
|
+
for (const block of blocks) {
|
|
37
|
+
const mapped = mapJsonLdType(block["@type"]);
|
|
38
|
+
if (mapped) return mapped;
|
|
39
|
+
}
|
|
40
|
+
return null;
|
|
41
|
+
}
|
|
42
|
+
function mapJsonLdType(raw) {
|
|
43
|
+
if (typeof raw === "string") {
|
|
44
|
+
return JSONLD_TYPE_MAP[normalizeType(raw)] ?? null;
|
|
45
|
+
}
|
|
46
|
+
if (Array.isArray(raw)) {
|
|
47
|
+
for (const entry of raw) {
|
|
48
|
+
if (typeof entry !== "string") continue;
|
|
49
|
+
const mapped = JSONLD_TYPE_MAP[normalizeType(entry)];
|
|
50
|
+
if (mapped) return mapped;
|
|
51
|
+
}
|
|
52
|
+
}
|
|
53
|
+
return null;
|
|
54
|
+
}
|
|
55
|
+
function normalizeType(raw) {
|
|
56
|
+
const tail = raw.split(/[/#:]/).pop() ?? raw;
|
|
57
|
+
return tail.toLowerCase();
|
|
58
|
+
}
|
|
59
|
+
function classifyByOgType(document) {
|
|
60
|
+
const meta = document.querySelector('meta[property="og:type"]');
|
|
61
|
+
const content = meta?.getAttribute("content")?.trim().toLowerCase();
|
|
62
|
+
if (!content) return null;
|
|
63
|
+
return OG_TYPE_MAP[content] ?? null;
|
|
64
|
+
}
|
|
65
|
+
function classifyByUrl(url) {
|
|
66
|
+
let parsed;
|
|
67
|
+
try {
|
|
68
|
+
parsed = new URL(url);
|
|
69
|
+
} catch {
|
|
70
|
+
return null;
|
|
71
|
+
}
|
|
72
|
+
const host = parsed.hostname.toLowerCase();
|
|
73
|
+
const path = parsed.pathname.toLowerCase();
|
|
74
|
+
if (host === "github.com" || host === "gist.github.com" || host.endsWith(".github.com")) {
|
|
75
|
+
return "code";
|
|
76
|
+
}
|
|
77
|
+
if (host === "stackoverflow.com" || host.endsWith(".stackoverflow.com")) {
|
|
78
|
+
return "code";
|
|
79
|
+
}
|
|
80
|
+
if (host.endsWith(".stackexchange.com") || host === "stackexchange.com") {
|
|
81
|
+
return "code";
|
|
82
|
+
}
|
|
83
|
+
if (host === "developer.mozilla.org" || host === "devdocs.io") {
|
|
84
|
+
return "docs";
|
|
85
|
+
}
|
|
86
|
+
if (host.startsWith("docs.")) {
|
|
87
|
+
return "docs";
|
|
88
|
+
}
|
|
89
|
+
if (DOCS_PATH_PREFIXES.some((prefix) => path.startsWith(prefix))) {
|
|
90
|
+
return "docs";
|
|
91
|
+
}
|
|
92
|
+
return null;
|
|
93
|
+
}
|
|
94
|
+
function classifyByBody(document) {
|
|
95
|
+
const itemtypeNodes = document.querySelectorAll("[itemtype]");
|
|
96
|
+
for (const node of itemtypeNodes) {
|
|
97
|
+
const itemtype = node.getAttribute("itemtype")?.toLowerCase() ?? "";
|
|
98
|
+
if (itemtype.includes("recipe")) return "recipe";
|
|
99
|
+
if (itemtype.includes("product")) return "product";
|
|
100
|
+
}
|
|
101
|
+
const article = document.querySelector("article");
|
|
102
|
+
if (article && article.querySelector("time[datetime]")) {
|
|
103
|
+
return "news";
|
|
104
|
+
}
|
|
105
|
+
return null;
|
|
106
|
+
}
|
|
107
|
+
export {
|
|
108
|
+
classifyContent
|
|
109
|
+
};
|
|
110
|
+
//# sourceMappingURL=classifier.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../../src/extraction/v1/classifier.ts"],"sourcesContent":["import { parseHTML } from 'linkedom';\nimport { extractJsonLd } from '../jsonld.js';\n\nexport type ContentType = 'news' | 'recipe' | 'product' | 'code' | 'docs' | 'generic';\n\nconst JSONLD_TYPE_MAP: Record<string, ContentType> = {\n recipe: 'recipe',\n product: 'product',\n newsarticle: 'news',\n article: 'news',\n blogposting: 'news',\n question: 'code',\n answer: 'code',\n qapage: 'code',\n techarticle: 'docs',\n apireference: 'docs',\n};\n\nconst OG_TYPE_MAP: Record<string, ContentType> = {\n article: 'news',\n product: 'product',\n recipe: 'recipe',\n};\n\nconst DOCS_PATH_PREFIXES = ['/docs/', '/documentation/', '/reference/', '/api/'];\n\nexport function classifyContent(url: string, html: string): ContentType {\n const fromJsonLd = classifyByJsonLd(html);\n if (fromJsonLd) return fromJsonLd;\n\n const { document } = parseHTML(html || '<html></html>');\n\n const fromOg = classifyByOgType(document);\n if (fromOg) return fromOg;\n\n const fromHost = classifyByUrl(url);\n if (fromHost) return fromHost;\n\n const fromBody = classifyByBody(document);\n if (fromBody) return fromBody;\n\n return 'generic';\n}\n\nfunction classifyByJsonLd(html: string): ContentType | null {\n if (!html) return null;\n const blocks = extractJsonLd(html);\n for (const block of blocks) {\n const mapped = mapJsonLdType(block['@type']);\n if (mapped) return mapped;\n }\n return null;\n}\n\nfunction mapJsonLdType(raw: unknown): ContentType | null {\n if (typeof raw === 'string') {\n return JSONLD_TYPE_MAP[normalizeType(raw)] ?? null;\n }\n if (Array.isArray(raw)) {\n for (const entry of raw) {\n if (typeof entry !== 'string') continue;\n const mapped = JSONLD_TYPE_MAP[normalizeType(entry)];\n if (mapped) return mapped;\n }\n }\n return null;\n}\n\nfunction normalizeType(raw: string): string {\n // Accept \"Recipe\", \"schema:Recipe\", \"http://schema.org/Recipe\", etc.\n const tail = raw.split(/[/#:]/).pop() ?? raw;\n return tail.toLowerCase();\n}\n\nfunction classifyByOgType(document: Document): ContentType | null {\n const meta = document.querySelector('meta[property=\"og:type\"]');\n const content = meta?.getAttribute('content')?.trim().toLowerCase();\n if (!content) return null;\n return OG_TYPE_MAP[content] ?? null;\n}\n\nfunction classifyByUrl(url: string): ContentType | null {\n let parsed: URL;\n try {\n parsed = new URL(url);\n } catch {\n return null;\n }\n\n const host = parsed.hostname.toLowerCase();\n const path = parsed.pathname.toLowerCase();\n\n if (host === 'github.com' || host === 'gist.github.com' || host.endsWith('.github.com')) {\n return 'code';\n }\n if (host === 'stackoverflow.com' || host.endsWith('.stackoverflow.com')) {\n return 'code';\n }\n if (host.endsWith('.stackexchange.com') || host === 'stackexchange.com') {\n return 'code';\n }\n\n if (host === 'developer.mozilla.org' || host === 'devdocs.io') {\n return 'docs';\n }\n if (host.startsWith('docs.')) {\n return 'docs';\n }\n if (DOCS_PATH_PREFIXES.some((prefix) => path.startsWith(prefix))) {\n return 'docs';\n }\n\n return null;\n}\n\nfunction classifyByBody(document: Document): ContentType | null {\n const itemtypeNodes = document.querySelectorAll('[itemtype]');\n for (const node of itemtypeNodes) {\n const itemtype = node.getAttribute('itemtype')?.toLowerCase() ?? '';\n if (itemtype.includes('recipe')) return 'recipe';\n if (itemtype.includes('product')) return 'product';\n }\n\n const article = document.querySelector('article');\n if (article && article.querySelector('time[datetime]')) {\n return 'news';\n }\n\n return null;\n}\n"],"mappings":"AAAA,SAAS,iBAAiB;AAC1B,SAAS,qBAAqB;AAI9B,MAAM,kBAA+C;AAAA,EACnD,QAAQ;AAAA,EACR,SAAS;AAAA,EACT,aAAa;AAAA,EACb,SAAS;AAAA,EACT,aAAa;AAAA,EACb,UAAU;AAAA,EACV,QAAQ;AAAA,EACR,QAAQ;AAAA,EACR,aAAa;AAAA,EACb,cAAc;AAChB;AAEA,MAAM,cAA2C;AAAA,EAC/C,SAAS;AAAA,EACT,SAAS;AAAA,EACT,QAAQ;AACV;AAEA,MAAM,qBAAqB,CAAC,UAAU,mBAAmB,eAAe,OAAO;AAExE,SAAS,gBAAgB,KAAa,MAA2B;AACtE,QAAM,aAAa,iBAAiB,IAAI;AACxC,MAAI,WAAY,QAAO;AAEvB,QAAM,EAAE,SAAS,IAAI,UAAU,QAAQ,eAAe;AAEtD,QAAM,SAAS,iBAAiB,QAAQ;AACxC,MAAI,OAAQ,QAAO;AAEnB,QAAM,WAAW,cAAc,GAAG;AAClC,MAAI,SAAU,QAAO;AAErB,QAAM,WAAW,eAAe,QAAQ;AACxC,MAAI,SAAU,QAAO;AAErB,SAAO;AACT;AAEA,SAAS,iBAAiB,MAAkC;AAC1D,MAAI,CAAC,KAAM,QAAO;AAClB,QAAM,SAAS,cAAc,IAAI;AACjC,aAAW,SAAS,QAAQ;AAC1B,UAAM,SAAS,cAAc,MAAM,OAAO,CAAC;AAC3C,QAAI,OAAQ,QAAO;AAAA,EACrB;AACA,SAAO;AACT;AAEA,SAAS,cAAc,KAAkC;AACvD,MAAI,OAAO,QAAQ,UAAU;AAC3B,WAAO,gBAAgB,cAAc,GAAG,CAAC,KAAK;AAAA,EAChD;AACA,MAAI,MAAM,QAAQ,GAAG,GAAG;AACtB,eAAW,SAAS,KAAK;AACvB,UAAI,OAAO,UAAU,SAAU;AAC/B,YAAM,SAAS,gBAAgB,cAAc,KAAK,CAAC;AACnD,UAAI,OAAQ,QAAO;AAAA,IACrB;AAAA,EACF;AACA,SAAO;AACT;AAEA,SAAS,cAAc,KAAqB;AAE1C,QAAM,OAAO,IAAI,MAAM,OAAO,EAAE,IAAI,KAAK;AACzC,SAAO,KAAK,YAAY;AAC1B;AAEA,SAAS,iBAAiB,UAAwC;AAChE,QAAM,OAAO,SAAS,cAAc,0BAA0B;AAC9D,QAAM,UAAU,MAAM,aAAa,SAAS,GAAG,KAAK,EAAE,YAAY;AAClE,MAAI,CAAC,QAAS,QAAO;AACrB,SAAO,YAAY,OAAO,KAAK;AACjC;AAEA,SAAS,cAAc,KAAiC;AACtD,MAAI;AACJ,MAAI;AACF,aAAS,IAAI,IAAI,GAAG;AAAA,EACtB,QAAQ;AACN,WAAO;AAAA,EACT;AAEA,QAAM,OAAO,OAAO,SAAS,YAAY;AACzC,QAAM,OAAO,OAAO,SAAS,YAAY;AAEzC,MAAI,SAAS,gBAAgB,SAAS,qBAAqB,KAAK,SAAS,aAAa,GAAG;AACvF,WAAO;AAAA,EACT;AACA,MAAI,SAAS,uBAAuB,KAAK,SAAS,oBAAoB,GAAG;AACvE,WAAO;AAAA,EACT;AACA,MAAI,KAAK,SAAS,oBAAoB,KAAK,SAAS,qBAAqB;AACvE,WAAO;AAAA,EACT;AAEA,MAAI,SAAS,2BAA2B,SAAS,cAAc;AAC7D,WAAO;AAAA,EACT;AACA,MAAI,KAAK,WAAW,OAAO,GAAG;AAC5B,WAAO;AAAA,EACT;AACA,MAAI,mBAAmB,KAAK,CAAC,WAAW,KAAK,WAAW,MAAM,CAAC,GAAG;AAChE,WAAO;AAAA,EACT;AAEA,SAAO;AACT;AAEA,SAAS,eAAe,UAAwC;AAC9D,QAAM,gBAAgB,SAAS,iBAAiB,YAAY;AAC5D,aAAW,QAAQ,eAAe;AAChC,UAAM,WAAW,KAAK,aAAa,UAAU,GAAG,YAAY,KAAK;AACjE,QAAI,SAAS,SAAS,QAAQ,EAAG,QAAO;AACxC,QAAI,SAAS,SAAS,SAAS,EAAG,QAAO;AAAA,EAC3C;AAEA,QAAM,UAAU,SAAS,cAAc,SAAS;AAChD,MAAI,WAAW,QAAQ,cAAc,gBAAgB,GAAG;AACtD,WAAO;AAAA,EACT;AAEA,SAAO;AACT;","names":[]}
|
|
@@ -0,0 +1,16 @@
|
|
|
1
|
+
import type { ExtractProvider, ExtractProviderOptions } from '../../providers/extract-provider.js';
|
|
2
|
+
import type { ExtractionResult } from '../../types.js';
|
|
3
|
+
/**
|
|
4
|
+
* V1 extract provider — wires the classifier + category extractors via the
|
|
5
|
+
* routed pipeline, then applies the legacy post-processing (URL resolution,
|
|
6
|
+
* boilerplate stripping, sanitization, section selection, link/image
|
|
7
|
+
* extraction, metadata merging, max_chars truncation) to preserve output
|
|
8
|
+
* parity with the legacy provider.
|
|
9
|
+
*
|
|
10
|
+
* PDF handling is kept inline (small enough) and matches legacy semantics.
|
|
11
|
+
*/
|
|
12
|
+
export declare class V1Extractor implements ExtractProvider {
|
|
13
|
+
readonly name: "v1";
|
|
14
|
+
extract(html: string, url: string, options?: ExtractProviderOptions): Promise<ExtractionResult>;
|
|
15
|
+
}
|
|
16
|
+
//# sourceMappingURL=extract-provider.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"extract-provider.d.ts","sourceRoot":"","sources":["../../../src/extraction/v1/extract-provider.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EACV,eAAe,EACf,sBAAsB,EACvB,MAAM,qCAAqC,CAAC;AAC7C,OAAO,KAAK,EAAE,gBAAgB,EAAE,MAAM,gBAAgB,CAAC;AAOvD;;;;;;;;GAQG;AACH,qBAAa,WAAY,YAAW,eAAe;IACjD,QAAQ,CAAC,IAAI,EAAG,IAAI,CAAU;IAExB,OAAO,CACX,IAAI,EAAE,MAAM,EACZ,GAAG,EAAE,MAAM,EACX,OAAO,GAAE,sBAA2B,GACnC,OAAO,CAAC,gBAAgB,CAAC;CAc7B"}
|
|
@@ -0,0 +1,43 @@
|
|
|
1
|
+
import { routedExtract } from "./routed.js";
|
|
2
|
+
import { applyPostProcessing } from "../pipeline.js";
|
|
3
|
+
import { createLogger } from "../../logger.js";
|
|
4
|
+
const log = createLogger("extract");
|
|
5
|
+
class V1Extractor {
|
|
6
|
+
name = "v1";
|
|
7
|
+
async extract(html, url, options = {}) {
|
|
8
|
+
if (options.contentType === "application/pdf") {
|
|
9
|
+
const pdf = await handlePdf(html, url, options);
|
|
10
|
+
return applyPostProcessing(pdf, url, html, options);
|
|
11
|
+
}
|
|
12
|
+
const base = await routedExtract({
|
|
13
|
+
html,
|
|
14
|
+
url,
|
|
15
|
+
contentType: options.contentType
|
|
16
|
+
});
|
|
17
|
+
return applyPostProcessing(base, url, html, options);
|
|
18
|
+
}
|
|
19
|
+
}
|
|
20
|
+
async function handlePdf(_html, url, options) {
|
|
21
|
+
let pdfText = "";
|
|
22
|
+
if (options.pdfBuffer) {
|
|
23
|
+
try {
|
|
24
|
+
const pdfParse = (await import("pdf-parse")).default;
|
|
25
|
+
const parsed = await pdfParse(options.pdfBuffer);
|
|
26
|
+
pdfText = parsed.text ?? "";
|
|
27
|
+
} catch (err) {
|
|
28
|
+
log.warn("pdf-parse failed", { url, error: String(err) });
|
|
29
|
+
}
|
|
30
|
+
}
|
|
31
|
+
return {
|
|
32
|
+
title: "",
|
|
33
|
+
markdown: pdfText,
|
|
34
|
+
metadata: {},
|
|
35
|
+
links: [],
|
|
36
|
+
images: [],
|
|
37
|
+
extractor: "turndown"
|
|
38
|
+
};
|
|
39
|
+
}
|
|
40
|
+
export {
|
|
41
|
+
V1Extractor
|
|
42
|
+
};
|
|
43
|
+
//# sourceMappingURL=extract-provider.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../../src/extraction/v1/extract-provider.ts"],"sourcesContent":["import type {\n ExtractProvider,\n ExtractProviderOptions,\n} from '../../providers/extract-provider.js';\nimport type { ExtractionResult } from '../../types.js';\nimport { routedExtract } from './routed.js';\nimport { applyPostProcessing } from '../pipeline.js';\nimport { createLogger } from '../../logger.js';\n\nconst log = createLogger('extract');\n\n/**\n * V1 extract provider — wires the classifier + category extractors via the\n * routed pipeline, then applies the legacy post-processing (URL resolution,\n * boilerplate stripping, sanitization, section selection, link/image\n * extraction, metadata merging, max_chars truncation) to preserve output\n * parity with the legacy provider.\n *\n * PDF handling is kept inline (small enough) and matches legacy semantics.\n */\nexport class V1Extractor implements ExtractProvider {\n readonly name = 'v1' as const;\n\n async extract(\n html: string,\n url: string,\n options: ExtractProviderOptions = {},\n ): Promise<ExtractionResult> {\n if (options.contentType === 'application/pdf') {\n const pdf = await handlePdf(html, url, options);\n return applyPostProcessing(pdf, url, html, options);\n }\n\n const base = await routedExtract({\n html,\n url,\n contentType: options.contentType,\n });\n\n return applyPostProcessing(base, url, html, options);\n }\n}\n\nasync function handlePdf(\n _html: string,\n url: string,\n options: ExtractProviderOptions,\n): Promise<ExtractionResult> {\n let pdfText = '';\n if (options.pdfBuffer) {\n try {\n const pdfParse = (await import('pdf-parse')).default;\n const parsed = await pdfParse(options.pdfBuffer);\n pdfText = parsed.text ?? '';\n } catch (err) {\n log.warn('pdf-parse failed', { url, error: String(err) });\n }\n }\n return {\n title: '',\n markdown: pdfText,\n metadata: {},\n links: [],\n images: [],\n extractor: 'turndown',\n };\n}\n"],"mappings":"AAKA,SAAS,qBAAqB;AAC9B,SAAS,2BAA2B;AACpC,SAAS,oBAAoB;AAE7B,MAAM,MAAM,aAAa,SAAS;AAW3B,MAAM,YAAuC;AAAA,EACzC,OAAO;AAAA,EAEhB,MAAM,QACJ,MACA,KACA,UAAkC,CAAC,GACR;AAC3B,QAAI,QAAQ,gBAAgB,mBAAmB;AAC7C,YAAM,MAAM,MAAM,UAAU,MAAM,KAAK,OAAO;AAC9C,aAAO,oBAAoB,KAAK,KAAK,MAAM,OAAO;AAAA,IACpD;AAEA,UAAM,OAAO,MAAM,cAAc;AAAA,MAC/B;AAAA,MACA;AAAA,MACA,aAAa,QAAQ;AAAA,IACvB,CAAC;AAED,WAAO,oBAAoB,MAAM,KAAK,MAAM,OAAO;AAAA,EACrD;AACF;AAEA,eAAe,UACb,OACA,KACA,SAC2B;AAC3B,MAAI,UAAU;AACd,MAAI,QAAQ,WAAW;AACrB,QAAI;AACF,YAAM,YAAY,MAAM,OAAO,WAAW,GAAG;AAC7C,YAAM,SAAS,MAAM,SAAS,QAAQ,SAAS;AAC/C,gBAAU,OAAO,QAAQ;AAAA,IAC3B,SAAS,KAAK;AACZ,UAAI,KAAK,oBAAoB,EAAE,KAAK,OAAO,OAAO,GAAG,EAAE,CAAC;AAAA,IAC1D;AAAA,EACF;AACA,SAAO;AAAA,IACL,OAAO;AAAA,IACP,UAAU;AAAA,IACV,UAAU,CAAC;AAAA,IACX,OAAO,CAAC;AAAA,IACR,QAAQ,CAAC;AAAA,IACT,WAAW;AAAA,EACb;AACF;","names":[]}
|
|
@@ -0,0 +1,8 @@
|
|
|
1
|
+
export declare function isLocalLlmEnabled(): boolean;
|
|
2
|
+
export interface LocalLlmRequest {
|
|
3
|
+
schema: Record<string, unknown>;
|
|
4
|
+
html: string;
|
|
5
|
+
url: string;
|
|
6
|
+
}
|
|
7
|
+
export declare function extractWithLocalLlm(request: LocalLlmRequest): Promise<Record<string, unknown> | null>;
|
|
8
|
+
//# sourceMappingURL=local-llm.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"local-llm.d.ts","sourceRoot":"","sources":["../../../src/extraction/v1/local-llm.ts"],"names":[],"mappings":"AAOA,wBAAgB,iBAAiB,IAAI,OAAO,CAE3C;AAED,MAAM,WAAW,eAAe;IAC9B,MAAM,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;IAChC,IAAI,EAAE,MAAM,CAAC;IACb,GAAG,EAAE,MAAM,CAAC;CACb;AAED,wBAAsB,mBAAmB,CACvC,OAAO,EAAE,eAAe,GACvB,OAAO,CAAC,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI,CAAC,CA4DzC"}
|
|
@@ -0,0 +1,58 @@
|
|
|
1
|
+
import { createLogger } from "../../logger.js";
|
|
2
|
+
const log = createLogger("extract");
|
|
3
|
+
const MAX_HTML_CHARS = 5e4;
|
|
4
|
+
const REQUEST_TIMEOUT_MS = 3e4;
|
|
5
|
+
function isLocalLlmEnabled() {
|
|
6
|
+
return !!process.env["WIGOLO_LLM_PROVIDER"];
|
|
7
|
+
}
|
|
8
|
+
async function extractWithLocalLlm(request) {
|
|
9
|
+
if (!isLocalLlmEnabled()) return null;
|
|
10
|
+
const provider = process.env["WIGOLO_LLM_PROVIDER"];
|
|
11
|
+
const endpoint = provider.includes("/chat/completions") ? provider : provider.replace(/\/+$/, "") + "/v1/chat/completions";
|
|
12
|
+
const model = process.env["WIGOLO_LLM_MODEL"] ?? "local";
|
|
13
|
+
const htmlSlice = request.html.length > MAX_HTML_CHARS ? request.html.slice(0, MAX_HTML_CHARS) : request.html;
|
|
14
|
+
const prompt = `Extract data matching this JSON schema from the HTML. Return only valid JSON.
|
|
15
|
+
Schema: ${JSON.stringify(request.schema)}
|
|
16
|
+
URL: ${request.url}
|
|
17
|
+
HTML: ${htmlSlice}`;
|
|
18
|
+
const body = {
|
|
19
|
+
model,
|
|
20
|
+
messages: [{ role: "user", content: prompt }],
|
|
21
|
+
response_format: { type: "json_object" }
|
|
22
|
+
};
|
|
23
|
+
let response;
|
|
24
|
+
try {
|
|
25
|
+
response = await fetch(endpoint, {
|
|
26
|
+
method: "POST",
|
|
27
|
+
headers: { "content-type": "application/json" },
|
|
28
|
+
body: JSON.stringify(body),
|
|
29
|
+
signal: AbortSignal.timeout(REQUEST_TIMEOUT_MS)
|
|
30
|
+
});
|
|
31
|
+
} catch (err) {
|
|
32
|
+
log.error("local llm request failed", { error: String(err) });
|
|
33
|
+
throw err;
|
|
34
|
+
}
|
|
35
|
+
if (!response.ok) {
|
|
36
|
+
throw new Error(`Local LLM endpoint returned ${response.status}`);
|
|
37
|
+
}
|
|
38
|
+
const payload = await response.json();
|
|
39
|
+
const content = payload.choices?.[0]?.message?.content;
|
|
40
|
+
if (typeof content !== "string" || content.trim().length === 0) {
|
|
41
|
+
throw new Error("Local LLM response missing message content");
|
|
42
|
+
}
|
|
43
|
+
let parsed;
|
|
44
|
+
try {
|
|
45
|
+
parsed = JSON.parse(content);
|
|
46
|
+
} catch (err) {
|
|
47
|
+
throw new Error(`Local LLM returned invalid JSON: ${String(err)}`);
|
|
48
|
+
}
|
|
49
|
+
if (!parsed || typeof parsed !== "object" || Array.isArray(parsed)) {
|
|
50
|
+
throw new Error("Local LLM response is not a JSON object");
|
|
51
|
+
}
|
|
52
|
+
return parsed;
|
|
53
|
+
}
|
|
54
|
+
export {
|
|
55
|
+
extractWithLocalLlm,
|
|
56
|
+
isLocalLlmEnabled
|
|
57
|
+
};
|
|
58
|
+
//# sourceMappingURL=local-llm.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../../src/extraction/v1/local-llm.ts"],"sourcesContent":["import { createLogger } from '../../logger.js';\n\nconst log = createLogger('extract');\n\nconst MAX_HTML_CHARS = 50000;\nconst REQUEST_TIMEOUT_MS = 30_000;\n\nexport function isLocalLlmEnabled(): boolean {\n return !!process.env['WIGOLO_LLM_PROVIDER'];\n}\n\nexport interface LocalLlmRequest {\n schema: Record<string, unknown>;\n html: string;\n url: string;\n}\n\nexport async function extractWithLocalLlm(\n request: LocalLlmRequest,\n): Promise<Record<string, unknown> | null> {\n if (!isLocalLlmEnabled()) return null;\n\n const provider = process.env['WIGOLO_LLM_PROVIDER']!;\n const endpoint = provider.includes('/chat/completions')\n ? provider\n : provider.replace(/\\/+$/, '') + '/v1/chat/completions';\n const model = process.env['WIGOLO_LLM_MODEL'] ?? 'local';\n\n const htmlSlice = request.html.length > MAX_HTML_CHARS\n ? request.html.slice(0, MAX_HTML_CHARS)\n : request.html;\n\n const prompt =\n 'Extract data matching this JSON schema from the HTML. Return only valid JSON.\\n' +\n `Schema: ${JSON.stringify(request.schema)}\\n` +\n `URL: ${request.url}\\n` +\n `HTML: ${htmlSlice}`;\n\n const body = {\n model,\n messages: [{ role: 'user', content: prompt }],\n response_format: { type: 'json_object' },\n };\n\n let response: Response;\n try {\n response = await fetch(endpoint, {\n method: 'POST',\n headers: { 'content-type': 'application/json' },\n body: JSON.stringify(body),\n signal: AbortSignal.timeout(REQUEST_TIMEOUT_MS),\n });\n } catch (err) {\n log.error('local llm request failed', { error: String(err) });\n throw err;\n }\n\n if (!response.ok) {\n throw new Error(`Local LLM endpoint returned ${response.status}`);\n }\n\n const payload = (await response.json()) as {\n choices?: Array<{ message?: { content?: string } }>;\n };\n const content = payload.choices?.[0]?.message?.content;\n if (typeof content !== 'string' || content.trim().length === 0) {\n throw new Error('Local LLM response missing message content');\n }\n\n let parsed: unknown;\n try {\n parsed = JSON.parse(content);\n } catch (err) {\n throw new Error(`Local LLM returned invalid JSON: ${String(err)}`);\n }\n if (!parsed || typeof parsed !== 'object' || Array.isArray(parsed)) {\n throw new Error('Local LLM response is not a JSON object');\n }\n return parsed as Record<string, unknown>;\n}\n"],"mappings":"AAAA,SAAS,oBAAoB;AAE7B,MAAM,MAAM,aAAa,SAAS;AAElC,MAAM,iBAAiB;AACvB,MAAM,qBAAqB;AAEpB,SAAS,oBAA6B;AAC3C,SAAO,CAAC,CAAC,QAAQ,IAAI,qBAAqB;AAC5C;AAQA,eAAsB,oBACpB,SACyC;AACzC,MAAI,CAAC,kBAAkB,EAAG,QAAO;AAEjC,QAAM,WAAW,QAAQ,IAAI,qBAAqB;AAClD,QAAM,WAAW,SAAS,SAAS,mBAAmB,IAClD,WACA,SAAS,QAAQ,QAAQ,EAAE,IAAI;AACnC,QAAM,QAAQ,QAAQ,IAAI,kBAAkB,KAAK;AAEjD,QAAM,YAAY,QAAQ,KAAK,SAAS,iBACpC,QAAQ,KAAK,MAAM,GAAG,cAAc,IACpC,QAAQ;AAEZ,QAAM,SACJ;AAAA,UACW,KAAK,UAAU,QAAQ,MAAM,CAAC;AAAA,OACjC,QAAQ,GAAG;AAAA,QACV,SAAS;AAEpB,QAAM,OAAO;AAAA,IACX;AAAA,IACA,UAAU,CAAC,EAAE,MAAM,QAAQ,SAAS,OAAO,CAAC;AAAA,IAC5C,iBAAiB,EAAE,MAAM,cAAc;AAAA,EACzC;AAEA,MAAI;AACJ,MAAI;AACF,eAAW,MAAM,MAAM,UAAU;AAAA,MAC/B,QAAQ;AAAA,MACR,SAAS,EAAE,gBAAgB,mBAAmB;AAAA,MAC9C,MAAM,KAAK,UAAU,IAAI;AAAA,MACzB,QAAQ,YAAY,QAAQ,kBAAkB;AAAA,IAChD,CAAC;AAAA,EACH,SAAS,KAAK;AACZ,QAAI,MAAM,4BAA4B,EAAE,OAAO,OAAO,GAAG,EAAE,CAAC;AAC5D,UAAM;AAAA,EACR;AAEA,MAAI,CAAC,SAAS,IAAI;AAChB,UAAM,IAAI,MAAM,+BAA+B,SAAS,MAAM,EAAE;AAAA,EAClE;AAEA,QAAM,UAAW,MAAM,SAAS,KAAK;AAGrC,QAAM,UAAU,QAAQ,UAAU,CAAC,GAAG,SAAS;AAC/C,MAAI,OAAO,YAAY,YAAY,QAAQ,KAAK,EAAE,WAAW,GAAG;AAC9D,UAAM,IAAI,MAAM,4CAA4C;AAAA,EAC9D;AAEA,MAAI;AACJ,MAAI;AACF,aAAS,KAAK,MAAM,OAAO;AAAA,EAC7B,SAAS,KAAK;AACZ,UAAM,IAAI,MAAM,oCAAoC,OAAO,GAAG,CAAC,EAAE;AAAA,EACnE;AACA,MAAI,CAAC,UAAU,OAAO,WAAW,YAAY,MAAM,QAAQ,MAAM,GAAG;AAClE,UAAM,IAAI,MAAM,yCAAyC;AAAA,EAC3D;AACA,SAAO;AACT;","names":[]}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"news.d.ts","sourceRoot":"","sources":["../../../src/extraction/v1/news.ts"],"names":[],"mappings":"AAGA,OAAO,KAAK,EAAE,gBAAgB,EAAE,MAAM,gBAAgB,CAAC;AAWvD,wBAAsB,WAAW,CAAC,IAAI,EAAE,MAAM,EAAE,GAAG,EAAE,MAAM,GAAG,OAAO,CAAC,gBAAgB,GAAG,IAAI,CAAC,CAY7F"}
|
|
@@ -0,0 +1,61 @@
|
|
|
1
|
+
import { parseHTML } from "linkedom";
|
|
2
|
+
import { readabilityExtract } from "../readability.js";
|
|
3
|
+
import { extractJsonLd } from "../jsonld.js";
|
|
4
|
+
const META_DATE_SELECTORS = [
|
|
5
|
+
'meta[property="article:published_time"]',
|
|
6
|
+
'meta[name="article:published_time"]',
|
|
7
|
+
'meta[itemprop="datePublished"]',
|
|
8
|
+
'meta[name="date"]',
|
|
9
|
+
'meta[name="dc.date"]',
|
|
10
|
+
'meta[name="DC.date.issued"]'
|
|
11
|
+
];
|
|
12
|
+
async function extractNews(html, url) {
|
|
13
|
+
const base = readabilityExtract(html, url);
|
|
14
|
+
if (!base) return null;
|
|
15
|
+
if (!base.metadata.date) {
|
|
16
|
+
const date = findPublishedDate(html);
|
|
17
|
+
if (date) {
|
|
18
|
+
return { ...base, metadata: { ...base.metadata, date } };
|
|
19
|
+
}
|
|
20
|
+
}
|
|
21
|
+
return base;
|
|
22
|
+
}
|
|
23
|
+
function findPublishedDate(html) {
|
|
24
|
+
if (!html) return void 0;
|
|
25
|
+
let document;
|
|
26
|
+
try {
|
|
27
|
+
({ document } = parseHTML(html));
|
|
28
|
+
} catch {
|
|
29
|
+
return void 0;
|
|
30
|
+
}
|
|
31
|
+
for (const selector of META_DATE_SELECTORS) {
|
|
32
|
+
const el = document.querySelector(selector);
|
|
33
|
+
const content = el?.getAttribute("content")?.trim();
|
|
34
|
+
if (content && isValidDate(content)) return content;
|
|
35
|
+
}
|
|
36
|
+
const article = document.querySelector("article");
|
|
37
|
+
const root = article ?? document;
|
|
38
|
+
const timeEl = root.querySelector("time[datetime]");
|
|
39
|
+
const datetime = timeEl?.getAttribute("datetime")?.trim();
|
|
40
|
+
if (datetime && isValidDate(datetime)) return datetime;
|
|
41
|
+
try {
|
|
42
|
+
const blocks = extractJsonLd(html);
|
|
43
|
+
for (const block of blocks) {
|
|
44
|
+
const published = block["datePublished"];
|
|
45
|
+
if (typeof published === "string" && isValidDate(published)) {
|
|
46
|
+
return published;
|
|
47
|
+
}
|
|
48
|
+
}
|
|
49
|
+
} catch {
|
|
50
|
+
}
|
|
51
|
+
return void 0;
|
|
52
|
+
}
|
|
53
|
+
function isValidDate(value) {
|
|
54
|
+
if (!value) return false;
|
|
55
|
+
const parsed = Date.parse(value);
|
|
56
|
+
return !Number.isNaN(parsed);
|
|
57
|
+
}
|
|
58
|
+
export {
|
|
59
|
+
extractNews
|
|
60
|
+
};
|
|
61
|
+
//# sourceMappingURL=news.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../../src/extraction/v1/news.ts"],"sourcesContent":["import { parseHTML } from 'linkedom';\nimport { readabilityExtract } from '../readability.js';\nimport { extractJsonLd } from '../jsonld.js';\nimport type { ExtractionResult } from '../../types.js';\n\nconst META_DATE_SELECTORS = [\n 'meta[property=\"article:published_time\"]',\n 'meta[name=\"article:published_time\"]',\n 'meta[itemprop=\"datePublished\"]',\n 'meta[name=\"date\"]',\n 'meta[name=\"dc.date\"]',\n 'meta[name=\"DC.date.issued\"]',\n];\n\nexport async function extractNews(html: string, url: string): Promise<ExtractionResult | null> {\n const base = readabilityExtract(html, url);\n if (!base) return null;\n\n if (!base.metadata.date) {\n const date = findPublishedDate(html);\n if (date) {\n return { ...base, metadata: { ...base.metadata, date } };\n }\n }\n\n return base;\n}\n\nfunction findPublishedDate(html: string): string | undefined {\n if (!html) return undefined;\n\n let document: Document;\n try {\n ({ document } = parseHTML(html));\n } catch {\n return undefined;\n }\n\n for (const selector of META_DATE_SELECTORS) {\n const el = document.querySelector(selector);\n const content = el?.getAttribute('content')?.trim();\n if (content && isValidDate(content)) return content;\n }\n\n const article = document.querySelector('article');\n const root: ParentNode = article ?? document;\n const timeEl = root.querySelector('time[datetime]');\n const datetime = timeEl?.getAttribute('datetime')?.trim();\n if (datetime && isValidDate(datetime)) return datetime;\n\n try {\n const blocks = extractJsonLd(html);\n for (const block of blocks) {\n const published = block['datePublished'];\n if (typeof published === 'string' && isValidDate(published)) {\n return published;\n }\n }\n } catch {\n // jsonld parse failures already swallowed inside extractJsonLd\n }\n\n return undefined;\n}\n\nfunction isValidDate(value: string): boolean {\n if (!value) return false;\n const parsed = Date.parse(value);\n return !Number.isNaN(parsed);\n}\n"],"mappings":"AAAA,SAAS,iBAAiB;AAC1B,SAAS,0BAA0B;AACnC,SAAS,qBAAqB;AAG9B,MAAM,sBAAsB;AAAA,EAC1B;AAAA,EACA;AAAA,EACA;AAAA,EACA;AAAA,EACA;AAAA,EACA;AACF;AAEA,eAAsB,YAAY,MAAc,KAA+C;AAC7F,QAAM,OAAO,mBAAmB,MAAM,GAAG;AACzC,MAAI,CAAC,KAAM,QAAO;AAElB,MAAI,CAAC,KAAK,SAAS,MAAM;AACvB,UAAM,OAAO,kBAAkB,IAAI;AACnC,QAAI,MAAM;AACR,aAAO,EAAE,GAAG,MAAM,UAAU,EAAE,GAAG,KAAK,UAAU,KAAK,EAAE;AAAA,IACzD;AAAA,EACF;AAEA,SAAO;AACT;AAEA,SAAS,kBAAkB,MAAkC;AAC3D,MAAI,CAAC,KAAM,QAAO;AAElB,MAAI;AACJ,MAAI;AACF,KAAC,EAAE,SAAS,IAAI,UAAU,IAAI;AAAA,EAChC,QAAQ;AACN,WAAO;AAAA,EACT;AAEA,aAAW,YAAY,qBAAqB;AAC1C,UAAM,KAAK,SAAS,cAAc,QAAQ;AAC1C,UAAM,UAAU,IAAI,aAAa,SAAS,GAAG,KAAK;AAClD,QAAI,WAAW,YAAY,OAAO,EAAG,QAAO;AAAA,EAC9C;AAEA,QAAM,UAAU,SAAS,cAAc,SAAS;AAChD,QAAM,OAAmB,WAAW;AACpC,QAAM,SAAS,KAAK,cAAc,gBAAgB;AAClD,QAAM,WAAW,QAAQ,aAAa,UAAU,GAAG,KAAK;AACxD,MAAI,YAAY,YAAY,QAAQ,EAAG,QAAO;AAE9C,MAAI;AACF,UAAM,SAAS,cAAc,IAAI;AACjC,eAAW,SAAS,QAAQ;AAC1B,YAAM,YAAY,MAAM,eAAe;AACvC,UAAI,OAAO,cAAc,YAAY,YAAY,SAAS,GAAG;AAC3D,eAAO;AAAA,MACT;AAAA,IACF;AAAA,EACF,QAAQ;AAAA,EAER;AAEA,SAAO;AACT;AAEA,SAAS,YAAY,OAAwB;AAC3C,MAAI,CAAC,MAAO,QAAO;AACnB,QAAM,SAAS,KAAK,MAAM,KAAK;AAC/B,SAAO,CAAC,OAAO,MAAM,MAAM;AAC7B;","names":[]}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"product.d.ts","sourceRoot":"","sources":["../../../src/extraction/v1/product.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,gBAAgB,EAAE,MAAM,gBAAgB,CAAC;AAIvD,wBAAsB,cAAc,CAAC,IAAI,EAAE,MAAM,EAAE,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,gBAAgB,GAAG,IAAI,CAAC,CAOjG"}
|
|
@@ -0,0 +1,166 @@
|
|
|
1
|
+
import { parseHTML } from "linkedom";
|
|
2
|
+
import { extractJsonLd } from "../jsonld.js";
|
|
3
|
+
const MIN_CONTENT_THRESHOLD = 100;
|
|
4
|
+
async function extractProduct(html, _url) {
|
|
5
|
+
if (!html) return null;
|
|
6
|
+
const fromJsonLd = tryJsonLd(html);
|
|
7
|
+
if (fromJsonLd) return fromJsonLd;
|
|
8
|
+
return tryOpenGraph(html);
|
|
9
|
+
}
|
|
10
|
+
function tryJsonLd(html) {
|
|
11
|
+
let blocks;
|
|
12
|
+
try {
|
|
13
|
+
blocks = extractJsonLd(html);
|
|
14
|
+
} catch {
|
|
15
|
+
return null;
|
|
16
|
+
}
|
|
17
|
+
const product = blocks.find((block) => typeIncludes(block["@type"], "product"));
|
|
18
|
+
if (!product) return null;
|
|
19
|
+
const name = stringField(product["name"]);
|
|
20
|
+
if (!name) return null;
|
|
21
|
+
const lines = [`# ${name}`];
|
|
22
|
+
const description = stringField(product["description"]);
|
|
23
|
+
if (description) lines.push("", description);
|
|
24
|
+
const detailLines = [];
|
|
25
|
+
const brand = readBrand(product["brand"]);
|
|
26
|
+
if (brand) detailLines.push(`**Brand:** ${brand}`);
|
|
27
|
+
const offer = pickOffer(product["offers"]);
|
|
28
|
+
const price = offer ? stringField(offer["price"]) : void 0;
|
|
29
|
+
const currency = offer ? stringField(offer["priceCurrency"]) : void 0;
|
|
30
|
+
if (price) {
|
|
31
|
+
detailLines.push(currency ? `**Price:** ${currency} ${price}` : `**Price:** ${price}`);
|
|
32
|
+
}
|
|
33
|
+
const rating = readRating(product["aggregateRating"]);
|
|
34
|
+
if (rating) detailLines.push(rating);
|
|
35
|
+
const sku = stringField(product["sku"]);
|
|
36
|
+
if (sku) detailLines.push(`**SKU:** ${sku}`);
|
|
37
|
+
if (detailLines.length > 0) {
|
|
38
|
+
lines.push("", ...detailLines);
|
|
39
|
+
}
|
|
40
|
+
const markdown = lines.join("\n").trim();
|
|
41
|
+
if (markdown.length < MIN_CONTENT_THRESHOLD) return null;
|
|
42
|
+
const image = firstImage(product["image"]);
|
|
43
|
+
return {
|
|
44
|
+
title: name,
|
|
45
|
+
markdown,
|
|
46
|
+
metadata: {
|
|
47
|
+
...description ? { description } : {},
|
|
48
|
+
...image ? { og_image: image } : {}
|
|
49
|
+
},
|
|
50
|
+
links: [],
|
|
51
|
+
images: [],
|
|
52
|
+
extractor: "site-specific"
|
|
53
|
+
};
|
|
54
|
+
}
|
|
55
|
+
function tryOpenGraph(html) {
|
|
56
|
+
let document;
|
|
57
|
+
try {
|
|
58
|
+
({ document } = parseHTML(html));
|
|
59
|
+
} catch {
|
|
60
|
+
return null;
|
|
61
|
+
}
|
|
62
|
+
const ogType = metaContent(document, 'meta[property="og:type"]')?.toLowerCase();
|
|
63
|
+
if (ogType !== "product" && ogType !== "og:product") return null;
|
|
64
|
+
const title = metaContent(document, 'meta[property="og:title"]');
|
|
65
|
+
if (!title) return null;
|
|
66
|
+
const description = metaContent(document, 'meta[property="og:description"]');
|
|
67
|
+
const price = metaContent(document, 'meta[property="product:price:amount"]');
|
|
68
|
+
const currency = metaContent(document, 'meta[property="product:price:currency"]');
|
|
69
|
+
const image = metaContent(document, 'meta[property="og:image"]');
|
|
70
|
+
const lines = [`# ${title}`];
|
|
71
|
+
if (description) lines.push("", description);
|
|
72
|
+
if (price) {
|
|
73
|
+
lines.push("", currency ? `**Price:** ${currency} ${price}` : `**Price:** ${price}`);
|
|
74
|
+
}
|
|
75
|
+
const markdown = lines.join("\n").trim();
|
|
76
|
+
if (markdown.length < MIN_CONTENT_THRESHOLD) return null;
|
|
77
|
+
return {
|
|
78
|
+
title,
|
|
79
|
+
markdown,
|
|
80
|
+
metadata: {
|
|
81
|
+
...description ? { description } : {},
|
|
82
|
+
...image ? { og_image: image } : {}
|
|
83
|
+
},
|
|
84
|
+
links: [],
|
|
85
|
+
images: [],
|
|
86
|
+
extractor: "site-specific"
|
|
87
|
+
};
|
|
88
|
+
}
|
|
89
|
+
function metaContent(document, selector) {
|
|
90
|
+
const el = document.querySelector(selector);
|
|
91
|
+
const content = el?.getAttribute("content")?.trim();
|
|
92
|
+
return content && content.length > 0 ? content : void 0;
|
|
93
|
+
}
|
|
94
|
+
function typeIncludes(raw, want) {
|
|
95
|
+
const target = want.toLowerCase();
|
|
96
|
+
if (typeof raw === "string") return normalizeType(raw) === target;
|
|
97
|
+
if (Array.isArray(raw)) {
|
|
98
|
+
return raw.some((entry) => typeof entry === "string" && normalizeType(entry) === target);
|
|
99
|
+
}
|
|
100
|
+
return false;
|
|
101
|
+
}
|
|
102
|
+
function normalizeType(raw) {
|
|
103
|
+
const tail = raw.split(/[/#:]/).pop() ?? raw;
|
|
104
|
+
return tail.toLowerCase();
|
|
105
|
+
}
|
|
106
|
+
function stringField(value) {
|
|
107
|
+
if (typeof value === "string") {
|
|
108
|
+
const trimmed = value.trim();
|
|
109
|
+
return trimmed.length > 0 ? trimmed : void 0;
|
|
110
|
+
}
|
|
111
|
+
if (typeof value === "number" && Number.isFinite(value)) {
|
|
112
|
+
return String(value);
|
|
113
|
+
}
|
|
114
|
+
return void 0;
|
|
115
|
+
}
|
|
116
|
+
function readBrand(value) {
|
|
117
|
+
if (typeof value === "string") return stringField(value);
|
|
118
|
+
if (Array.isArray(value)) {
|
|
119
|
+
for (const entry of value) {
|
|
120
|
+
const name = readBrand(entry);
|
|
121
|
+
if (name) return name;
|
|
122
|
+
}
|
|
123
|
+
return void 0;
|
|
124
|
+
}
|
|
125
|
+
if (value && typeof value === "object") {
|
|
126
|
+
const name = value["name"];
|
|
127
|
+
return stringField(name);
|
|
128
|
+
}
|
|
129
|
+
return void 0;
|
|
130
|
+
}
|
|
131
|
+
function pickOffer(value) {
|
|
132
|
+
if (Array.isArray(value)) {
|
|
133
|
+
const first = value.find((entry) => entry && typeof entry === "object");
|
|
134
|
+
return first;
|
|
135
|
+
}
|
|
136
|
+
if (value && typeof value === "object") return value;
|
|
137
|
+
return void 0;
|
|
138
|
+
}
|
|
139
|
+
function readRating(value) {
|
|
140
|
+
if (!value || typeof value !== "object") return void 0;
|
|
141
|
+
const obj = value;
|
|
142
|
+
const rating = stringField(obj["ratingValue"]);
|
|
143
|
+
const count = stringField(obj["reviewCount"]);
|
|
144
|
+
if (!rating) return void 0;
|
|
145
|
+
if (count) return `**Rating:** ${rating} (${count} reviews)`;
|
|
146
|
+
return `**Rating:** ${rating}`;
|
|
147
|
+
}
|
|
148
|
+
function firstImage(value) {
|
|
149
|
+
if (typeof value === "string") return stringField(value);
|
|
150
|
+
if (Array.isArray(value)) {
|
|
151
|
+
for (const entry of value) {
|
|
152
|
+
const img = firstImage(entry);
|
|
153
|
+
if (img) return img;
|
|
154
|
+
}
|
|
155
|
+
return void 0;
|
|
156
|
+
}
|
|
157
|
+
if (value && typeof value === "object") {
|
|
158
|
+
const url = value["url"];
|
|
159
|
+
return stringField(url);
|
|
160
|
+
}
|
|
161
|
+
return void 0;
|
|
162
|
+
}
|
|
163
|
+
export {
|
|
164
|
+
extractProduct
|
|
165
|
+
};
|
|
166
|
+
//# sourceMappingURL=product.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../../../src/extraction/v1/product.ts"],"sourcesContent":["import { parseHTML } from 'linkedom';\nimport { extractJsonLd } from '../jsonld.js';\nimport type { ExtractionResult } from '../../types.js';\n\nconst MIN_CONTENT_THRESHOLD = 100;\n\nexport async function extractProduct(html: string, _url: string): Promise<ExtractionResult | null> {\n if (!html) return null;\n\n const fromJsonLd = tryJsonLd(html);\n if (fromJsonLd) return fromJsonLd;\n\n return tryOpenGraph(html);\n}\n\nfunction tryJsonLd(html: string): ExtractionResult | null {\n let blocks: Record<string, unknown>[];\n try {\n blocks = extractJsonLd(html);\n } catch {\n return null;\n }\n\n const product = blocks.find((block) => typeIncludes(block['@type'], 'product'));\n if (!product) return null;\n\n const name = stringField(product['name']);\n if (!name) return null;\n\n const lines: string[] = [`# ${name}`];\n\n const description = stringField(product['description']);\n if (description) lines.push('', description);\n\n const detailLines: string[] = [];\n const brand = readBrand(product['brand']);\n if (brand) detailLines.push(`**Brand:** ${brand}`);\n\n const offer = pickOffer(product['offers']);\n const price = offer ? stringField(offer['price']) : undefined;\n const currency = offer ? stringField(offer['priceCurrency']) : undefined;\n if (price) {\n detailLines.push(currency ? `**Price:** ${currency} ${price}` : `**Price:** ${price}`);\n }\n\n const rating = readRating(product['aggregateRating']);\n if (rating) detailLines.push(rating);\n\n const sku = stringField(product['sku']);\n if (sku) detailLines.push(`**SKU:** ${sku}`);\n\n if (detailLines.length > 0) {\n lines.push('', ...detailLines);\n }\n\n const markdown = lines.join('\\n').trim();\n if (markdown.length < MIN_CONTENT_THRESHOLD) return null;\n\n const image = firstImage(product['image']);\n\n return {\n title: name,\n markdown,\n metadata: {\n ...(description ? { description } : {}),\n ...(image ? { og_image: image } : {}),\n },\n links: [],\n images: [],\n extractor: 'site-specific',\n };\n}\n\nfunction tryOpenGraph(html: string): ExtractionResult | null {\n let document: Document;\n try {\n ({ document } = parseHTML(html));\n } catch {\n return null;\n }\n\n const ogType = metaContent(document, 'meta[property=\"og:type\"]')?.toLowerCase();\n if (ogType !== 'product' && ogType !== 'og:product') return null;\n\n const title = metaContent(document, 'meta[property=\"og:title\"]');\n if (!title) return null;\n\n const description = metaContent(document, 'meta[property=\"og:description\"]');\n const price = metaContent(document, 'meta[property=\"product:price:amount\"]');\n const currency = metaContent(document, 'meta[property=\"product:price:currency\"]');\n const image = metaContent(document, 'meta[property=\"og:image\"]');\n\n const lines: string[] = [`# ${title}`];\n if (description) lines.push('', description);\n if (price) {\n lines.push('', currency ? `**Price:** ${currency} ${price}` : `**Price:** ${price}`);\n }\n\n const markdown = lines.join('\\n').trim();\n if (markdown.length < MIN_CONTENT_THRESHOLD) return null;\n\n return {\n title,\n markdown,\n metadata: {\n ...(description ? { description } : {}),\n ...(image ? { og_image: image } : {}),\n },\n links: [],\n images: [],\n extractor: 'site-specific',\n };\n}\n\nfunction metaContent(document: Document, selector: string): string | undefined {\n const el = document.querySelector(selector);\n const content = el?.getAttribute('content')?.trim();\n return content && content.length > 0 ? content : undefined;\n}\n\nfunction typeIncludes(raw: unknown, want: string): boolean {\n const target = want.toLowerCase();\n if (typeof raw === 'string') return normalizeType(raw) === target;\n if (Array.isArray(raw)) {\n return raw.some((entry) => typeof entry === 'string' && normalizeType(entry) === target);\n }\n return false;\n}\n\nfunction normalizeType(raw: string): string {\n const tail = raw.split(/[/#:]/).pop() ?? raw;\n return tail.toLowerCase();\n}\n\nfunction stringField(value: unknown): string | undefined {\n if (typeof value === 'string') {\n const trimmed = value.trim();\n return trimmed.length > 0 ? trimmed : undefined;\n }\n if (typeof value === 'number' && Number.isFinite(value)) {\n return String(value);\n }\n return undefined;\n}\n\nfunction readBrand(value: unknown): string | undefined {\n if (typeof value === 'string') return stringField(value);\n if (Array.isArray(value)) {\n for (const entry of value) {\n const name = readBrand(entry);\n if (name) return name;\n }\n return undefined;\n }\n if (value && typeof value === 'object') {\n const name = (value as Record<string, unknown>)['name'];\n return stringField(name);\n }\n return undefined;\n}\n\nfunction pickOffer(value: unknown): Record<string, unknown> | undefined {\n if (Array.isArray(value)) {\n const first = value.find((entry) => entry && typeof entry === 'object');\n return first as Record<string, unknown> | undefined;\n }\n if (value && typeof value === 'object') return value as Record<string, unknown>;\n return undefined;\n}\n\nfunction readRating(value: unknown): string | undefined {\n if (!value || typeof value !== 'object') return undefined;\n const obj = value as Record<string, unknown>;\n const rating = stringField(obj['ratingValue']);\n const count = stringField(obj['reviewCount']);\n if (!rating) return undefined;\n if (count) return `**Rating:** ${rating} (${count} reviews)`;\n return `**Rating:** ${rating}`;\n}\n\nfunction firstImage(value: unknown): string | undefined {\n if (typeof value === 'string') return stringField(value);\n if (Array.isArray(value)) {\n for (const entry of value) {\n const img = firstImage(entry);\n if (img) return img;\n }\n return undefined;\n }\n if (value && typeof value === 'object') {\n const url = (value as Record<string, unknown>)['url'];\n return stringField(url);\n }\n return undefined;\n}\n"],"mappings":"AAAA,SAAS,iBAAiB;AAC1B,SAAS,qBAAqB;AAG9B,MAAM,wBAAwB;AAE9B,eAAsB,eAAe,MAAc,MAAgD;AACjG,MAAI,CAAC,KAAM,QAAO;AAElB,QAAM,aAAa,UAAU,IAAI;AACjC,MAAI,WAAY,QAAO;AAEvB,SAAO,aAAa,IAAI;AAC1B;AAEA,SAAS,UAAU,MAAuC;AACxD,MAAI;AACJ,MAAI;AACF,aAAS,cAAc,IAAI;AAAA,EAC7B,QAAQ;AACN,WAAO;AAAA,EACT;AAEA,QAAM,UAAU,OAAO,KAAK,CAAC,UAAU,aAAa,MAAM,OAAO,GAAG,SAAS,CAAC;AAC9E,MAAI,CAAC,QAAS,QAAO;AAErB,QAAM,OAAO,YAAY,QAAQ,MAAM,CAAC;AACxC,MAAI,CAAC,KAAM,QAAO;AAElB,QAAM,QAAkB,CAAC,KAAK,IAAI,EAAE;AAEpC,QAAM,cAAc,YAAY,QAAQ,aAAa,CAAC;AACtD,MAAI,YAAa,OAAM,KAAK,IAAI,WAAW;AAE3C,QAAM,cAAwB,CAAC;AAC/B,QAAM,QAAQ,UAAU,QAAQ,OAAO,CAAC;AACxC,MAAI,MAAO,aAAY,KAAK,cAAc,KAAK,EAAE;AAEjD,QAAM,QAAQ,UAAU,QAAQ,QAAQ,CAAC;AACzC,QAAM,QAAQ,QAAQ,YAAY,MAAM,OAAO,CAAC,IAAI;AACpD,QAAM,WAAW,QAAQ,YAAY,MAAM,eAAe,CAAC,IAAI;AAC/D,MAAI,OAAO;AACT,gBAAY,KAAK,WAAW,cAAc,QAAQ,IAAI,KAAK,KAAK,cAAc,KAAK,EAAE;AAAA,EACvF;AAEA,QAAM,SAAS,WAAW,QAAQ,iBAAiB,CAAC;AACpD,MAAI,OAAQ,aAAY,KAAK,MAAM;AAEnC,QAAM,MAAM,YAAY,QAAQ,KAAK,CAAC;AACtC,MAAI,IAAK,aAAY,KAAK,YAAY,GAAG,EAAE;AAE3C,MAAI,YAAY,SAAS,GAAG;AAC1B,UAAM,KAAK,IAAI,GAAG,WAAW;AAAA,EAC/B;AAEA,QAAM,WAAW,MAAM,KAAK,IAAI,EAAE,KAAK;AACvC,MAAI,SAAS,SAAS,sBAAuB,QAAO;AAEpD,QAAM,QAAQ,WAAW,QAAQ,OAAO,CAAC;AAEzC,SAAO;AAAA,IACL,OAAO;AAAA,IACP;AAAA,IACA,UAAU;AAAA,MACR,GAAI,cAAc,EAAE,YAAY,IAAI,CAAC;AAAA,MACrC,GAAI,QAAQ,EAAE,UAAU,MAAM,IAAI,CAAC;AAAA,IACrC;AAAA,IACA,OAAO,CAAC;AAAA,IACR,QAAQ,CAAC;AAAA,IACT,WAAW;AAAA,EACb;AACF;AAEA,SAAS,aAAa,MAAuC;AAC3D,MAAI;AACJ,MAAI;AACF,KAAC,EAAE,SAAS,IAAI,UAAU,IAAI;AAAA,EAChC,QAAQ;AACN,WAAO;AAAA,EACT;AAEA,QAAM,SAAS,YAAY,UAAU,0BAA0B,GAAG,YAAY;AAC9E,MAAI,WAAW,aAAa,WAAW,aAAc,QAAO;AAE5D,QAAM,QAAQ,YAAY,UAAU,2BAA2B;AAC/D,MAAI,CAAC,MAAO,QAAO;AAEnB,QAAM,cAAc,YAAY,UAAU,iCAAiC;AAC3E,QAAM,QAAQ,YAAY,UAAU,uCAAuC;AAC3E,QAAM,WAAW,YAAY,UAAU,yCAAyC;AAChF,QAAM,QAAQ,YAAY,UAAU,2BAA2B;AAE/D,QAAM,QAAkB,CAAC,KAAK,KAAK,EAAE;AACrC,MAAI,YAAa,OAAM,KAAK,IAAI,WAAW;AAC3C,MAAI,OAAO;AACT,UAAM,KAAK,IAAI,WAAW,cAAc,QAAQ,IAAI,KAAK,KAAK,cAAc,KAAK,EAAE;AAAA,EACrF;AAEA,QAAM,WAAW,MAAM,KAAK,IAAI,EAAE,KAAK;AACvC,MAAI,SAAS,SAAS,sBAAuB,QAAO;AAEpD,SAAO;AAAA,IACL;AAAA,IACA;AAAA,IACA,UAAU;AAAA,MACR,GAAI,cAAc,EAAE,YAAY,IAAI,CAAC;AAAA,MACrC,GAAI,QAAQ,EAAE,UAAU,MAAM,IAAI,CAAC;AAAA,IACrC;AAAA,IACA,OAAO,CAAC;AAAA,IACR,QAAQ,CAAC;AAAA,IACT,WAAW;AAAA,EACb;AACF;AAEA,SAAS,YAAY,UAAoB,UAAsC;AAC7E,QAAM,KAAK,SAAS,cAAc,QAAQ;AAC1C,QAAM,UAAU,IAAI,aAAa,SAAS,GAAG,KAAK;AAClD,SAAO,WAAW,QAAQ,SAAS,IAAI,UAAU;AACnD;AAEA,SAAS,aAAa,KAAc,MAAuB;AACzD,QAAM,SAAS,KAAK,YAAY;AAChC,MAAI,OAAO,QAAQ,SAAU,QAAO,cAAc,GAAG,MAAM;AAC3D,MAAI,MAAM,QAAQ,GAAG,GAAG;AACtB,WAAO,IAAI,KAAK,CAAC,UAAU,OAAO,UAAU,YAAY,cAAc,KAAK,MAAM,MAAM;AAAA,EACzF;AACA,SAAO;AACT;AAEA,SAAS,cAAc,KAAqB;AAC1C,QAAM,OAAO,IAAI,MAAM,OAAO,EAAE,IAAI,KAAK;AACzC,SAAO,KAAK,YAAY;AAC1B;AAEA,SAAS,YAAY,OAAoC;AACvD,MAAI,OAAO,UAAU,UAAU;AAC7B,UAAM,UAAU,MAAM,KAAK;AAC3B,WAAO,QAAQ,SAAS,IAAI,UAAU;AAAA,EACxC;AACA,MAAI,OAAO,UAAU,YAAY,OAAO,SAAS,KAAK,GAAG;AACvD,WAAO,OAAO,KAAK;AAAA,EACrB;AACA,SAAO;AACT;AAEA,SAAS,UAAU,OAAoC;AACrD,MAAI,OAAO,UAAU,SAAU,QAAO,YAAY,KAAK;AACvD,MAAI,MAAM,QAAQ,KAAK,GAAG;AACxB,eAAW,SAAS,OAAO;AACzB,YAAM,OAAO,UAAU,KAAK;AAC5B,UAAI,KAAM,QAAO;AAAA,IACnB;AACA,WAAO;AAAA,EACT;AACA,MAAI,SAAS,OAAO,UAAU,UAAU;AACtC,UAAM,OAAQ,MAAkC,MAAM;AACtD,WAAO,YAAY,IAAI;AAAA,EACzB;AACA,SAAO;AACT;AAEA,SAAS,UAAU,OAAqD;AACtE,MAAI,MAAM,QAAQ,KAAK,GAAG;AACxB,UAAM,QAAQ,MAAM,KAAK,CAAC,UAAU,SAAS,OAAO,UAAU,QAAQ;AACtE,WAAO;AAAA,EACT;AACA,MAAI,SAAS,OAAO,UAAU,SAAU,QAAO;AAC/C,SAAO;AACT;AAEA,SAAS,WAAW,OAAoC;AACtD,MAAI,CAAC,SAAS,OAAO,UAAU,SAAU,QAAO;AAChD,QAAM,MAAM;AACZ,QAAM,SAAS,YAAY,IAAI,aAAa,CAAC;AAC7C,QAAM,QAAQ,YAAY,IAAI,aAAa,CAAC;AAC5C,MAAI,CAAC,OAAQ,QAAO;AACpB,MAAI,MAAO,QAAO,eAAe,MAAM,KAAK,KAAK;AACjD,SAAO,eAAe,MAAM;AAC9B;AAEA,SAAS,WAAW,OAAoC;AACtD,MAAI,OAAO,UAAU,SAAU,QAAO,YAAY,KAAK;AACvD,MAAI,MAAM,QAAQ,KAAK,GAAG;AACxB,eAAW,SAAS,OAAO;AACzB,YAAM,MAAM,WAAW,KAAK;AAC5B,UAAI,IAAK,QAAO;AAAA,IAClB;AACA,WAAO;AAAA,EACT;AACA,MAAI,SAAS,OAAO,UAAU,UAAU;AACtC,UAAM,MAAO,MAAkC,KAAK;AACpD,WAAO,YAAY,GAAG;AAAA,EACxB;AACA,SAAO;AACT;","names":[]}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"recipe.d.ts","sourceRoot":"","sources":["../../../src/extraction/v1/recipe.ts"],"names":[],"mappings":"AACA,OAAO,KAAK,EAAE,gBAAgB,EAAE,MAAM,gBAAgB,CAAC;AAIvD,wBAAsB,aAAa,CAAC,IAAI,EAAE,MAAM,EAAE,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,gBAAgB,GAAG,IAAI,CAAC,CAwEhG"}
|