webpeel 0.14.6 → 0.15.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/cli.js +2 -0
- package/dist/cli.js.map +1 -1
- package/dist/core/browser-fetch.d.ts.map +1 -1
- package/dist/core/browser-fetch.js +75 -8
- package/dist/core/browser-fetch.js.map +1 -1
- package/dist/core/content-pruner.d.ts.map +1 -1
- package/dist/core/content-pruner.js +32 -0
- package/dist/core/content-pruner.js.map +1 -1
- package/dist/core/http-fetch.d.ts +2 -0
- package/dist/core/http-fetch.d.ts.map +1 -1
- package/dist/core/http-fetch.js +12 -0
- package/dist/core/http-fetch.js.map +1 -1
- package/dist/core/json-ld.d.ts +16 -0
- package/dist/core/json-ld.d.ts.map +1 -0
- package/dist/core/json-ld.js +618 -0
- package/dist/core/json-ld.js.map +1 -0
- package/dist/core/markdown.d.ts.map +1 -1
- package/dist/core/markdown.js +24 -0
- package/dist/core/markdown.js.map +1 -1
- package/dist/core/metadata.d.ts.map +1 -1
- package/dist/core/metadata.js +110 -0
- package/dist/core/metadata.js.map +1 -1
- package/dist/core/pipeline.d.ts +8 -0
- package/dist/core/pipeline.d.ts.map +1 -1
- package/dist/core/pipeline.js +104 -0
- package/dist/core/pipeline.js.map +1 -1
- package/dist/core/quick-answer.d.ts.map +1 -1
- package/dist/core/quick-answer.js +65 -4
- package/dist/core/quick-answer.js.map +1 -1
- package/dist/core/strategies.d.ts.map +1 -1
- package/dist/core/strategies.js +27 -0
- package/dist/core/strategies.js.map +1 -1
- package/dist/mcp/server.js +20 -1
- package/dist/mcp/server.js.map +1 -1
- package/dist/server/routes/fetch.d.ts.map +1 -1
- package/dist/server/routes/fetch.js +16 -2
- package/dist/server/routes/fetch.js.map +1 -1
- package/dist/server/routes/mcp.d.ts.map +1 -1
- package/dist/server/routes/mcp.js +32 -1
- package/dist/server/routes/mcp.js.map +1 -1
- package/dist/types.d.ts +22 -1
- package/dist/types.d.ts.map +1 -1
- package/dist/types.js.map +1 -1
- package/package.json +1 -1
package/dist/cli.js
CHANGED
|
@@ -207,6 +207,7 @@ program
|
|
|
207
207
|
.option('--images', 'Output image URLs from the page')
|
|
208
208
|
.option('--meta', 'Output only the page metadata (title, description, author, etc.)')
|
|
209
209
|
.option('--raw', 'Return full page without smart content extraction')
|
|
210
|
+
.option('--lite', 'Lite mode — minimal processing, maximum speed (skip pruning, budget, metadata)')
|
|
210
211
|
.option('--action <actions...>', 'Page actions before scraping (e.g., "click:.btn" "wait:2000" "scroll:bottom")')
|
|
211
212
|
.option('--extract <json>', 'Extract structured data using CSS selectors (JSON object of field:selector pairs)')
|
|
212
213
|
.option('--llm-extract [instruction]', 'Extract structured data using LLM (optional instruction, e.g. "extract hotel names and prices")')
|
|
@@ -584,6 +585,7 @@ program
|
|
|
584
585
|
headers,
|
|
585
586
|
cookies: options.cookie,
|
|
586
587
|
raw: options.raw || false,
|
|
588
|
+
lite: options.lite || false,
|
|
587
589
|
actions,
|
|
588
590
|
maxTokens: options.maxTokens,
|
|
589
591
|
// Note: budget is applied AFTER caching (so cache stores full content)
|