imperium-crawl 2.3.1 → 2.5.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +146 -11
- package/dist/cli-explore.d.ts +30 -0
- package/dist/cli-explore.d.ts.map +1 -0
- package/dist/cli-explore.js +427 -0
- package/dist/cli-explore.js.map +1 -0
- package/dist/cli-recorder.d.ts +44 -0
- package/dist/cli-recorder.d.ts.map +1 -0
- package/dist/cli-recorder.js +67 -0
- package/dist/cli-recorder.js.map +1 -0
- package/dist/cli.d.ts.map +1 -1
- package/dist/cli.js +51 -3
- package/dist/cli.js.map +1 -1
- package/dist/config.d.ts.map +1 -1
- package/dist/config.js +3 -0
- package/dist/config.js.map +1 -1
- package/dist/constants.d.ts +1 -1
- package/dist/constants.d.ts.map +1 -1
- package/dist/constants.js +31 -1
- package/dist/constants.js.map +1 -1
- package/dist/flows/engine.d.ts +7 -0
- package/dist/flows/engine.d.ts.map +1 -0
- package/dist/flows/engine.js +183 -0
- package/dist/flows/engine.js.map +1 -0
- package/dist/flows/index.d.ts +6 -0
- package/dist/flows/index.d.ts.map +1 -0
- package/dist/flows/index.js +6 -0
- package/dist/flows/index.js.map +1 -0
- package/dist/flows/server.d.ts +11 -0
- package/dist/flows/server.d.ts.map +1 -0
- package/dist/flows/server.js +81 -0
- package/dist/flows/server.js.map +1 -0
- package/dist/flows/smart-target.d.ts +9 -0
- package/dist/flows/smart-target.d.ts.map +1 -0
- package/dist/flows/smart-target.js +84 -0
- package/dist/flows/smart-target.js.map +1 -0
- package/dist/flows/storage.d.ts +26 -0
- package/dist/flows/storage.d.ts.map +1 -0
- package/dist/flows/storage.js +118 -0
- package/dist/flows/storage.js.map +1 -0
- package/dist/flows/templates.d.ts +4 -0
- package/dist/flows/templates.d.ts.map +1 -0
- package/dist/flows/templates.js +35 -0
- package/dist/flows/templates.js.map +1 -0
- package/dist/flows/types.d.ts +3356 -0
- package/dist/flows/types.d.ts.map +1 -0
- package/dist/flows/types.js +133 -0
- package/dist/flows/types.js.map +1 -0
- package/dist/knowledge/index.d.ts +1 -0
- package/dist/knowledge/index.d.ts.map +1 -1
- package/dist/knowledge/index.js +1 -0
- package/dist/knowledge/index.js.map +1 -1
- package/dist/knowledge/record-browser.d.ts +17 -0
- package/dist/knowledge/record-browser.d.ts.map +1 -0
- package/dist/knowledge/record-browser.js +29 -0
- package/dist/knowledge/record-browser.js.map +1 -0
- package/dist/knowledge/store.d.ts +19 -0
- package/dist/knowledge/store.d.ts.map +1 -1
- package/dist/knowledge/store.js +63 -4
- package/dist/knowledge/store.js.map +1 -1
- package/dist/llm/retry.d.ts +4 -2
- package/dist/llm/retry.d.ts.map +1 -1
- package/dist/llm/retry.js +15 -4
- package/dist/llm/retry.js.map +1 -1
- package/dist/sessions/browser-connect.d.ts +30 -0
- package/dist/sessions/browser-connect.d.ts.map +1 -0
- package/dist/sessions/browser-connect.js +68 -0
- package/dist/sessions/browser-connect.js.map +1 -0
- package/dist/sessions/browser-state.d.ts +35 -0
- package/dist/sessions/browser-state.d.ts.map +1 -0
- package/dist/sessions/browser-state.js +74 -0
- package/dist/sessions/browser-state.js.map +1 -0
- package/dist/sessions/index.d.ts +1 -1
- package/dist/sessions/index.d.ts.map +1 -1
- package/dist/sessions/index.js +1 -1
- package/dist/sessions/index.js.map +1 -1
- package/dist/sessions/inject-cookies.d.ts +20 -0
- package/dist/sessions/inject-cookies.d.ts.map +1 -0
- package/dist/sessions/inject-cookies.js +57 -0
- package/dist/sessions/inject-cookies.js.map +1 -0
- package/dist/sessions/manager.d.ts +31 -1
- package/dist/sessions/manager.d.ts.map +1 -1
- package/dist/sessions/manager.js +97 -6
- package/dist/sessions/manager.js.map +1 -1
- package/dist/sessions/types.d.ts +2 -0
- package/dist/sessions/types.d.ts.map +1 -1
- package/dist/skills/chain.d.ts +61 -0
- package/dist/skills/chain.d.ts.map +1 -0
- package/dist/skills/chain.js +182 -0
- package/dist/skills/chain.js.map +1 -0
- package/dist/skills/conditions.d.ts +14 -0
- package/dist/skills/conditions.d.ts.map +1 -0
- package/dist/skills/conditions.js +208 -0
- package/dist/skills/conditions.js.map +1 -0
- package/dist/skills/manager.d.ts +47 -2
- package/dist/skills/manager.d.ts.map +1 -1
- package/dist/skills/manager.js.map +1 -1
- package/dist/skills/parameters.d.ts +49 -0
- package/dist/skills/parameters.d.ts.map +1 -0
- package/dist/skills/parameters.js +157 -0
- package/dist/skills/parameters.js.map +1 -0
- package/dist/snapshot/store.d.ts +8 -0
- package/dist/snapshot/store.d.ts.map +1 -1
- package/dist/snapshot/store.js +48 -0
- package/dist/snapshot/store.js.map +1 -1
- package/dist/stealth/antibot-detector.d.ts +1 -1
- package/dist/stealth/antibot-detector.d.ts.map +1 -1
- package/dist/stealth/antibot-detector.js +56 -0
- package/dist/stealth/antibot-detector.js.map +1 -1
- package/dist/stealth/browser-image-extract.d.ts +43 -0
- package/dist/stealth/browser-image-extract.d.ts.map +1 -0
- package/dist/stealth/browser-image-extract.js +268 -0
- package/dist/stealth/browser-image-extract.js.map +1 -0
- package/dist/stealth/browser.d.ts +5 -0
- package/dist/stealth/browser.d.ts.map +1 -1
- package/dist/stealth/browser.js +82 -1
- package/dist/stealth/browser.js.map +1 -1
- package/dist/stealth/chrome-profile.d.ts +1 -0
- package/dist/stealth/chrome-profile.d.ts.map +1 -1
- package/dist/stealth/chrome-profile.js +28 -5
- package/dist/stealth/chrome-profile.js.map +1 -1
- package/dist/stealth/detector.d.ts +10 -1
- package/dist/stealth/detector.d.ts.map +1 -1
- package/dist/stealth/detector.js +117 -25
- package/dist/stealth/detector.js.map +1 -1
- package/dist/stealth/headers.d.ts +1 -1
- package/dist/stealth/headers.d.ts.map +1 -1
- package/dist/stealth/headers.js +94 -2
- package/dist/stealth/headers.js.map +1 -1
- package/dist/stealth/index.d.ts +5 -0
- package/dist/stealth/index.d.ts.map +1 -1
- package/dist/stealth/index.js +257 -27
- package/dist/stealth/index.js.map +1 -1
- package/dist/stealth/proxy.d.ts +40 -1
- package/dist/stealth/proxy.d.ts.map +1 -1
- package/dist/stealth/proxy.js +90 -6
- package/dist/stealth/proxy.js.map +1 -1
- package/dist/tools/action-executor.d.ts +66 -0
- package/dist/tools/action-executor.d.ts.map +1 -0
- package/dist/tools/action-executor.js +403 -0
- package/dist/tools/action-executor.js.map +1 -0
- package/dist/tools/batch-download.d.ts +33 -0
- package/dist/tools/batch-download.d.ts.map +1 -0
- package/dist/tools/batch-download.js +208 -0
- package/dist/tools/batch-download.js.map +1 -0
- package/dist/tools/batch-scrape.d.ts +2 -2
- package/dist/tools/browser.d.ts +100 -0
- package/dist/tools/browser.d.ts.map +1 -0
- package/dist/tools/browser.js +448 -0
- package/dist/tools/browser.js.map +1 -0
- package/dist/tools/crawl.d.ts +2 -2
- package/dist/tools/create-skill.d.ts +2 -2
- package/dist/tools/discover-apis.d.ts +1 -1
- package/dist/tools/discover-apis.d.ts.map +1 -1
- package/dist/tools/discover-apis.js +3 -0
- package/dist/tools/discover-apis.js.map +1 -1
- package/dist/tools/download.d.ts +39 -6
- package/dist/tools/download.d.ts.map +1 -1
- package/dist/tools/download.js +248 -44
- package/dist/tools/download.js.map +1 -1
- package/dist/tools/extract.d.ts +1 -1
- package/dist/tools/image-search.d.ts +1 -1
- package/dist/tools/index.d.ts.map +1 -1
- package/dist/tools/index.js +26 -0
- package/dist/tools/index.js.map +1 -1
- package/dist/tools/inspect-flow.d.ts +24 -0
- package/dist/tools/inspect-flow.d.ts.map +1 -0
- package/dist/tools/inspect-flow.js +23 -0
- package/dist/tools/inspect-flow.js.map +1 -0
- package/dist/tools/instagram.d.ts +2 -2
- package/dist/tools/interact.d.ts +91 -50
- package/dist/tools/interact.d.ts.map +1 -1
- package/dist/tools/interact.js +80 -299
- package/dist/tools/interact.js.map +1 -1
- package/dist/tools/knowledge.d.ts +24 -0
- package/dist/tools/knowledge.d.ts.map +1 -0
- package/dist/tools/knowledge.js +99 -0
- package/dist/tools/knowledge.js.map +1 -0
- package/dist/tools/list-flows.d.ts +21 -0
- package/dist/tools/list-flows.d.ts.map +1 -0
- package/dist/tools/list-flows.js +18 -0
- package/dist/tools/list-flows.js.map +1 -0
- package/dist/tools/list-skills.js +1 -1
- package/dist/tools/list-skills.js.map +1 -1
- package/dist/tools/manifest.d.ts.map +1 -1
- package/dist/tools/manifest.js +48 -0
- package/dist/tools/manifest.js.map +1 -1
- package/dist/tools/monitor-websocket.d.ts +1 -1
- package/dist/tools/monitor.d.ts +46 -0
- package/dist/tools/monitor.d.ts.map +1 -0
- package/dist/tools/monitor.js +213 -0
- package/dist/tools/monitor.js.map +1 -0
- package/dist/tools/news-search.d.ts +1 -1
- package/dist/tools/pdf-extract.d.ts +38 -0
- package/dist/tools/pdf-extract.d.ts.map +1 -0
- package/dist/tools/pdf-extract.js +244 -0
- package/dist/tools/pdf-extract.js.map +1 -0
- package/dist/tools/query-api.d.ts +6 -6
- package/dist/tools/readability.d.ts +2 -2
- package/dist/tools/record-flow.d.ts +39 -0
- package/dist/tools/record-flow.d.ts.map +1 -0
- package/dist/tools/record-flow.js +406 -0
- package/dist/tools/record-flow.js.map +1 -0
- package/dist/tools/reddit.d.ts +4 -4
- package/dist/tools/run-flow.d.ts +54 -0
- package/dist/tools/run-flow.d.ts.map +1 -0
- package/dist/tools/run-flow.js +47 -0
- package/dist/tools/run-flow.js.map +1 -0
- package/dist/tools/run-skill.d.ts +14 -4
- package/dist/tools/run-skill.d.ts.map +1 -1
- package/dist/tools/run-skill.js +74 -0
- package/dist/tools/run-skill.js.map +1 -1
- package/dist/tools/scrape.d.ts +9 -6
- package/dist/tools/scrape.d.ts.map +1 -1
- package/dist/tools/scrape.js +19 -1
- package/dist/tools/scrape.js.map +1 -1
- package/dist/tools/screenshot.d.ts.map +1 -1
- package/dist/tools/screenshot.js +6 -0
- package/dist/tools/screenshot.js.map +1 -1
- package/dist/tools/search.d.ts +1 -1
- package/dist/tools/serve-flow.d.ts +36 -0
- package/dist/tools/serve-flow.d.ts.map +1 -0
- package/dist/tools/serve-flow.js +42 -0
- package/dist/tools/serve-flow.js.map +1 -0
- package/dist/tools/snapshot.d.ts +5 -5
- package/dist/tools/snapshot.d.ts.map +1 -1
- package/dist/tools/snapshot.js +3 -0
- package/dist/tools/snapshot.js.map +1 -1
- package/dist/tools/validate-flow.d.ts +24 -0
- package/dist/tools/validate-flow.d.ts.map +1 -0
- package/dist/tools/validate-flow.js +23 -0
- package/dist/tools/validate-flow.js.map +1 -0
- package/dist/tools/video-search.d.ts +1 -1
- package/dist/tools/watch.d.ts +68 -0
- package/dist/tools/watch.d.ts.map +1 -0
- package/dist/tools/watch.js +224 -0
- package/dist/tools/watch.js.map +1 -0
- package/dist/tools/youtube.d.ts +2 -2
- package/dist/utils/fetcher.d.ts +13 -4
- package/dist/utils/fetcher.d.ts.map +1 -1
- package/dist/utils/fetcher.js +153 -23
- package/dist/utils/fetcher.js.map +1 -1
- package/package.json +19 -5
|
@@ -0,0 +1,244 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* pdf-extract — extract text, pages, tables, and metadata from a PDF.
|
|
3
|
+
*
|
|
4
|
+
* v2.5.0: native strategy only (pdfjs-dist text layer).
|
|
5
|
+
* OCR + Claude Vision fallbacks are deferred to v2.6.0.
|
|
6
|
+
*
|
|
7
|
+
* Accepts a local path or a remote URL (auto-download to tmp).
|
|
8
|
+
*/
|
|
9
|
+
import { z } from "zod";
|
|
10
|
+
import { readFile, writeFile, mkdtemp } from "node:fs/promises";
|
|
11
|
+
import { existsSync } from "node:fs";
|
|
12
|
+
import { tmpdir } from "node:os";
|
|
13
|
+
import { join, resolve as resolvePath } from "node:path";
|
|
14
|
+
import { toolResult, errorResult } from "../utils/tool-response.js";
|
|
15
|
+
import { debugLog } from "../utils/debug.js";
|
|
16
|
+
/** Tool name constant exported by this module. */
export const name = "pdf_extract";

/** One-line human-readable summary of the tool. */
export const description = "Extract text, pages, tables, and metadata from a local or remote PDF. Native text-layer strategy (pdfjs-dist). OCR/Vision fallbacks deferred to v2.6.0.";

// Individual field validators, declared one per line so each default and
// description can be read at a glance.
const inputField = z.string().min(1).describe("Local PDF path or remote URL (http/https). URL inputs are downloaded to a temp file.");
const outputField = z.string().default("./extracted.json").describe("Output JSON path");
const preserveLayoutField = z.boolean().default(true).describe("Preserve line breaks and approximate layout when assembling text");
const extractTablesField = z.boolean().default(true).describe("Run basic regex-based table extraction");
const maxPagesField = z.number().min(0).default(0).describe("Limit pages to extract (0 = all)");

/**
 * Input schema for the tool.
 *
 * - `input`: non-empty string, local path or http/https URL.
 * - `output`: JSON output path, defaults to "./extracted.json".
 * - `preserve_layout`: defaults to true.
 * - `extract_tables`: defaults to true.
 * - `max_pages`: number >= 0, defaults to 0 (meaning "all pages").
 */
export const schema = z.object({
    input: inputField,
    output: outputField,
    preserve_layout: preserveLayoutField,
    extract_tables: extractTablesField,
    max_pages: maxPagesField,
});
|
|
41
|
+
/**
 * Download a remote PDF into a freshly created temporary directory.
 *
 * The response body is fully buffered in memory before anything is written.
 *
 * @param {string} url - Address handed to `fetch` as-is.
 * @returns {Promise<string>} Path of the written file: `input.pdf` inside a
 *   new `imperium-pdf-*` directory under the OS temp dir.
 * @throws {Error} If the response is not OK (message includes status and URL);
 *   fetch and file-system errors propagate unchanged.
 */
async function downloadToTmp(url) {
    const response = await fetch(url);
    if (!response.ok) {
        throw new Error(`Failed to download PDF (${response.status} ${response.statusText}): ${url}`);
    }
    // Read the body first so no temp directory is created for a failed transfer.
    const bytes = Buffer.from(await response.arrayBuffer());
    const scratchDir = await mkdtemp(join(tmpdir(), "imperium-pdf-"));
    const target = join(scratchDir, "input.pdf");
    await writeFile(target, bytes);
    return target;
}
|
|
51
|
+
/**
|
|
52
|
+
* Assemble text from pdfjs text items. When preserveLayout is true, we insert
|
|
53
|
+
* newlines on hasEOL markers and approximate line breaks using y-coordinate deltas.
|
|
54
|
+
*/
|
|
55
|
+
function assemblePageText(items, preserveLayout) {
|
|
56
|
+
if (!preserveLayout) {
|
|
57
|
+
return items.map((i) => i.str).join(" ").replace(/\s+/g, " ").trim();
|
|
58
|
+
}
|
|
59
|
+
const lines = [];
|
|
60
|
+
let current = "";
|
|
61
|
+
let lastY = null;
|
|
62
|
+
for (const it of items) {
|
|
63
|
+
const y = Array.isArray(it.transform) && it.transform.length >= 6 ? it.transform[5] : null;
|
|
64
|
+
const yChanged = y !== null && lastY !== null && Math.abs(y - lastY) > 2;
|
|
65
|
+
if (yChanged) {
|
|
66
|
+
if (current.trim())
|
|
67
|
+
lines.push(current.trimEnd());
|
|
68
|
+
current = "";
|
|
69
|
+
}
|
|
70
|
+
current += it.str;
|
|
71
|
+
if (it.hasEOL) {
|
|
72
|
+
if (current.trim())
|
|
73
|
+
lines.push(current.trimEnd());
|
|
74
|
+
current = "";
|
|
75
|
+
}
|
|
76
|
+
if (y !== null)
|
|
77
|
+
lastY = y;
|
|
78
|
+
}
|
|
79
|
+
if (current.trim())
|
|
80
|
+
lines.push(current.trimEnd());
|
|
81
|
+
return lines.join("\n");
|
|
82
|
+
}
|
|
83
|
+
/**
 * Heuristic table finder for plain page text.
 *
 * Every line is trimmed and split into cells on runs of two or more
 * whitespace characters or on tabs. Consecutive lines that yield the same
 * number of cells (at least 2) are grouped; a group of two or more rows is
 * reported as a table. Blank lines, single-cell lines, and a change in cell
 * count all end the current group.
 *
 * @param {string} text - Page text with "\n" line separators.
 * @param {number} pageNum - Page number stored on each reported table.
 * @returns {Array<{page: number, rows: string[][]}>} Tables in order of appearance.
 */
function extractTablesFromText(text, pageNum) {
    const found = [];
    let pending = [];
    let width = 0;
    // Close the current run, keeping it only if it has at least two rows.
    const commit = () => {
        if (pending.length >= 2) {
            found.push({ page: pageNum, rows: pending });
        }
        pending = [];
        width = 0;
    };
    for (const rawLine of text.split("\n")) {
        // A blank line produces zero cells, so it is handled by the same
        // "fewer than two cells" branch as an ordinary sentence.
        const cells = rawLine
            .trim()
            .split(/\s{2,}|\t+/)
            .map((cell) => cell.trim())
            .filter(Boolean);
        if (cells.length < 2) {
            commit();
            continue;
        }
        // Different column count: the previous run ends and a new one starts here.
        if (width !== 0 && cells.length !== width) {
            commit();
        }
        width = cells.length;
        pending.push(cells);
    }
    commit();
    return found;
}
|
|
129
|
+
/**
 * Score how plausible a piece of extracted text is, in the range 0..1.
 *
 * The score is `printableRatio * lengthFactor`, capped at 1:
 * - printableRatio: share of characters that are printable ASCII (32..126) or
 *   match Unicode letter / number / punctuation / whitespace classes.
 * - lengthFactor: `min(1, characters / 50)`, so very short text scores low.
 *
 * Characters are counted as Unicode code points for both the numerator and
 * the denominator. Counting the denominator in UTF-16 units (`.length`) would
 * halve the score of text written with astral-plane characters.
 *
 * @param {string} text - Extracted text; empty/whitespace-only input scores 0.
 * @returns {number} Confidence between 0 and 1 inclusive.
 */
function computeConfidence(text) {
    if (!text) {
        return 0;
    }
    const trimmed = text.trim();
    if (trimmed.length === 0) {
        return 0;
    }
    // Hoisted so the regex is created once per call, not once per character.
    const printableNonAscii = /\p{L}|\p{N}|\p{P}|\s/u;
    let total = 0;
    let printable = 0;
    // String iteration yields whole code points (surrogate pairs stay together).
    for (const ch of trimmed) {
        total++;
        const code = ch.codePointAt(0);
        if ((code >= 32 && code < 127) || printableNonAscii.test(ch)) {
            printable++;
        }
    }
    const ratio = printable / total;
    // Length factor: at least 50 characters = full confidence contribution.
    const lengthFactor = Math.min(1, total / 50);
    return Math.min(1, ratio * lengthFactor);
}
|
|
149
|
+
/**
 * Extract text, per-page text, tables and metadata from a PDF and write the
 * result as JSON.
 *
 * Steps: resolve `input.input` (download http/https URLs to a temp file,
 * otherwise treat it as a local path), load the document with the pdf.js
 * legacy build, assemble text page by page, optionally detect tables, read
 * document metadata, write the JSON to `input.output`, and return the same
 * payload plus `output_file`.
 *
 * Failures on a single page, on metadata, or on writing the output file are
 * recorded in `warnings` instead of aborting the run. Any other error is
 * returned through `errorResult`.
 *
 * Cleanup performed in all cases: the pdf.js loading task is destroyed and,
 * for URL inputs, the temporary download directory is removed.
 *
 * @param {object} input - Parsed tool input with `input`, `output`,
 *   `preserve_layout`, `extract_tables` and `max_pages` (0 = all pages).
 * @returns {Promise<object>} Whatever `toolResult` / `errorResult` produce
 *   (their shape is defined outside this file).
 */
export async function execute(input) {
    const warnings = [];
    const messageOf = (e) => (e instanceof Error ? e.message : String(e));
    // Resources that must be released no matter how the function exits.
    let tmpDir = null;
    let loadingTask = null;
    try {
        // Resolve input (URL or local path)
        let pdfPath;
        const isUrl = /^https?:\/\//i.test(input.input);
        if (isUrl) {
            debugLog("pdf-extract", "downloading url", input.input);
            pdfPath = await downloadToTmp(input.input);
            // The download lives alone in its own temp directory; remember it for cleanup.
            tmpDir = resolvePath(pdfPath, "..");
        }
        else {
            pdfPath = resolvePath(input.input);
            if (!existsSync(pdfPath)) {
                return errorResult(`PDF not found at path: ${pdfPath}`);
            }
        }
        // Load pdfjs-dist (legacy build works in Node w/o DOMMatrix)
        const pdfjs = await import("pdfjs-dist/legacy/build/pdf.mjs");
        const data = new Uint8Array(await readFile(pdfPath));
        loadingTask = pdfjs.getDocument({
            data,
            useSystemFonts: true,
            // Disable font loading / canvas / workers for Node
            isEvalSupported: false,
            disableFontFace: true,
        });
        const doc = await loadingTask.promise;
        const totalPages = doc.numPages;
        const pageLimit = input.max_pages > 0 ? Math.min(input.max_pages, totalPages) : totalPages;
        const pages = [];
        const tables = [];
        const textChunks = [];
        for (let p = 1; p <= pageLimit; p++) {
            try {
                const page = await doc.getPage(p);
                const content = await page.getTextContent();
                const pageText = assemblePageText(content.items, input.preserve_layout);
                pages.push({ num: p, text: pageText, confidence: computeConfidence(pageText) });
                textChunks.push(pageText);
                if (input.extract_tables) {
                    // Table detection needs line breaks and column gaps. The
                    // non-layout text is a single whitespace-collapsed line, so
                    // it can never contain a table; use a layout assembly instead.
                    const tableText = input.preserve_layout
                        ? pageText
                        : assemblePageText(content.items, true);
                    tables.push(...extractTablesFromText(tableText, p));
                }
            }
            catch (pageErr) {
                // Keep the page slot so page numbering in the output stays contiguous.
                warnings.push(`Page ${p}: ${messageOf(pageErr)}`);
                pages.push({ num: p, text: "", confidence: 0 });
            }
        }
        let metadataInfo = {};
        try {
            const md = await doc.getMetadata();
            metadataInfo = (md.info || {});
        }
        catch (mdErr) {
            warnings.push(`Metadata: ${messageOf(mdErr)}`);
        }
        // Mean of per-page confidences (failed pages count as 0).
        const overall = pages.length > 0
            ? pages.reduce((sum, pg) => sum + pg.confidence, 0) / pages.length
            : 0;
        const fullText = textChunks.join("\n\n");
        if (!fullText.trim()) {
            warnings.push("No text extracted via native text layer. PDF may be a scanned image — OCR fallback will land in v2.6.0.");
        }
        const result = {
            text: fullText,
            pages,
            tables,
            metadata: {
                title: typeof metadataInfo.Title === "string" ? metadataInfo.Title : undefined,
                author: typeof metadataInfo.Author === "string" ? metadataInfo.Author : undefined,
                pages: totalPages,
                extracted_at: new Date().toISOString(),
                source: input.input,
            },
            strategy_used: "native",
            overall_confidence: overall,
            warnings,
        };
        // Always write output JSON to disk
        const outputFile = resolvePath(input.output);
        try {
            await writeFile(outputFile, JSON.stringify(result, null, 2), "utf-8");
        }
        catch (wErr) {
            // `warnings` is shared with `result`, so the returned payload still carries this note.
            warnings.push(`Failed to write output file: ${messageOf(wErr)}`);
        }
        return toolResult({ ...result, output_file: outputFile });
    }
    catch (err) {
        debugLog("pdf-extract", "failed", err);
        return errorResult(messageOf(err));
    }
    finally {
        // Best-effort cleanup: problems here are logged, never surfaced to the caller.
        if (loadingTask) {
            try {
                await loadingTask.destroy();
            }
            catch (destroyErr) {
                debugLog("pdf-extract", "destroy failed", destroyErr);
            }
        }
        if (tmpDir) {
            try {
                // Local import: `rm` is not among this file's top-level imports.
                const { rm } = await import("node:fs/promises");
                await rm(tmpDir, { recursive: true, force: true });
            }
            catch (rmErr) {
                debugLog("pdf-extract", "temp cleanup failed", rmErr);
            }
        }
    }
}
|
|
244
|
+
//# sourceMappingURL=pdf-extract.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"pdf-extract.js","sourceRoot":"","sources":["../../src/tools/pdf-extract.ts"],"names":[],"mappings":"AAAA;;;;;;;GAOG;AAEH,OAAO,EAAE,CAAC,EAAE,MAAM,KAAK,CAAC;AACxB,OAAO,EAAE,QAAQ,EAAE,SAAS,EAAE,OAAO,EAAE,MAAM,kBAAkB,CAAC;AAChE,OAAO,EAAE,UAAU,EAAE,MAAM,SAAS,CAAC;AACrC,OAAO,EAAE,MAAM,EAAE,MAAM,SAAS,CAAC;AACjC,OAAO,EAAE,IAAI,EAAE,OAAO,IAAI,WAAW,EAAE,MAAM,WAAW,CAAC;AACzD,OAAO,EAAE,UAAU,EAAE,WAAW,EAAE,MAAM,2BAA2B,CAAC;AACpE,OAAO,EAAE,QAAQ,EAAE,MAAM,mBAAmB,CAAC;AAE7C,MAAM,CAAC,MAAM,IAAI,GAAG,aAAa,CAAC;AAElC,MAAM,CAAC,MAAM,WAAW,GACtB,yJAAyJ,CAAC;AAE5J,MAAM,CAAC,MAAM,MAAM,GAAG,CAAC,CAAC,MAAM,CAAC;IAC7B,KAAK,EAAE,CAAC;SACL,MAAM,EAAE;SACR,GAAG,CAAC,CAAC,CAAC;SACN,QAAQ,CAAC,sFAAsF,CAAC;IACnG,MAAM,EAAE,CAAC;SACN,MAAM,EAAE;SACR,OAAO,CAAC,kBAAkB,CAAC;SAC3B,QAAQ,CAAC,kBAAkB,CAAC;IAC/B,eAAe,EAAE,CAAC;SACf,OAAO,EAAE;SACT,OAAO,CAAC,IAAI,CAAC;SACb,QAAQ,CAAC,kEAAkE,CAAC;IAC/E,cAAc,EAAE,CAAC;SACd,OAAO,EAAE;SACT,OAAO,CAAC,IAAI,CAAC;SACb,QAAQ,CAAC,wCAAwC,CAAC;IACrD,SAAS,EAAE,CAAC;SACT,MAAM,EAAE;SACR,GAAG,CAAC,CAAC,CAAC;SACN,OAAO,CAAC,CAAC,CAAC;SACV,QAAQ,CAAC,kCAAkC,CAAC;CAChD,CAAC,CAAC;AAiDH,KAAK,UAAU,aAAa,CAAC,GAAW;IACtC,MAAM,GAAG,GAAG,MAAM,KAAK,CAAC,GAAG,CAAC,CAAC;IAC7B,IAAI,CAAC,GAAG,CAAC,EAAE;QAAE,MAAM,IAAI,KAAK,CAAC,2BAA2B,GAAG,CAAC,MAAM,IAAI,GAAG,CAAC,UAAU,MAAM,GAAG,EAAE,CAAC,CAAC;IACjG,MAAM,GAAG,GAAG,MAAM,CAAC,IAAI,CAAC,MAAM,GAAG,CAAC,WAAW,EAAE,CAAC,CAAC;IACjD,MAAM,GAAG,GAAG,MAAM,OAAO,CAAC,IAAI,CAAC,MAAM,EAAE,EAAE,eAAe,CAAC,CAAC,CAAC;IAC3D,MAAM,IAAI,GAAG,IAAI,CAAC,GAAG,EAAE,WAAW,CAAC,CAAC;IACpC,MAAM,SAAS,CAAC,IAAI,EAAE,GAAG,CAAC,CAAC;IAC3B,OAAO,IAAI,CAAC;AACd,CAAC;AAED;;;GAGG;AACH,SAAS,gBAAgB,CAAC,KAAqB,EAAE,cAAuB;IACtE,IAAI,CAAC,cAAc,EAAE,CAAC;QACpB,OAAO,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,OAAO,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC,IAAI,EAAE,CAAC;IACvE,CAAC;IAED,MAAM,KAAK,GAAa,EAAE,CAAC;IAC3B,IAAI,OAAO,GAAG,EAAE,CAAC;IACjB,IAAI,KAAK,GAAkB,IAAI,CAAC;IAEhC,KAAK,MAAM,EAAE,IAAI,KAAK,EAAE,CAAC;QACvB,MAAM,CAAC,GAAG,KA
AK,CAAC,OAAO,CAAC,EAAE,CAAC,SAAS,CAAC,IAAI,EAAE,CAAC,SAAS,CAAC,MAAM,IAAI,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC,SAAS,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC;QAC3F,MAAM,QAAQ,GAAG,CAAC,KAAK,IAAI,IAAI,KAAK,KAAK,IAAI,IAAI,IAAI,CAAC,GAAG,CAAC,CAAC,GAAG,KAAK,CAAC,GAAG,CAAC,CAAC;QAEzE,IAAI,QAAQ,EAAE,CAAC;YACb,IAAI,OAAO,CAAC,IAAI,EAAE;gBAAE,KAAK,CAAC,IAAI,CAAC,OAAO,CAAC,OAAO,EAAE,CAAC,CAAC;YAClD,OAAO,GAAG,EAAE,CAAC;QACf,CAAC;QAED,OAAO,IAAI,EAAE,CAAC,GAAG,CAAC;QAElB,IAAI,EAAE,CAAC,MAAM,EAAE,CAAC;YACd,IAAI,OAAO,CAAC,IAAI,EAAE;gBAAE,KAAK,CAAC,IAAI,CAAC,OAAO,CAAC,OAAO,EAAE,CAAC,CAAC;YAClD,OAAO,GAAG,EAAE,CAAC;QACf,CAAC;QAED,IAAI,CAAC,KAAK,IAAI;YAAE,KAAK,GAAG,CAAC,CAAC;IAC5B,CAAC;IAED,IAAI,OAAO,CAAC,IAAI,EAAE;QAAE,KAAK,CAAC,IAAI,CAAC,OAAO,CAAC,OAAO,EAAE,CAAC,CAAC;IAClD,OAAO,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;AAC1B,CAAC;AAED;;;;GAIG;AACH,SAAS,qBAAqB,CAAC,IAAY,EAAE,OAAe;IAC1D,MAAM,KAAK,GAAG,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,CAAC;IAC/B,MAAM,MAAM,GAAkB,EAAE,CAAC;IACjC,IAAI,MAAM,GAAe,EAAE,CAAC;IAC5B,IAAI,QAAQ,GAAG,CAAC,CAAC;IAEjB,MAAM,KAAK,GAAG,GAAG,EAAE;QACjB,IAAI,MAAM,CAAC,MAAM,IAAI,CAAC,EAAE,CAAC;YACvB,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,OAAO,EAAE,IAAI,EAAE,MAAM,EAAE,CAAC,CAAC;QAC/C,CAAC;QACD,MAAM,GAAG,EAAE,CAAC;QACZ,QAAQ,GAAG,CAAC,CAAC;IACf,CAAC,CAAC;IAEF,KAAK,MAAM,IAAI,IAAI,KAAK,EAAE,CAAC;QACzB,MAAM,OAAO,GAAG,IAAI,CAAC,IAAI,EAAE,CAAC;QAC5B,IAAI,CAAC,OAAO,EAAE,CAAC;YACb,KAAK,EAAE,CAAC;YACR,SAAS;QACX,CAAC;QACD,gCAAgC;QAChC,MAAM,KAAK,GAAG,OAAO,CAAC,KAAK,CAAC,YAAY,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC,CAAC,MAAM,CAAC,OAAO,CAAC,CAAC;QAC/E,IAAI,KAAK,CAAC,MAAM,IAAI,CAAC,EAAE,CAAC;YACtB,IAAI,QAAQ,KAAK,CAAC,EAAE,CAAC;gBACnB,QAAQ,GAAG,KAAK,CAAC,MAAM,CAAC;gBACxB,MAAM,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;YACrB,CAAC;iBAAM,IAAI,KAAK,CAAC,MAAM,KAAK,QAAQ,EAAE,CAAC;gBACrC,MAAM,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;YACrB,CAAC;iBAAM,CAAC;gBACN,KAAK,EAAE,CAAC;gBACR,QAAQ,GAAG,KAAK,CAAC,MAAM,CAAC;gBACxB,MAAM,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;YACrB,CAAC;QACH,CAAC;aAAM,CAAC;YACN,KAAK,EAAE,CAAC;QACV,CAAC;I
ACH,CAAC;IACD,KAAK,EAAE,CAAC;IAER,OAAO,MAAM,CAAC;AAChB,CAAC;AAED,SAAS,iBAAiB,CAAC,IAAY;IACrC,IAAI,CAAC,IAAI;QAAE,OAAO,CAAC,CAAC;IACpB,MAAM,OAAO,GAAG,IAAI,CAAC,IAAI,EAAE,CAAC;IAC5B,IAAI,OAAO,CAAC,MAAM,KAAK,CAAC;QAAE,OAAO,CAAC,CAAC;IAEnC,8EAA8E;IAC9E,IAAI,SAAS,GAAG,CAAC,CAAC;IAClB,KAAK,MAAM,EAAE,IAAI,OAAO,EAAE,CAAC;QACzB,MAAM,IAAI,GAAG,EAAE,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;QAC9B,IAAI,IAAI,IAAI,EAAE,IAAI,IAAI,GAAG,GAAG;YAAE,SAAS,EAAE,CAAC;aACrC,IAAI,uBAAuB,CAAC,IAAI,CAAC,EAAE,CAAC;YAAE,SAAS,EAAE,CAAC;IACzD,CAAC;IACD,MAAM,KAAK,GAAG,SAAS,GAAG,OAAO,CAAC,MAAM,CAAC;IACzC,kEAAkE;IAClE,MAAM,YAAY,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,OAAO,CAAC,MAAM,GAAG,EAAE,CAAC,CAAC;IACtD,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,GAAG,YAAY,CAAC,CAAC;AAC3C,CAAC;AAED,MAAM,CAAC,KAAK,UAAU,OAAO,CAAC,KAAsB;IAClD,MAAM,QAAQ,GAAa,EAAE,CAAC;IAE9B,IAAI,CAAC;QACH,oCAAoC;QACpC,IAAI,OAAe,CAAC;QACpB,MAAM,KAAK,GAAG,eAAe,CAAC,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC;QAChD,IAAI,KAAK,EAAE,CAAC;YACV,QAAQ,CAAC,aAAa,EAAE,iBAAiB,EAAE,KAAK,CAAC,KAAK,CAAC,CAAC;YACxD,OAAO,GAAG,MAAM,aAAa,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC;QAC7C,CAAC;aAAM,CAAC;YACN,OAAO,GAAG,WAAW,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC;YACnC,IAAI,CAAC,UAAU,CAAC,OAAO,CAAC,EAAE,CAAC;gBACzB,OAAO,WAAW,CAAC,0BAA0B,OAAO,EAAE,CAAC,CAAC;YAC1D,CAAC;QACH,CAAC;QAED,6DAA6D;QAC7D,8DAA8D;QAC9D,MAAM,KAAK,GAAQ,MAAM,MAAM,CAAC,iCAAiC,CAAC,CAAC;QAEnE,MAAM,IAAI,GAAG,IAAI,UAAU,CAAC,MAAM,QAAQ,CAAC,OAAO,CAAC,CAAC,CAAC;QACrD,MAAM,WAAW,GAAG,KAAK,CAAC,WAAW,CAAC;YACpC,IAAI;YACJ,cAAc,EAAE,IAAI;YACpB,mDAAmD;YACnD,eAAe,EAAE,KAAK;YACtB,eAAe,EAAE,IAAI;SACtB,CAAC,CAAC;QACH,MAAM,GAAG,GAAoB,MAAM,WAAW,CAAC,OAAO,CAAC;QAEvD,MAAM,UAAU,GAAG,GAAG,CAAC,QAAQ,CAAC;QAChC,MAAM,SAAS,GAAG,KAAK,CAAC,SAAS,GAAG,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,KAAK,CAAC,SAAS,EAAE,UAAU,CAAC,CAAC,CAAC,CAAC,UAAU,CAAC;QAE3F,MAAM,KAAK,GAAiB,EAAE,CAAC;QAC/B,MAAM,MAAM,GAAkB,EAAE,CAAC;QACjC,MAAM,UAAU,GAAa,EAAE,CAAC;QAEhC,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,IAAI,SAAS,EAAE,CAAC,EAAE,EAAE,CAAC;YACpC,IAAI,CAAC;gBACH,MAAM,IAAI,GAAG,MAAM,GAAG,CAAC,OAAO,CA
AC,CAAC,CAAC,CAAC;gBAClC,MAAM,OAAO,GAAG,MAAM,IAAI,CAAC,cAAc,EAAE,CAAC;gBAC5C,MAAM,QAAQ,GAAG,gBAAgB,CAAC,OAAO,CAAC,KAAK,EAAE,KAAK,CAAC,eAAe,CAAC,CAAC;gBACxE,MAAM,IAAI,GAAG,iBAAiB,CAAC,QAAQ,CAAC,CAAC;gBACzC,KAAK,CAAC,IAAI,CAAC,EAAE,GAAG,EAAE,CAAC,EAAE,IAAI,EAAE,QAAQ,EAAE,UAAU,EAAE,IAAI,EAAE,CAAC,CAAC;gBACzD,UAAU,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;gBAC1B,IAAI,KAAK,CAAC,cAAc,EAAE,CAAC;oBACzB,MAAM,UAAU,GAAG,qBAAqB,CAAC,QAAQ,EAAE,CAAC,CAAC,CAAC;oBACtD,MAAM,CAAC,IAAI,CAAC,GAAG,UAAU,CAAC,CAAC;gBAC7B,CAAC;YACH,CAAC;YAAC,OAAO,OAAO,EAAE,CAAC;gBACjB,QAAQ,CAAC,IAAI,CAAC,QAAQ,CAAC,KAAK,OAAO,YAAY,KAAK,CAAC,CAAC,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,OAAO,CAAC,EAAE,CAAC,CAAC;gBAC5F,KAAK,CAAC,IAAI,CAAC,EAAE,GAAG,EAAE,CAAC,EAAE,IAAI,EAAE,EAAE,EAAE,UAAU,EAAE,CAAC,EAAE,CAAC,CAAC;YAClD,CAAC;QACH,CAAC;QAED,IAAI,YAAY,GAA4B,EAAE,CAAC;QAC/C,IAAI,CAAC;YACH,MAAM,EAAE,GAAG,MAAM,GAAG,CAAC,WAAW,EAAE,CAAC;YACnC,YAAY,GAAG,CAAC,EAAE,CAAC,IAAI,IAAI,EAAE,CAA4B,CAAC;QAC5D,CAAC;QAAC,OAAO,KAAK,EAAE,CAAC;YACf,QAAQ,CAAC,IAAI,CAAC,aAAa,KAAK,YAAY,KAAK,CAAC,CAAC,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,KAAK,CAAC,EAAE,CAAC,CAAC;QACvF,CAAC;QAED,MAAM,OAAO,GACX,KAAK,CAAC,MAAM,GAAG,CAAC;YACd,CAAC,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,UAAU,EAAE,CAAC,CAAC,GAAG,KAAK,CAAC,MAAM;YAC5D,CAAC,CAAC,CAAC,CAAC;QAER,MAAM,QAAQ,GAAG,UAAU,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;QAEzC,IAAI,CAAC,QAAQ,CAAC,IAAI,EAAE,EAAE,CAAC;YACrB,QAAQ,CAAC,IAAI,CACX,yGAAyG,CAC1G,CAAC;QACJ,CAAC;QAED,MAAM,MAAM,GAAqB;YAC/B,IAAI,EAAE,QAAQ;YACd,KAAK;YACL,MAAM;YACN,QAAQ,EAAE;gBACR,KAAK,EAAE,OAAO,YAAY,CAAC,KAAK,KAAK,QAAQ,CAAC,CAAC,CAAE,YAAY,CAAC,KAAgB,CAAC,CAAC,CAAC,SAAS;gBAC1F,MAAM,EAAE,OAAO,YAAY,CAAC,MAAM,KAAK,QAAQ,CAAC,CAAC,CAAE,YAAY,CAAC,MAAiB,CAAC,CAAC,CAAC,SAAS;gBAC7F,KAAK,EAAE,UAAU;gBACjB,YAAY,EAAE,IAAI,IAAI,EAAE,CAAC,WAAW,EAAE;gBACtC,MAAM,EAAE,KAAK,CAAC,KAAK;aACpB;YACD,aAAa,EAAE,QAAQ;YACvB,kBAAkB,EAAE,OAAO;YAC3B,QAAQ;SACT,CAAC;QAEF,mCAAmC;QACnC,IAAI,CAAC;YACH,MAAM,SAAS,CAAC,WAAW,CAAC,KAAK,CAAC,MAAM,CAAC,EAAE,
IAAI,CAAC,SAAS,CAAC,MAAM,EAAE,IAAI,EAAE,CAAC,CAAC,EAAE,OAAO,CAAC,CAAC;QACvF,CAAC;QAAC,OAAO,IAAI,EAAE,CAAC;YACd,QAAQ,CAAC,IAAI,CAAC,gCAAgC,IAAI,YAAY,KAAK,CAAC,CAAC,CAAC,IAAI,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,IAAI,CAAC,EAAE,CAAC,CAAC;QACvG,CAAC;QAED,OAAO,UAAU,CAAC,EAAE,GAAG,MAAM,EAAE,WAAW,EAAE,WAAW,CAAC,KAAK,CAAC,MAAM,CAAC,EAAE,CAAC,CAAC;IAC3E,CAAC;IAAC,OAAO,GAAG,EAAE,CAAC;QACb,QAAQ,CAAC,aAAa,EAAE,QAAQ,EAAE,GAAG,CAAC,CAAC;QACvC,OAAO,WAAW,CAAC,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,GAAG,CAAC,CAAC,CAAC;IACvE,CAAC;AACH,CAAC"}
|
|
@@ -12,20 +12,20 @@ export declare const schema: z.ZodObject<{
|
|
|
12
12
|
proxy: z.ZodOptional<z.ZodString>;
|
|
13
13
|
}, "strip", z.ZodTypeAny, {
|
|
14
14
|
url: string;
|
|
15
|
-
method: "POST" | "GET" | "PUT" | "PATCH" | "DELETE";
|
|
16
15
|
timeout: number;
|
|
16
|
+
method: "POST" | "GET" | "PUT" | "PATCH" | "DELETE";
|
|
17
17
|
stealth_headers: boolean;
|
|
18
|
-
headers?: Record<string, string> | undefined;
|
|
19
|
-
proxy?: string | undefined;
|
|
20
18
|
body?: string | undefined;
|
|
19
|
+
proxy?: string | undefined;
|
|
20
|
+
headers?: Record<string, string> | undefined;
|
|
21
21
|
params?: Record<string, string> | undefined;
|
|
22
22
|
}, {
|
|
23
23
|
url: string;
|
|
24
|
-
headers?: Record<string, string> | undefined;
|
|
25
|
-
method?: "POST" | "GET" | "PUT" | "PATCH" | "DELETE" | undefined;
|
|
26
|
-
proxy?: string | undefined;
|
|
27
24
|
body?: string | undefined;
|
|
28
25
|
timeout?: number | undefined;
|
|
26
|
+
method?: "POST" | "GET" | "PUT" | "PATCH" | "DELETE" | undefined;
|
|
27
|
+
proxy?: string | undefined;
|
|
28
|
+
headers?: Record<string, string> | undefined;
|
|
29
29
|
params?: Record<string, string> | undefined;
|
|
30
30
|
stealth_headers?: boolean | undefined;
|
|
31
31
|
}>;
|
|
@@ -8,13 +8,13 @@ export declare const schema: z.ZodObject<{
|
|
|
8
8
|
chrome_profile: z.ZodOptional<z.ZodString>;
|
|
9
9
|
}, "strip", z.ZodTypeAny, {
|
|
10
10
|
url: string;
|
|
11
|
-
format: "
|
|
11
|
+
format: "text" | "html" | "markdown";
|
|
12
12
|
proxy?: string | undefined;
|
|
13
13
|
chrome_profile?: string | undefined;
|
|
14
14
|
}, {
|
|
15
15
|
url: string;
|
|
16
16
|
proxy?: string | undefined;
|
|
17
|
-
format?: "
|
|
17
|
+
format?: "text" | "html" | "markdown" | undefined;
|
|
18
18
|
chrome_profile?: string | undefined;
|
|
19
19
|
}>;
|
|
20
20
|
export type ReadabilityInput = z.infer<typeof schema>;
|
|
@@ -0,0 +1,39 @@
|
|
|
1
|
+
import { z } from "zod";
|
|
2
|
+
/** Tool name constant exported by the record-flow module. */
export declare const name = "record_flow";

/** One-line human-readable summary of the tool. */
export declare const description = "Record a headed browser workflow and save it as a generic Imperium Flow family/variant.";

/**
 * Zod object schema for the tool input.
 *
 * Required string fields: `family`, `variant`, `url`.
 * Optional string fields: `description`, `flows_dir`, `session_id`.
 * Fields with defaults (optional on input, always present after parsing):
 * `global` (boolean) and `captcha` ("auto" | "manual" | "off" | "fail").
 * Unknown keys are stripped.
 */
export declare const schema: z.ZodObject<
    {
        family: z.ZodString;
        variant: z.ZodString;
        url: z.ZodString;
        description: z.ZodOptional<z.ZodString>;
        flows_dir: z.ZodOptional<z.ZodString>;
        global: z.ZodDefault<z.ZodBoolean>;
        session_id: z.ZodOptional<z.ZodString>;
        captcha: z.ZodDefault<z.ZodEnum<["auto", "manual", "off", "fail"]>>;
    },
    "strip",
    z.ZodTypeAny,
    // Parsed (output) shape: defaults have been applied.
    {
        family: string;
        variant: string;
        url: string;
        global: boolean;
        captcha: "auto" | "off" | "manual" | "fail";
        description?: string | undefined;
        flows_dir?: string | undefined;
        session_id?: string | undefined;
    },
    // Accepted (input) shape: defaulted fields may be omitted.
    {
        family: string;
        variant: string;
        url: string;
        global?: boolean | undefined;
        captcha?: "auto" | "off" | "manual" | "fail" | undefined;
        description?: string | undefined;
        flows_dir?: string | undefined;
        session_id?: string | undefined;
    }
>;

/** Parsed input type, inferred from {@link schema}. */
export type RecordFlowInput = z.infer<typeof schema>;
|
|
33
|
+
/**
 * Entry point of the record-flow tool.
 *
 * @param input - Parsed tool input.
 * @returns A promise for an object whose `content` is a list of text parts.
 */
export declare function execute(input: RecordFlowInput): Promise<{
    content: Array<{ type: "text"; text: string }>;
}>;
|
|
39
|
+
//# sourceMappingURL=record-flow.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"record-flow.d.ts","sourceRoot":"","sources":["../../src/tools/record-flow.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,CAAC,EAAE,MAAM,KAAK,CAAC;AAgBxB,eAAO,MAAM,IAAI,gBAAgB,CAAC;AAClC,eAAO,MAAM,WAAW,4FAA4F,CAAC;AAErH,eAAO,MAAM,MAAM;;;;;;;;;;;;;;;;;;;;;;;;;;;EASjB,CAAC;AAEH,MAAM,MAAM,eAAe,GAAG,CAAC,CAAC,KAAK,CAAC,OAAO,MAAM,CAAC,CAAC;AAmSrD,wBAAsB,OAAO,CAAC,KAAK,EAAE,eAAe;;;;;GAoGnD"}
|