ai-contextify 0.1.0 → 0.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/cli.js +1 -1
- package/dist/parsers/docx.d.ts.map +1 -1
- package/dist/parsers/docx.js +26 -5
- package/dist/parsers/docx.js.map +1 -1
- package/package.json +1 -1
package/dist/cli.js
CHANGED
|
@@ -10,7 +10,7 @@ const program = new Command();
|
|
|
10
10
|
program
|
|
11
11
|
.name("ai-contextify")
|
|
12
12
|
.description("Convert files and entire projects into optimized context for LLMs (Claude, ChatGPT, Gemini).")
|
|
13
|
-
.version("0.1.0")
|
|
13
|
+
.version("0.1.1")
|
|
14
14
|
.argument("<input>", "File or directory to convert into LLM context")
|
|
15
15
|
.option("-o, --output <dir>", "Output directory", "context-output")
|
|
16
16
|
.option("-i, --include <patterns...>", "Glob patterns to include (default: everything)")
|
|
package/dist/parsers/docx.d.ts.map
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"docx.d.ts","sourceRoot":"","sources":["../../src/parsers/docx.ts"],"names":[],"mappings":"AAEA,wBAAsB,SAAS,CAAC,YAAY,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,
|
|
1
|
+
{"version":3,"file":"docx.d.ts","sourceRoot":"","sources":["../../src/parsers/docx.ts"],"names":[],"mappings":"AAEA,wBAAsB,SAAS,CAAC,YAAY,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAmCrE"}
|
package/dist/parsers/docx.js
CHANGED
|
@@ -4,13 +4,34 @@ export async function parseDocx(absolutePath) {
|
|
|
4
4
|
// so we narrow the shape ourselves and fall back to plain text on failure.
|
|
5
5
|
const mammothAny = mammoth;
|
|
6
6
|
if (typeof mammothAny.convertToMarkdown === "function") {
|
|
7
|
-
|
|
8
|
-
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
|
|
7
|
+
// Tell mammoth to drop images entirely instead of inlining them as
|
|
8
|
+
// base64 data URIs, which would explode the output size and waste tokens.
|
|
9
|
+
const options = mammothAny.images?.imgElement
|
|
10
|
+
? {
|
|
11
|
+
convertImage: mammothAny.images.imgElement(async () => ({
|
|
12
|
+
src: "",
|
|
13
|
+
})),
|
|
14
|
+
}
|
|
15
|
+
: undefined;
|
|
16
|
+
const { value } = await mammothAny.convertToMarkdown({ path: absolutePath }, options);
|
|
17
|
+
return stripImageNoise(value);
|
|
12
18
|
}
|
|
13
19
|
const { value } = await mammoth.extractRawText({ path: absolutePath });
|
|
14
20
|
return value.replace(/\r\n/g, "\n").trim();
|
|
15
21
|
}
|
|
22
|
+
/**
|
|
23
|
+
* Belt-and-suspenders: even with `convertImage` set to empty src, older
|
|
24
|
+
* mammoth versions still emit base64 data URIs. Strip them out, along with
|
|
25
|
+
* any leftover empty image links, then collapse the resulting whitespace.
|
|
26
|
+
*/
|
|
27
|
+
function stripImageNoise(markdown) {
|
|
28
|
+
return markdown
|
|
29
|
+
.replace(/\r\n/g, "\n")
|
|
30
|
+
.replace(/!\[[^\]]*\]\(data:[^)]+\)/g, "")
|
|
31
|
+
.replace(/!\[[^\]]*\]\([^)]*\)/g, "")
|
|
32
|
+
.replace(/!\[\]\(\)/g, "")
|
|
33
|
+
.replace(/[ \t]+\n/g, "\n")
|
|
34
|
+
.replace(/\n{3,}/g, "\n\n")
|
|
35
|
+
.trim();
|
|
36
|
+
}
|
|
16
37
|
//# sourceMappingURL=docx.js.map
|
package/dist/parsers/docx.js.map
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"docx.js","sourceRoot":"","sources":["../../src/parsers/docx.ts"],"names":[],"mappings":"AAAA,OAAO,OAAO,MAAM,SAAS,CAAC;AAE9B,MAAM,CAAC,KAAK,UAAU,SAAS,CAAC,YAAoB;IAClD,6EAA6E;IAC7E,2EAA2E;IAC3E,MAAM,UAAU,GAAG,
|
|
1
|
+
{"version":3,"file":"docx.js","sourceRoot":"","sources":["../../src/parsers/docx.ts"],"names":[],"mappings":"AAAA,OAAO,OAAO,MAAM,SAAS,CAAC;AAE9B,MAAM,CAAC,KAAK,UAAU,SAAS,CAAC,YAAoB;IAClD,6EAA6E;IAC7E,2EAA2E;IAC3E,MAAM,UAAU,GAAG,OASlB,CAAC;IAEF,IAAI,OAAO,UAAU,CAAC,iBAAiB,KAAK,UAAU,EAAE,CAAC;QACvD,mEAAmE;QACnE,0EAA0E;QAC1E,MAAM,OAAO,GACX,UAAU,CAAC,MAAM,EAAE,UAAU;YAC3B,CAAC,CAAC;gBACE,YAAY,EAAE,UAAU,CAAC,MAAM,CAAC,UAAU,CAAC,KAAK,IAAI,EAAE,CAAC,CAAC;oBACtD,GAAG,EAAE,EAAE;iBACR,CAAC,CAAC;aACJ;YACH,CAAC,CAAC,SAAS,CAAC;QAEhB,MAAM,EAAE,KAAK,EAAE,GAAG,MAAM,UAAU,CAAC,iBAAiB,CAClD,EAAE,IAAI,EAAE,YAAY,EAAE,EACtB,OAAO,CACR,CAAC;QACF,OAAO,eAAe,CAAC,KAAK,CAAC,CAAC;IAChC,CAAC;IAED,MAAM,EAAE,KAAK,EAAE,GAAG,MAAM,OAAO,CAAC,cAAc,CAAC,EAAE,IAAI,EAAE,YAAY,EAAE,CAAC,CAAC;IACvE,OAAO,KAAK,CAAC,OAAO,CAAC,OAAO,EAAE,IAAI,CAAC,CAAC,IAAI,EAAE,CAAC;AAC7C,CAAC;AAED;;;;GAIG;AACH,SAAS,eAAe,CAAC,QAAgB;IACvC,OAAO,QAAQ;SACZ,OAAO,CAAC,OAAO,EAAE,IAAI,CAAC;SACtB,OAAO,CAAC,4BAA4B,EAAE,EAAE,CAAC;SACzC,OAAO,CAAC,uBAAuB,EAAE,EAAE,CAAC;SACpC,OAAO,CAAC,YAAY,EAAE,EAAE,CAAC;SACzB,OAAO,CAAC,WAAW,EAAE,IAAI,CAAC;SAC1B,OAAO,CAAC,SAAS,EAAE,MAAM,CAAC;SAC1B,IAAI,EAAE,CAAC;AACZ,CAAC"}
|