@lov3kaizen/agentsea-ingest 0.5.1

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
package/package.json ADDED
@@ -0,0 +1,89 @@
1
+ {
2
+ "name": "@lov3kaizen/agentsea-ingest",
3
+ "version": "0.5.1",
4
+ "description": "Comprehensive document processing pipeline for Node.js - PDF, DOCX, HTML, Markdown parsing with intelligent chunking, table/image extraction, and OCR",
5
+ "type": "module",
6
+ "main": "./dist/index.js",
7
+ "module": "./dist/index.js",
8
+ "types": "./dist/index.d.ts",
9
+ "exports": {
10
+ ".": {
11
+ "import": "./dist/index.js",
12
+ "types": "./dist/index.d.ts"
13
+ }
14
+ },
15
+ "files": [
16
+ "dist",
17
+ "README.md"
18
+ ],
19
+ "dependencies": {
20
+ "cheerio": "^1.0.0",
21
+ "eventemitter3": "^5.0.1",
22
+ "file-type": "^19.6.0",
23
+ "franc": "^6.2.0",
24
+ "mammoth": "^1.8.0",
25
+ "marked": "^15.0.4",
26
+ "nanoid": "^5.0.7",
27
+ "natural": "^8.0.1",
28
+ "pdf-parse": "^1.1.1",
29
+ "xlsx": "^0.18.5",
30
+ "zod": "^3.24.1"
31
+ },
32
+ "optionalDependencies": {
33
+ "tesseract.js": "^5.1.1"
34
+ },
35
+ "devDependencies": {
36
+ "@types/node": "^22.9.0",
37
+ "@types/pdf-parse": "^1.1.4",
38
+ "rimraf": "^6.0.1",
39
+ "tsup": "^8.5.0",
40
+ "typescript": "^5.9.3",
41
+ "vitest": "^3.2.3"
42
+ },
43
+ "peerDependencies": {
44
+ "@google-cloud/vision": "^4.0.0",
45
+ "@lov3kaizen/agentsea-core": "0.5.1",
46
+ "@lov3kaizen/agentsea-embeddings": "0.5.1"
47
+ },
48
+ "peerDependenciesMeta": {
49
+ "@google-cloud/vision": {
50
+ "optional": true
51
+ },
52
+ "@lov3kaizen/agentsea-core": {
53
+ "optional": true
54
+ },
55
+ "@lov3kaizen/agentsea-embeddings": {
56
+ "optional": true
57
+ }
58
+ },
59
+ "keywords": [
60
+ "document",
61
+ "processing",
62
+ "pdf",
63
+ "docx",
64
+ "html",
65
+ "markdown",
66
+ "chunking",
67
+ "rag",
68
+ "ingestion",
69
+ "ocr",
70
+ "table-extraction",
71
+ "ai",
72
+ "llm"
73
+ ],
74
+ "author": "lov3kaizen",
75
+ "license": "MIT",
76
+ "repository": {
77
+ "type": "git",
78
+ "url": "https://github.com/lov3kaizen/agentsea-ingest"
79
+ },
80
+ "scripts": {
81
+ "build": "tsup",
82
+ "dev": "tsup --watch",
83
+ "typecheck": "tsc --noEmit",
84
+ "test": "vitest run",
85
+ "test:watch": "vitest",
86
+ "lint": "eslint src --ext .ts",
87
+ "clean": "rimraf dist"
88
+ }
89
+ }