pdf-oxide 0.3.24 → 0.3.28

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (271) hide show
  1. package/lib/builders/annotation-builder.d.ts +199 -0
  2. package/lib/builders/annotation-builder.d.ts.map +1 -0
  3. package/lib/builders/annotation-builder.js +318 -0
  4. package/lib/builders/annotation-builder.js.map +1 -0
  5. package/lib/builders/conversion-options-builder.d.ts +107 -0
  6. package/lib/builders/conversion-options-builder.d.ts.map +1 -0
  7. package/lib/builders/conversion-options-builder.js +215 -0
  8. package/lib/builders/conversion-options-builder.js.map +1 -0
  9. package/{src/builders/index.ts → lib/builders/index.d.ts} +1 -1
  10. package/lib/builders/index.d.ts.map +1 -0
  11. package/lib/builders/index.js +12 -0
  12. package/lib/builders/index.js.map +1 -0
  13. package/lib/builders/metadata-builder.d.ts +202 -0
  14. package/lib/builders/metadata-builder.d.ts.map +1 -0
  15. package/lib/builders/metadata-builder.js +286 -0
  16. package/lib/builders/metadata-builder.js.map +1 -0
  17. package/lib/builders/pdf-builder.d.ts +215 -0
  18. package/lib/builders/pdf-builder.d.ts.map +1 -0
  19. package/lib/builders/pdf-builder.js +339 -0
  20. package/lib/builders/pdf-builder.js.map +1 -0
  21. package/lib/builders/search-options-builder.d.ts +74 -0
  22. package/lib/builders/search-options-builder.d.ts.map +1 -0
  23. package/lib/builders/search-options-builder.js +130 -0
  24. package/lib/builders/search-options-builder.js.map +1 -0
  25. package/lib/document-editor-manager.d.ts +140 -0
  26. package/lib/document-editor-manager.d.ts.map +1 -0
  27. package/lib/document-editor-manager.js +257 -0
  28. package/lib/document-editor-manager.js.map +1 -0
  29. package/lib/errors.d.ts +383 -0
  30. package/lib/errors.d.ts.map +1 -0
  31. package/lib/errors.js +1117 -0
  32. package/lib/errors.js.map +1 -0
  33. package/lib/form-field-manager.d.ts +300 -0
  34. package/lib/form-field-manager.d.ts.map +1 -0
  35. package/lib/form-field-manager.js +567 -0
  36. package/lib/form-field-manager.js.map +1 -0
  37. package/lib/hybrid-ml-manager.d.ts +143 -0
  38. package/lib/hybrid-ml-manager.d.ts.map +1 -0
  39. package/lib/hybrid-ml-manager.js +209 -0
  40. package/lib/hybrid-ml-manager.js.map +1 -0
  41. package/lib/index.d.ts +23 -0
  42. package/lib/index.d.ts.map +1 -0
  43. package/lib/index.js +280 -0
  44. package/lib/index.js.map +1 -0
  45. package/lib/managers/accessibility-manager.d.ts +149 -0
  46. package/lib/managers/accessibility-manager.d.ts.map +1 -0
  47. package/lib/managers/accessibility-manager.js +224 -0
  48. package/lib/managers/accessibility-manager.js.map +1 -0
  49. package/lib/managers/annotation-manager.d.ts +220 -0
  50. package/lib/managers/annotation-manager.d.ts.map +1 -0
  51. package/lib/managers/annotation-manager.js +360 -0
  52. package/lib/managers/annotation-manager.js.map +1 -0
  53. package/lib/managers/barcode-manager.d.ts +80 -0
  54. package/lib/managers/barcode-manager.d.ts.map +1 -0
  55. package/lib/managers/barcode-manager.js +226 -0
  56. package/lib/managers/barcode-manager.js.map +1 -0
  57. package/lib/managers/batch-manager.d.ts +186 -0
  58. package/lib/managers/batch-manager.d.ts.map +1 -0
  59. package/lib/managers/batch-manager.js +389 -0
  60. package/lib/managers/batch-manager.js.map +1 -0
  61. package/lib/managers/cache-manager.d.ts +182 -0
  62. package/lib/managers/cache-manager.d.ts.map +1 -0
  63. package/lib/managers/cache-manager.js +387 -0
  64. package/lib/managers/cache-manager.js.map +1 -0
  65. package/lib/managers/compliance-manager.d.ts +104 -0
  66. package/lib/managers/compliance-manager.d.ts.map +1 -0
  67. package/lib/managers/compliance-manager.js +415 -0
  68. package/lib/managers/compliance-manager.js.map +1 -0
  69. package/lib/managers/content-manager.d.ts +121 -0
  70. package/lib/managers/content-manager.d.ts.map +1 -0
  71. package/lib/managers/content-manager.js +295 -0
  72. package/lib/managers/content-manager.js.map +1 -0
  73. package/lib/managers/document-utility-manager.d.ts +370 -0
  74. package/lib/managers/document-utility-manager.d.ts.map +1 -0
  75. package/lib/managers/document-utility-manager.js +731 -0
  76. package/lib/managers/document-utility-manager.js.map +1 -0
  77. package/lib/managers/dom-pdf-creator.d.ts +105 -0
  78. package/lib/managers/dom-pdf-creator.d.ts.map +1 -0
  79. package/lib/managers/dom-pdf-creator.js +300 -0
  80. package/lib/managers/dom-pdf-creator.js.map +1 -0
  81. package/lib/managers/editing-manager.d.ts +249 -0
  82. package/lib/managers/editing-manager.d.ts.map +1 -0
  83. package/lib/managers/editing-manager.js +388 -0
  84. package/lib/managers/editing-manager.js.map +1 -0
  85. package/lib/managers/enterprise-manager.d.ts +193 -0
  86. package/lib/managers/enterprise-manager.d.ts.map +1 -0
  87. package/lib/managers/enterprise-manager.js +305 -0
  88. package/lib/managers/enterprise-manager.js.map +1 -0
  89. package/lib/managers/extended-managers.d.ts +123 -0
  90. package/lib/managers/extended-managers.d.ts.map +1 -0
  91. package/lib/managers/extended-managers.js +658 -0
  92. package/lib/managers/extended-managers.js.map +1 -0
  93. package/lib/managers/extraction-manager.d.ts +247 -0
  94. package/lib/managers/extraction-manager.d.ts.map +1 -0
  95. package/lib/managers/extraction-manager.js +478 -0
  96. package/lib/managers/extraction-manager.js.map +1 -0
  97. package/lib/managers/final-utilities.d.ts +128 -0
  98. package/lib/managers/final-utilities.d.ts.map +1 -0
  99. package/lib/managers/final-utilities.js +653 -0
  100. package/lib/managers/final-utilities.js.map +1 -0
  101. package/lib/managers/hybrid-ml-advanced.d.ts +137 -0
  102. package/lib/managers/hybrid-ml-advanced.d.ts.map +1 -0
  103. package/lib/managers/hybrid-ml-advanced.js +707 -0
  104. package/lib/managers/hybrid-ml-advanced.js.map +1 -0
  105. package/lib/managers/index.d.ts +65 -0
  106. package/lib/managers/index.d.ts.map +1 -0
  107. package/lib/managers/index.js +70 -0
  108. package/lib/managers/index.js.map +1 -0
  109. package/lib/managers/layer-manager.d.ts +204 -0
  110. package/lib/managers/layer-manager.d.ts.map +1 -0
  111. package/lib/managers/layer-manager.js +403 -0
  112. package/lib/managers/layer-manager.js.map +1 -0
  113. package/lib/managers/metadata-manager.d.ts +149 -0
  114. package/lib/managers/metadata-manager.d.ts.map +1 -0
  115. package/lib/managers/metadata-manager.js +281 -0
  116. package/lib/managers/metadata-manager.js.map +1 -0
  117. package/lib/managers/ocr-manager.d.ts +195 -0
  118. package/lib/managers/ocr-manager.d.ts.map +1 -0
  119. package/lib/managers/ocr-manager.js +583 -0
  120. package/lib/managers/ocr-manager.js.map +1 -0
  121. package/lib/managers/optimization-manager.d.ts +103 -0
  122. package/lib/managers/optimization-manager.d.ts.map +1 -0
  123. package/lib/managers/optimization-manager.js +194 -0
  124. package/lib/managers/optimization-manager.js.map +1 -0
  125. package/lib/managers/outline-manager.d.ts +102 -0
  126. package/lib/managers/outline-manager.d.ts.map +1 -0
  127. package/lib/managers/outline-manager.js +170 -0
  128. package/lib/managers/outline-manager.js.map +1 -0
  129. package/lib/managers/page-manager.d.ts +143 -0
  130. package/lib/managers/page-manager.d.ts.map +1 -0
  131. package/lib/managers/page-manager.js +237 -0
  132. package/lib/managers/page-manager.js.map +1 -0
  133. package/lib/managers/pattern-detection.d.ts +170 -0
  134. package/lib/managers/pattern-detection.d.ts.map +1 -0
  135. package/lib/managers/pattern-detection.js +325 -0
  136. package/lib/managers/pattern-detection.js.map +1 -0
  137. package/lib/managers/rendering-manager.d.ts +354 -0
  138. package/lib/managers/rendering-manager.d.ts.map +1 -0
  139. package/lib/managers/rendering-manager.js +680 -0
  140. package/lib/managers/rendering-manager.js.map +1 -0
  141. package/lib/managers/search-manager.d.ts +236 -0
  142. package/lib/managers/search-manager.d.ts.map +1 -0
  143. package/lib/managers/search-manager.js +330 -0
  144. package/lib/managers/search-manager.js.map +1 -0
  145. package/lib/managers/security-manager.d.ts +162 -0
  146. package/lib/managers/security-manager.d.ts.map +1 -0
  147. package/lib/managers/security-manager.js +293 -0
  148. package/lib/managers/security-manager.js.map +1 -0
  149. package/lib/managers/signature-manager.d.ts +725 -0
  150. package/lib/managers/signature-manager.d.ts.map +1 -0
  151. package/lib/managers/signature-manager.js +1365 -0
  152. package/lib/managers/signature-manager.js.map +1 -0
  153. package/lib/managers/streams.d.ts +263 -0
  154. package/lib/managers/streams.d.ts.map +1 -0
  155. package/lib/managers/streams.js +472 -0
  156. package/lib/managers/streams.js.map +1 -0
  157. package/lib/managers/xfa-manager.d.ts +228 -0
  158. package/lib/managers/xfa-manager.d.ts.map +1 -0
  159. package/lib/managers/xfa-manager.js +490 -0
  160. package/lib/managers/xfa-manager.js.map +1 -0
  161. package/lib/pdf-creator-manager.d.ts +201 -0
  162. package/lib/pdf-creator-manager.d.ts.map +1 -0
  163. package/lib/pdf-creator-manager.js +379 -0
  164. package/lib/pdf-creator-manager.js.map +1 -0
  165. package/lib/properties.d.ts +80 -0
  166. package/lib/properties.d.ts.map +1 -0
  167. package/lib/properties.js +455 -0
  168. package/lib/properties.js.map +1 -0
  169. package/lib/result-accessors-manager.d.ts +347 -0
  170. package/lib/result-accessors-manager.d.ts.map +1 -0
  171. package/lib/result-accessors-manager.js +705 -0
  172. package/lib/result-accessors-manager.js.map +1 -0
  173. package/lib/thumbnail-manager.d.ts +122 -0
  174. package/lib/thumbnail-manager.d.ts.map +1 -0
  175. package/lib/thumbnail-manager.js +206 -0
  176. package/lib/thumbnail-manager.js.map +1 -0
  177. package/lib/types/common.d.ts +93 -0
  178. package/lib/types/common.d.ts.map +1 -0
  179. package/lib/types/common.js +5 -0
  180. package/lib/types/common.js.map +1 -0
  181. package/lib/types/document-types.d.ts +353 -0
  182. package/lib/types/document-types.d.ts.map +1 -0
  183. package/lib/types/document-types.js +83 -0
  184. package/lib/types/document-types.js.map +1 -0
  185. package/{src/types/index.ts → lib/types/index.d.ts} +1 -1
  186. package/lib/types/index.d.ts.map +1 -0
  187. package/lib/types/index.js +6 -0
  188. package/lib/types/index.js.map +1 -0
  189. package/lib/types/manager-types.d.ts +180 -0
  190. package/lib/types/manager-types.d.ts.map +1 -0
  191. package/lib/types/manager-types.js +99 -0
  192. package/lib/types/manager-types.js.map +1 -0
  193. package/lib/types/native-bindings.d.ts +440 -0
  194. package/lib/types/native-bindings.d.ts.map +1 -0
  195. package/lib/types/native-bindings.js +8 -0
  196. package/lib/types/native-bindings.js.map +1 -0
  197. package/{src/workers/index.ts → lib/workers/index.d.ts} +1 -1
  198. package/lib/workers/index.d.ts.map +1 -0
  199. package/lib/workers/index.js +6 -0
  200. package/lib/workers/index.js.map +1 -0
  201. package/lib/workers/pool.d.ts +65 -0
  202. package/lib/workers/pool.d.ts.map +1 -0
  203. package/lib/workers/pool.js +195 -0
  204. package/lib/workers/pool.js.map +1 -0
  205. package/lib/workers/worker.d.ts +6 -0
  206. package/lib/workers/worker.d.ts.map +1 -0
  207. package/lib/workers/worker.js +100 -0
  208. package/lib/workers/worker.js.map +1 -0
  209. package/package.json +12 -22
  210. package/prebuilds/darwin-arm64/pdf_oxide.node +0 -0
  211. package/prebuilds/darwin-x64/pdf_oxide.node +0 -0
  212. package/prebuilds/linux-arm64/pdf_oxide.node +0 -0
  213. package/prebuilds/linux-x64/pdf_oxide.node +0 -0
  214. package/prebuilds/win32-x64/pdf_oxide.node +0 -0
  215. package/binding.gyp +0 -35
  216. package/src/builders/annotation-builder.ts +0 -367
  217. package/src/builders/conversion-options-builder.ts +0 -257
  218. package/src/builders/metadata-builder.ts +0 -317
  219. package/src/builders/pdf-builder.ts +0 -386
  220. package/src/builders/search-options-builder.ts +0 -151
  221. package/src/document-editor-manager.ts +0 -318
  222. package/src/errors.ts +0 -1629
  223. package/src/form-field-manager.ts +0 -666
  224. package/src/hybrid-ml-manager.ts +0 -283
  225. package/src/index.ts +0 -453
  226. package/src/managers/accessibility-manager.ts +0 -338
  227. package/src/managers/annotation-manager.ts +0 -439
  228. package/src/managers/barcode-manager.ts +0 -235
  229. package/src/managers/batch-manager.ts +0 -533
  230. package/src/managers/cache-manager.ts +0 -486
  231. package/src/managers/compliance-manager.ts +0 -375
  232. package/src/managers/content-manager.ts +0 -339
  233. package/src/managers/document-utility-manager.ts +0 -922
  234. package/src/managers/dom-pdf-creator.ts +0 -365
  235. package/src/managers/editing-manager.ts +0 -514
  236. package/src/managers/enterprise-manager.ts +0 -478
  237. package/src/managers/extended-managers.ts +0 -437
  238. package/src/managers/extraction-manager.ts +0 -583
  239. package/src/managers/final-utilities.ts +0 -429
  240. package/src/managers/hybrid-ml-advanced.ts +0 -479
  241. package/src/managers/index.ts +0 -239
  242. package/src/managers/layer-manager.ts +0 -500
  243. package/src/managers/metadata-manager.ts +0 -303
  244. package/src/managers/ocr-manager.ts +0 -756
  245. package/src/managers/optimization-manager.ts +0 -262
  246. package/src/managers/outline-manager.ts +0 -196
  247. package/src/managers/page-manager.ts +0 -289
  248. package/src/managers/pattern-detection.ts +0 -440
  249. package/src/managers/rendering-manager.ts +0 -863
  250. package/src/managers/search-manager.ts +0 -385
  251. package/src/managers/security-manager.ts +0 -345
  252. package/src/managers/signature-manager.ts +0 -1664
  253. package/src/managers/streams.ts +0 -618
  254. package/src/managers/xfa-manager.ts +0 -500
  255. package/src/pdf-creator-manager.ts +0 -494
  256. package/src/properties.ts +0 -522
  257. package/src/result-accessors-manager.ts +0 -867
  258. package/src/tests/advanced-features.test.ts +0 -414
  259. package/src/tests/advanced.test.ts +0 -266
  260. package/src/tests/extended-managers.test.ts +0 -316
  261. package/src/tests/final-utilities.test.ts +0 -455
  262. package/src/tests/foundation.test.ts +0 -315
  263. package/src/tests/high-demand.test.ts +0 -257
  264. package/src/tests/specialized.test.ts +0 -97
  265. package/src/thumbnail-manager.ts +0 -272
  266. package/src/types/common.ts +0 -142
  267. package/src/types/document-types.ts +0 -457
  268. package/src/types/manager-types.ts +0 -284
  269. package/src/types/native-bindings.ts +0 -517
  270. package/src/workers/pool.ts +0 -274
  271. package/src/workers/worker.ts +0 -131
@@ -1,756 +0,0 @@
1
- /**
2
- * OcrManager - Canonical OCR Manager (merged from 3 implementations)
3
- *
4
- * Consolidates:
5
- * - src/ocr-manager.ts (simple API with setLanguage, extractText, analyzePage)
6
- * - src/managers/ocr-compliance-cache.ts OCRManager (engine lifecycle)
7
- * - src/managers/ocr-manager-typed.ts OCRManager (full TypeScript, FFI-wired)
8
- *
9
- * Provides optical character recognition operations with complete type safety,
10
- * proper error handling, and full FFI integration.
11
- */
12
-
13
- import {
14
- BaseManager,
15
- OcrLanguage,
16
- OcrResult,
17
- OcrBatchResult,
18
- TextRegion,
19
- PdfDocumentHandle,
20
- ManagerOptions,
21
- } from '../types/manager-types.js';
22
- import { promises as fs } from 'fs';
23
- import { dirname } from 'path';
24
-
25
- // Re-export types for convenience
26
- export { OcrLanguage };
27
- export type { OcrResult, OcrBatchResult, TextRegion };
28
-
29
- /**
30
- * OCR detection modes for accuracy/speed tradeoff
31
- */
32
- export enum OcrDetectionMode {
33
- Accurate = 'accurate',
34
- Fast = 'fast',
35
- Balanced = 'balanced',
36
- }
37
-
38
- /**
39
- * Configuration for OCR operations
40
- */
41
- export interface OcrConfig {
42
- language?: OcrLanguage;
43
- detectionMode?: OcrDetectionMode;
44
- detectionThreshold?: number;
45
- recognitionThreshold?: number;
46
- maxSideLen?: number;
47
- useGpu?: boolean;
48
- gpuDeviceId?: number;
49
- }
50
-
51
- /**
52
- * A recognized text span with position and confidence
53
- */
54
- export interface OcrSpan {
55
- text: string;
56
- confidence: number;
57
- x: number;
58
- y: number;
59
- width: number;
60
- height: number;
61
- charCount: number;
62
- }
63
-
64
- /**
65
- * Analysis result for a single page
66
- */
67
- export interface OcrPageAnalysis {
68
- pageIndex: number;
69
- needsOcr: boolean;
70
- confidence: number;
71
- spanCount: number;
72
- text: string;
73
- }
74
-
75
- /**
76
- * Canonical OcrManager - Comprehensive OCR with full TypeScript support
77
- *
78
- * Features:
79
- * - Full text recognition with confidence scoring
80
- * - Batch page processing with skip optimization
81
- * - Text region detection with coordinates
82
- * - Multi-language support
83
- * - Comprehensive event emission
84
- * - Automatic resource cleanup
85
- * - Legacy API compatibility (setLanguage, extractText, analyzePage, etc.)
86
- */
87
- export class OcrManager extends BaseManager<PdfDocumentHandle> {
88
- private ocrEngine: unknown | null = null;
89
- private currentLanguage: OcrLanguage = OcrLanguage.ENGLISH;
90
- private preprocessingType: string = 'auto';
91
- private native: any;
92
-
93
- constructor(document: PdfDocumentHandle, options?: ManagerOptions) {
94
- super(document, options);
95
- try {
96
- this.native = require('../../index.node');
97
- } catch {
98
- this.native = null;
99
- }
100
- }
101
-
102
- // ==========================================================================
103
- // Engine Lifecycle (from typed version)
104
- // ==========================================================================
105
-
106
- /**
107
- * Initialize OCR engine with specified configuration
108
- */
109
- async initializeEngine(
110
- detectionThreshold: number = 0.5,
111
- recognitionThreshold: number = 0.5,
112
- maxSideLen: number = 960,
113
- useGpu: boolean = false,
114
- gpuDeviceId: number = 0
115
- ): Promise<boolean> {
116
- try {
117
- this.recordOperation();
118
-
119
- if (this.ocrEngine) {
120
- return true;
121
- }
122
-
123
- this.ocrEngine = await (this.document as any)?.createOcrEngine(
124
- detectionThreshold,
125
- recognitionThreshold,
126
- maxSideLen,
127
- useGpu,
128
- gpuDeviceId
129
- );
130
-
131
- if (this.ocrEngine) {
132
- this.emit('ocr-engine-initialized', {
133
- useGpu,
134
- gpuDeviceId,
135
- detectionThreshold,
136
- recognitionThreshold,
137
- });
138
- return true;
139
- }
140
-
141
- return false;
142
- } catch (error) {
143
- this.recordError(error instanceof Error ? error : new Error(String(error)));
144
- throw error;
145
- }
146
- }
147
-
148
- /**
149
- * Destroy OCR engine and free resources
150
- */
151
- async destroyOcrEngine(): Promise<void> {
152
- try {
153
- this.recordOperation();
154
-
155
- if (this.ocrEngine) {
156
- await (this.document as any)?.destroyOcrEngine(this.ocrEngine);
157
- this.ocrEngine = null;
158
- this.emit('ocr-engine-destroyed', { timestamp: Date.now() });
159
- }
160
- } catch (error) {
161
- this.recordError(error instanceof Error ? error : new Error(String(error)));
162
- throw error;
163
- }
164
- }
165
-
166
- // ==========================================================================
167
- // Core Recognition (from typed version)
168
- // ==========================================================================
169
-
170
- /**
171
- * Check if page needs OCR processing
172
- */
173
- async pageNeedsOcr(pageIndex: number): Promise<boolean> {
174
- try {
175
- this.recordOperation();
176
- return (await (this.document as any)?.pageNeedsOcr(pageIndex)) || false;
177
- } catch (error) {
178
- this.recordError(error instanceof Error ? error : new Error(String(error)));
179
- throw error;
180
- }
181
- }
182
-
183
- /**
184
- * Recognize text on a page with full confidence scoring
185
- */
186
- async recognizePage(pageIndex: number): Promise<string> {
187
- try {
188
- this.recordOperation();
189
-
190
- if (!this.ocrEngine) {
191
- throw new Error('OCR engine not initialized. Call initializeEngine() first.');
192
- }
193
-
194
- const text = await (this.document as any)?.recognizePage(
195
- pageIndex,
196
- this.ocrEngine
197
- );
198
-
199
- this.emit('page-recognized', {
200
- pageIndex,
201
- textLength: text?.length || 0,
202
- timestamp: Date.now(),
203
- });
204
-
205
- return text || '';
206
- } catch (error) {
207
- this.recordError(error instanceof Error ? error : new Error(String(error)));
208
- throw error;
209
- }
210
- }
211
-
212
- /**
213
- * Get OCR confidence score for a page
214
- */
215
- async getOcrConfidence(pageIndex: number): Promise<number> {
216
- try {
217
- this.recordOperation();
218
-
219
- if (!this.ocrEngine) {
220
- return 0;
221
- }
222
-
223
- return (await (this.document as any)?.getOcrConfidence(pageIndex)) || 0;
224
- } catch (error) {
225
- this.recordError(error instanceof Error ? error : new Error(String(error)));
226
- throw error;
227
- }
228
- }
229
-
230
- /**
231
- * Detect text regions on a page with bounding boxes
232
- */
233
- async detectTextRegions(pageIndex: number): Promise<TextRegion[]> {
234
- try {
235
- this.recordOperation();
236
-
237
- if (!this.ocrEngine) {
238
- return [];
239
- }
240
-
241
- const regions = await (this.document as any)?.detectTextRegions(
242
- pageIndex,
243
- this.ocrEngine
244
- );
245
-
246
- return regions || [];
247
- } catch (error) {
248
- this.recordError(error instanceof Error ? error : new Error(String(error)));
249
- throw error;
250
- }
251
- }
252
-
253
- // ==========================================================================
254
- // Language Configuration (from typed + root versions)
255
- // ==========================================================================
256
-
257
- /**
258
- * Set OCR language for recognition (FFI-wired)
259
- */
260
- async setOcrLanguage(language: OcrLanguage | string): Promise<boolean> {
261
- try {
262
- this.recordOperation();
263
-
264
- if (!this.ocrEngine) {
265
- throw new Error('OCR engine not initialized');
266
- }
267
-
268
- const result = await (this.document as any)?.setOcrLanguage(
269
- this.ocrEngine,
270
- language
271
- );
272
-
273
- if (result) {
274
- this.currentLanguage = (language as OcrLanguage) || OcrLanguage.ENGLISH;
275
- this.emit('language-changed', {
276
- language,
277
- timestamp: Date.now(),
278
- });
279
- }
280
-
281
- return !!result;
282
- } catch (error) {
283
- this.recordError(error instanceof Error ? error : new Error(String(error)));
284
- throw error;
285
- }
286
- }
287
-
288
- /**
289
- * Sets the OCR language (convenience alias for setOcrLanguage)
290
- * From root-level OCRManager
291
- */
292
- setLanguage(language: OcrLanguage): void {
293
- this.currentLanguage = language;
294
- this.invalidateCache('ocr');
295
- this.emit('languageChanged', language);
296
- }
297
-
298
- /**
299
- * Gets the current OCR language
300
- * From root-level OCRManager
301
- */
302
- getLanguage(): OcrLanguage {
303
- return this.currentLanguage;
304
- }
305
-
306
- /**
307
- * Get available OCR languages
308
- */
309
- async getAvailableLanguages(): Promise<OcrLanguage[]> {
310
- try {
311
- this.recordOperation();
312
-
313
- const languages =
314
- (await (this.document as any)?.getAvailableLanguages()) ||
315
- Object.values(OcrLanguage);
316
-
317
- return languages;
318
- } catch (error) {
319
- this.recordError(error instanceof Error ? error : new Error(String(error)));
320
- throw error;
321
- }
322
- }
323
-
324
- // ==========================================================================
325
- // Processing & Export (from typed version)
326
- // ==========================================================================
327
-
328
- /**
329
- * Preprocess page before OCR for better recognition
330
- */
331
- async preprocessPage(
332
- pageIndex: number,
333
- preprocessingType: string = 'auto'
334
- ): Promise<boolean> {
335
- try {
336
- this.recordOperation();
337
-
338
- const result = await (this.document as any)?.preprocessPage(
339
- pageIndex,
340
- preprocessingType
341
- );
342
-
343
- this.preprocessingType = preprocessingType;
344
- this.emit('page-preprocessed', {
345
- pageIndex,
346
- type: preprocessingType,
347
- timestamp: Date.now(),
348
- });
349
-
350
- return !!result;
351
- } catch (error) {
352
- this.recordError(error instanceof Error ? error : new Error(String(error)));
353
- throw error;
354
- }
355
- }
356
-
357
- /**
358
- * Export OCR text to file
359
- */
360
- async exportOcrText(
361
- pageIndex: number,
362
- filePath: string,
363
- format: 'txt' | 'json' | 'xml' = 'txt'
364
- ): Promise<boolean> {
365
- try {
366
- this.recordOperation();
367
-
368
- const text = await this.recognizePage(pageIndex);
369
-
370
- await fs.mkdir(dirname(filePath), { recursive: true });
371
-
372
- let content: string;
373
- switch (format) {
374
- case 'json':
375
- content = JSON.stringify(
376
- { pageIndex, text, timestamp: Date.now() },
377
- null,
378
- 2
379
- );
380
- break;
381
- case 'xml':
382
- content = `<?xml version="1.0"?>\n<page index="${pageIndex}">\n${text.split('\n').map(line => ` <line>${line}</line>`).join('\n')}\n</page>`;
383
- break;
384
- default:
385
- content = text;
386
- }
387
-
388
- await fs.writeFile(filePath, content, 'utf8');
389
-
390
- this.emit('text-exported', {
391
- pageIndex,
392
- filePath,
393
- format,
394
- size: content.length,
395
- timestamp: Date.now(),
396
- });
397
-
398
- return true;
399
- } catch (error) {
400
- this.recordError(error instanceof Error ? error : new Error(String(error)));
401
- throw error;
402
- }
403
- }
404
-
405
- // ==========================================================================
406
- // Statistics & Batch (from typed version)
407
- // ==========================================================================
408
-
409
- /**
410
- * Get comprehensive OCR statistics for a page
411
- */
412
- async getOcrStatistics(pageIndex: number): Promise<OcrResult> {
413
- try {
414
- this.recordOperation();
415
-
416
- const text = await this.recognizePage(pageIndex);
417
- const confidence = await this.getOcrConfidence(pageIndex);
418
- const regions = await this.detectTextRegions(pageIndex);
419
-
420
- return {
421
- pageIndex,
422
- text,
423
- confidence,
424
- regionCount: regions.length,
425
- };
426
- } catch (error) {
427
- this.recordError(error instanceof Error ? error : new Error(String(error)));
428
- throw error;
429
- }
430
- }
431
-
432
- /**
433
- * Batch recognize multiple pages
434
- */
435
- async batchRecognizePages(
436
- startPage: number,
437
- endPage: number
438
- ): Promise<Map<number, string>> {
439
- try {
440
- this.recordOperation();
441
-
442
- const results = new Map<number, string>();
443
-
444
- for (let i = startPage; i <= endPage; i++) {
445
- const text = await this.recognizePage(i);
446
- results.set(i, text);
447
- }
448
-
449
- this.emit('batch-recognized', {
450
- startPage,
451
- endPage,
452
- pageCount: endPage - startPage + 1,
453
- totalCharacters: Array.from(results.values()).reduce((s, t) => s + t.length, 0),
454
- timestamp: Date.now(),
455
- });
456
-
457
- return results;
458
- } catch (error) {
459
- this.recordError(error instanceof Error ? error : new Error(String(error)));
460
- throw error;
461
- }
462
- }
463
-
464
- /**
465
- * Extract OCR text with aggregated statistics from page range (FFI-wired)
466
- */
467
- async extractPageRange(
468
- startPage: number,
469
- endPage: number,
470
- skipNonScanned: boolean = true
471
- ): Promise<OcrBatchResult> {
472
- try {
473
- this.recordOperation();
474
-
475
- if (!this.ocrEngine) {
476
- throw new Error('OCR engine not initialized');
477
- }
478
-
479
- let totalSpans = 0;
480
- let confidenceSum = 0;
481
- let skippedPages = 0;
482
-
483
- for (let pageIdx = startPage; pageIdx <= endPage; pageIdx++) {
484
- try {
485
- if (skipNonScanned) {
486
- const needsOcr = await this.pageNeedsOcr(pageIdx);
487
- if (!needsOcr) {
488
- skippedPages++;
489
- continue;
490
- }
491
- }
492
-
493
- const text = await this.recognizePage(pageIdx);
494
- const confidence = await this.getOcrConfidence(pageIdx);
495
- const regions = await this.detectTextRegions(pageIdx);
496
- totalSpans += Math.max(regions.length, text ? 1 : 0);
497
- confidenceSum += confidence;
498
- } catch {
499
- continue;
500
- }
501
- }
502
-
503
- const processedPages = endPage - startPage + 1 - skippedPages;
504
- const avgConfidence = processedPages > 0 ? confidenceSum / processedPages : 0;
505
-
506
- const result: OcrBatchResult = {
507
- startPage,
508
- endPage,
509
- totalPages: endPage - startPage + 1,
510
- totalSpans,
511
- averageConfidence: avgConfidence,
512
- skippedPages,
513
- };
514
-
515
- this.emit('page-range-extracted', {
516
- ...result,
517
- timestamp: Date.now(),
518
- });
519
-
520
- this.setCached(`ocr-batch:${startPage}-${endPage}`, result);
521
-
522
- return result;
523
- } catch (error) {
524
- this.recordError(error instanceof Error ? error : new Error(String(error)));
525
- throw error;
526
- }
527
- }
528
-
529
- // ==========================================================================
530
- // Engine Status & Configuration (from typed version)
531
- // ==========================================================================
532
-
533
- /**
534
- * Get OCR engine status and configuration
535
- */
536
- async getEngineStatus(): Promise<string> {
537
- try {
538
- this.recordOperation();
539
-
540
- if (!this.ocrEngine) {
541
- return 'not_initialized';
542
- }
543
-
544
- return (await (this.document as any)?.getEngineStatus(this.ocrEngine)) || 'unknown';
545
- } catch (error) {
546
- this.recordError(error instanceof Error ? error : new Error(String(error)));
547
- throw error;
548
- }
549
- }
550
-
551
- /**
552
- * Get current OCR configuration
553
- */
554
- getConfiguration(): {
555
- language: OcrLanguage;
556
- preprocessingType: string;
557
- engineInitialized: boolean;
558
- } {
559
- return {
560
- language: this.currentLanguage,
561
- preprocessingType: this.preprocessingType,
562
- engineInitialized: !!this.ocrEngine,
563
- };
564
- }
565
-
566
- // ==========================================================================
567
- // Methods from root-level OCRManager
568
- // ==========================================================================
569
-
570
- /**
571
- * Extracts text from a page (convenience alias for recognizePage)
572
- * From root-level OCRManager
573
- */
574
- async extractText(pageIndex: number, config?: OcrConfig): Promise<string> {
575
- const cacheKey = `ocr:text:${pageIndex}:${this.currentLanguage}`;
576
- const cached = this.getCached<string>(cacheKey);
577
- if (cached !== undefined) {
578
- return cached;
579
- }
580
-
581
- let result = '';
582
- if ((this.document as any)?.extractText) {
583
- result = (this.document as any).extractText(pageIndex) || '';
584
- }
585
- this.setCached(cacheKey, result);
586
- this.emit('textExtracted', pageIndex, result.length);
587
- return result;
588
- }
589
-
590
- /**
591
- * Analyzes a page and returns detailed results
592
- * From root-level OCRManager
593
- */
594
- async analyzePage(pageIndex: number, config?: OcrConfig): Promise<OcrPageAnalysis> {
595
- const cacheKey = `ocr:analysis:${pageIndex}:${this.currentLanguage}`;
596
- const cached = this.getCached<OcrPageAnalysis>(cacheKey);
597
- if (cached !== undefined) {
598
- return cached;
599
- }
600
-
601
- let text = '';
602
- let needsOcr = false;
603
-
604
- if ((this.document as any)?.extractText) {
605
- text = (this.document as any).extractText(pageIndex) || '';
606
- needsOcr = !text || text.trim().length < 10;
607
- }
608
-
609
- const result: OcrPageAnalysis = {
610
- pageIndex,
611
- needsOcr,
612
- confidence: needsOcr ? 0.0 : 0.95,
613
- spanCount: text.split(' ').length || 0,
614
- text,
615
- };
616
- this.setCached(cacheKey, result);
617
- this.emit('pageAnalyzed', pageIndex, result);
618
- return result;
619
- }
620
-
621
- /**
622
- * Performs OCR analysis on all pages in the document
623
- * From root-level OCRManager
624
- */
625
- async analyzeDocument(config?: OcrConfig): Promise<OcrPageAnalysis[]> {
626
- const cacheKey = `ocr:document:${this.currentLanguage}`;
627
- const cached = this.getCached<OcrPageAnalysis[]>(cacheKey);
628
- if (cached !== undefined) {
629
- return cached;
630
- }
631
-
632
- const results: OcrPageAnalysis[] = [];
633
- const pageCount = (this.document as any)?.pageCount || 0;
634
-
635
- for (let i = 0; i < pageCount; i++) {
636
- const analysis = await this.analyzePage(i, config);
637
- results.push(analysis);
638
- this.emit('pageProcessed', i + 1, pageCount);
639
- }
640
-
641
- this.setCached(cacheKey, results);
642
- this.emit('documentAnalyzed', results.length);
643
- return results;
644
- }
645
-
646
- /**
647
- * Extracts text spans with bounding boxes for a page
648
- * From root-level OCRManager
649
- */
650
- async extractSpans(pageIndex: number, config?: OcrConfig): Promise<OcrSpan[]> {
651
- const cacheKey = `ocr:spans:${pageIndex}:${this.currentLanguage}`;
652
- const cached = this.getCached<OcrSpan[]>(cacheKey);
653
- if (cached !== undefined) {
654
- return cached;
655
- }
656
-
657
- let spans: OcrSpan[] = [];
658
- if (this.native?.extract_spans) {
659
- try {
660
- const spansJson = this.native.extract_spans(pageIndex) ?? [];
661
- spans = spansJson.length > 0 ? spansJson.map((json: string) => JSON.parse(json)) : [];
662
- } catch {
663
- spans = [];
664
- }
665
- }
666
-
667
- this.setCached(cacheKey, spans);
668
- this.emit('spansExtracted', { page: pageIndex, count: spans.length });
669
- return spans;
670
- }
671
-
672
- /**
673
- * Checks if OCR is available/installed
674
- * From root-level OCRManager
675
- */
676
- async isAvailable(): Promise<boolean> {
677
- const cacheKey = 'ocr:available';
678
- const cached = this.getCached<boolean>(cacheKey);
679
- if (cached !== undefined) {
680
- return cached;
681
- }
682
-
683
- const result = this.native ? true : false;
684
- this.setCached(cacheKey, result);
685
- return result;
686
- }
687
-
688
- /**
689
- * Gets OCR engine version
690
- * From root-level OCRManager
691
- */
692
- async getVersion(): Promise<string> {
693
- const cacheKey = 'ocr:version';
694
- const cached = this.getCached<string>(cacheKey);
695
- if (cached !== undefined) {
696
- return cached;
697
- }
698
-
699
- let version = '0.0.0';
700
- if (this.native?.get_ocr_version) {
701
- try {
702
- version = this.native.get_ocr_version() ?? '0.0.0';
703
- } catch {
704
- version = '0.0.0';
705
- }
706
- }
707
-
708
- this.setCached(cacheKey, version);
709
- return version;
710
- }
711
-
712
- // ==========================================================================
713
- // Cache Operations (from root-level OCRManager)
714
- // ==========================================================================
715
-
716
- /**
717
- * Clears the result cache
718
- */
719
- clearCache(): void {
720
- this.invalidateCache();
721
- this.emit('cacheCleared');
722
- }
723
-
724
- /**
725
- * Gets cache statistics
726
- */
727
- getCacheStats(): Record<string, any> {
728
- return {
729
- cacheSize: this.cache.size,
730
- entries: Array.from(this.cache.keys()),
731
- };
732
- }
733
-
734
- // ==========================================================================
735
- // Cleanup
736
- // ==========================================================================
737
-
738
- /**
739
- * Cleanup on destroy
740
- */
741
- async destroy(): Promise<void> {
742
- try {
743
- await this.destroyOcrEngine();
744
- this.invalidateCache();
745
- this.removeAllListeners();
746
- this.initialized = false;
747
- } catch (error) {
748
- console.error('Error during OCR manager cleanup:', error);
749
- }
750
- }
751
- }
752
-
753
- /** @deprecated Use OcrManager instead */
754
- export const OCRManager = OcrManager;
755
-
756
- export default OcrManager;