convertit 1.0.5 → 2.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +221 -6
- package/dist/analysis/index.d.ts +38 -0
- package/dist/analysis/index.d.ts.map +1 -0
- package/dist/batch/index.d.ts +116 -0
- package/dist/batch/index.d.ts.map +1 -0
- package/dist/converters/excel-styles.d.ts.map +1 -1
- package/dist/converters/index.d.ts +10 -6
- package/dist/converters/index.d.ts.map +1 -1
- package/dist/converters/pdf.d.ts.map +1 -1
- package/dist/core/converter.d.ts +54 -2
- package/dist/core/converter.d.ts.map +1 -1
- package/dist/core/errors.d.ts +5 -0
- package/dist/core/errors.d.ts.map +1 -1
- package/dist/core/types.d.ts +1201 -1
- package/dist/core/types.d.ts.map +1 -1
- package/dist/extractors/base.d.ts +151 -0
- package/dist/extractors/base.d.ts.map +1 -0
- package/dist/extractors/csv.d.ts +89 -0
- package/dist/extractors/csv.d.ts.map +1 -0
- package/dist/extractors/excel.d.ts +102 -0
- package/dist/extractors/excel.d.ts.map +1 -0
- package/dist/extractors/image.d.ts +94 -0
- package/dist/extractors/image.d.ts.map +1 -0
- package/dist/extractors/index.d.ts +16 -0
- package/dist/extractors/index.d.ts.map +1 -0
- package/dist/extractors/pdf.d.ts +89 -0
- package/dist/extractors/pdf.d.ts.map +1 -0
- package/dist/extractors/word.d.ts +83 -0
- package/dist/extractors/word.d.ts.map +1 -0
- package/dist/index.d.ts +8 -2
- package/dist/index.d.ts.map +1 -1
- package/dist/index.js +84776 -80182
- package/dist/search/index.d.ts +105 -0
- package/dist/search/index.d.ts.map +1 -0
- package/dist/streaming/index.d.ts +94 -0
- package/dist/streaming/index.d.ts.map +1 -0
- package/dist/utils/helpers.d.ts.map +1 -1
- package/package.json +41 -3
package/README.md
CHANGED
|
@@ -18,8 +18,12 @@
|
|
|
18
18
|
<a href="#features">Features</a> •
|
|
19
19
|
<a href="#installation">Installation</a> •
|
|
20
20
|
<a href="#quick-start">Quick Start</a> •
|
|
21
|
-
<a href="#
|
|
22
|
-
<a href="#
|
|
21
|
+
<a href="#extraction">Extraction</a> •
|
|
22
|
+
<a href="#analysis">Analysis</a> •
|
|
23
|
+
<a href="#search">Search</a> •
|
|
24
|
+
<a href="#batch-processing">Batch</a> •
|
|
25
|
+
<a href="#streaming">Streaming</a> •
|
|
26
|
+
<a href="#excel-styling">Excel</a> •
|
|
23
27
|
<a href="#examples">Examples</a>
|
|
24
28
|
</p>
|
|
25
29
|
|
|
@@ -27,16 +31,46 @@
|
|
|
27
31
|
|
|
28
32
|
## Features
|
|
29
33
|
|
|
34
|
+
### File Conversion
|
|
35
|
+
|
|
30
36
|
- **Multiple Format Support**: PDF, Word (DOCX), Excel (XLSX), CSV, HTML, JSON, XML, Markdown, and various image formats
|
|
31
37
|
- **Simple API**: Convert files with just one line of code
|
|
32
38
|
- **Builder Pattern**: Fluent API for complex conversions
|
|
33
39
|
- **Excel Conditional Formatting**: Row colors, cell styles, data bars, color scales
|
|
40
|
+
|
|
41
|
+
### Extraction & Content Analysis
|
|
42
|
+
|
|
43
|
+
- **Extract Content**: Extract text, images, tables, links, annotations from PDFs, Word, Excel
|
|
44
|
+
- **Document Analysis**: Analyze structure, content, style, security, accessibility, and quality
|
|
45
|
+
- **Entity Recognition**: Extract emails, URLs, phone numbers, dates, amounts from documents
|
|
46
|
+
- **Sentiment Analysis**: Detect sentiment and language from text content
|
|
47
|
+
- **Metadata Extraction**: Pull EXIF, IPTC, XMP data from images
|
|
48
|
+
- **Table Extraction**: Extract and structure table data from documents
|
|
49
|
+
|
|
50
|
+
### Search & Indexing
|
|
51
|
+
|
|
52
|
+
- **Full-Text Search**: Search across multiple documents with ranking
|
|
53
|
+
- **Advanced Queries**: Boolean operators, fuzzy matching, regex support, phrase search
|
|
54
|
+
- **Document Indexing**: Build inverted indexes for fast searching
|
|
55
|
+
- **Relevance Scoring**: TF-IDF based ranking with context snippets
|
|
56
|
+
- **Search Suggestions**: Fuzzy matching for typo tolerance
|
|
57
|
+
|
|
58
|
+
### Batch & Streaming
|
|
59
|
+
|
|
60
|
+
- **Batch Processing**: Process multiple files with configurable concurrency
|
|
61
|
+
- **Stream Processing**: Memory-efficient chunked processing for large files
|
|
62
|
+
- **Progress Tracking**: Real-time progress callbacks and statistics
|
|
63
|
+
- **Retry Logic**: Automatic retries with exponential backoff
|
|
64
|
+
- **Error Handling**: Comprehensive error handling with recovery options
|
|
65
|
+
|
|
66
|
+
### Advanced Features
|
|
67
|
+
|
|
34
68
|
- **Template Engine**: Built-in template processing for document generation
|
|
35
|
-
- **Transformers**:
|
|
69
|
+
- **Transformers**: Compression, watermarks, merging, splitting, rotation
|
|
70
|
+
- **Document Comparison**: Compare versions, track changes, similarity scoring
|
|
71
|
+
- **Excel Conditional Formatting**: Row colors, cell styles, data bars, color scales
|
|
36
72
|
- **Type-Safe**: Full TypeScript support with comprehensive type definitions
|
|
37
|
-
- **Extensible**: Plugin system for custom converters
|
|
38
|
-
- **Batch Processing**: Convert multiple files efficiently
|
|
39
|
-
- **Progress Tracking**: Monitor conversion progress with callbacks
|
|
73
|
+
- **Extensible**: Plugin system for custom converters and processors
|
|
40
74
|
|
|
41
75
|
## Installation
|
|
42
76
|
|
|
@@ -85,6 +119,187 @@ const buffer = await convertit
|
|
|
85
119
|
.toBuffer();
|
|
86
120
|
```
|
|
87
121
|
|
|
122
|
+
## Extraction
|
|
123
|
+
|
|
124
|
+
Extract content from documents without converting them:
|
|
125
|
+
|
|
126
|
+
```typescript
|
|
127
|
+
import { Convertit } from 'convertit';
|
|
128
|
+
|
|
129
|
+
// Extract text from PDF
|
|
130
|
+
const result = await Convertit.extract(pdfFile, 'pdf', {
|
|
131
|
+
extractText: true,
|
|
132
|
+
extractImages: true,
|
|
133
|
+
extractTables: true,
|
|
134
|
+
extractLinks: true,
|
|
135
|
+
});
|
|
136
|
+
|
|
137
|
+
console.log(result.data.text?.content);
|
|
138
|
+
console.log(result.data.images?.length);
|
|
139
|
+
console.log(result.data.tables);
|
|
140
|
+
```
|
|
141
|
+
|
|
142
|
+
### Supported Extractions
|
|
143
|
+
|
|
144
|
+
- **Text**: Full text with formatting and positioning
|
|
145
|
+
- **Images**: Images with metadata, EXIF data, and dimensions
|
|
146
|
+
- **Tables**: Structured table data with headers and rows
|
|
147
|
+
- **Links**: Hyperlinks with destinations and text
|
|
148
|
+
- **Annotations**: Comments, highlights, notes
|
|
149
|
+
- **Metadata**: Document properties, creation date, author
|
|
150
|
+
- **Styles**: Font information, colors, formatting
|
|
151
|
+
|
|
152
|
+
## Analysis
|
|
153
|
+
|
|
154
|
+
Analyze document structure, content, and quality:
|
|
155
|
+
|
|
156
|
+
```typescript
|
|
157
|
+
import { Convertit } from 'convertit';
|
|
158
|
+
|
|
159
|
+
// Analyze document
|
|
160
|
+
const analysis = await Convertit.analyze(wordFile, 'word', {
|
|
161
|
+
analyzeStructure: true,
|
|
162
|
+
analyzeContent: true,
|
|
163
|
+
analyzeStyle: true,
|
|
164
|
+
generateSummary: true,
|
|
165
|
+
extractKeywords: true,
|
|
166
|
+
detectSentiment: true,
|
|
167
|
+
});
|
|
168
|
+
|
|
169
|
+
console.log(analysis.structure); // Sections, chapters, headings
|
|
170
|
+
console.log(analysis.content); // Text stats, keywords, entities
|
|
171
|
+
console.log(analysis.summary); // Abstract, key points, reading time
|
|
172
|
+
```
|
|
173
|
+
|
|
174
|
+
### Analysis Capabilities
|
|
175
|
+
|
|
176
|
+
- **Structure**: Sections, chapters, headings, page breaks
|
|
177
|
+
- **Content**: Text statistics, keyword extraction, entity recognition
|
|
178
|
+
- **Style**: Font usage, colors, formatting consistency
|
|
179
|
+
- **Security**: Encryption, permissions, macros, external links
|
|
180
|
+
- **Accessibility**: WCAG compliance, alt text, reading order
|
|
181
|
+
- **Quality**: Image quality, readability, formatting issues
|
|
182
|
+
- **Comparison**: Compare versions and track changes
|
|
183
|
+
|
|
184
|
+
## Search
|
|
185
|
+
|
|
186
|
+
Search across multiple documents:
|
|
187
|
+
|
|
188
|
+
```typescript
|
|
189
|
+
import { Convertit } from 'convertit';
|
|
190
|
+
|
|
191
|
+
// Create search engine
|
|
192
|
+
const searchEngine = await Convertit.createSearchEngine();
|
|
193
|
+
|
|
194
|
+
// Index documents
|
|
195
|
+
await searchEngine.index(
|
|
196
|
+
document1,
|
|
197
|
+
'pdf',
|
|
198
|
+
{ name: 'doc1.pdf' }
|
|
199
|
+
);
|
|
200
|
+
await searchEngine.index(
|
|
201
|
+
document2,
|
|
202
|
+
'pdf',
|
|
203
|
+
{ name: 'doc2.pdf' }
|
|
204
|
+
);
|
|
205
|
+
|
|
206
|
+
// Search with advanced options
|
|
207
|
+
const results = await searchEngine.search('keyword', {
|
|
208
|
+
fuzzyMatch: true,
|
|
209
|
+
maxResults: 50,
|
|
210
|
+
includeContext: true,
|
|
211
|
+
highlightMatches: true,
|
|
212
|
+
});
|
|
213
|
+
|
|
214
|
+
results.hits.forEach(hit => {
|
|
215
|
+
console.log(`${hit.documentName}: ${hit.highlightedSnippet}`);
|
|
216
|
+
});
|
|
217
|
+
```
|
|
218
|
+
|
|
219
|
+
### Search Features
|
|
220
|
+
|
|
221
|
+
- **Full-Text Search**: Index and search across documents
|
|
222
|
+
- **Fuzzy Matching**: Typo-tolerant search with configurable threshold
|
|
223
|
+
- **Boolean Queries**: Support for +required and -excluded terms
|
|
224
|
+
- **Phrase Search**: Find exact phrases with "quoted text"
|
|
225
|
+
- **Regular Expressions**: Use /regex/ patterns in queries
|
|
226
|
+
- **Context Snippets**: Get surrounding text for matches
|
|
227
|
+
- **Highlighting**: HTML-highlighted results
|
|
228
|
+
- **Ranking**: TF-IDF based relevance scoring
|
|
229
|
+
|
|
230
|
+
## Batch Processing
|
|
231
|
+
|
|
232
|
+
Process multiple files with concurrency control:
|
|
233
|
+
|
|
234
|
+
```typescript
|
|
235
|
+
import { Convertit } from 'convertit';
|
|
236
|
+
|
|
237
|
+
// Extract from multiple files in parallel
|
|
238
|
+
const { results, errors } = await Convertit.batchExtract(
|
|
239
|
+
[
|
|
240
|
+
{ data: pdf1, format: 'pdf' },
|
|
241
|
+
{ data: pdf2, format: 'pdf' },
|
|
242
|
+
{ data: word1, format: 'word' },
|
|
243
|
+
],
|
|
244
|
+
{
|
|
245
|
+
concurrency: 3,
|
|
246
|
+
retryAttempts: 2,
|
|
247
|
+
timeout: 30000,
|
|
248
|
+
}
|
|
249
|
+
);
|
|
250
|
+
|
|
251
|
+
console.log(`Processed: ${results.length}, Failed: ${errors.length}`);
|
|
252
|
+
```
|
|
253
|
+
|
|
254
|
+
### Batch Features
|
|
255
|
+
|
|
256
|
+
- **Concurrent Processing**: Configurable concurrency limits
|
|
257
|
+
- **Retry Logic**: Automatic retries with exponential backoff
|
|
258
|
+
- **Progress Tracking**: Real-time progress callbacks
|
|
259
|
+
- **Error Handling**: Graceful error handling with detailed error info
|
|
260
|
+
- **Timeout Support**: Per-item timeout configuration
|
|
261
|
+
- **Job Management**: Pause, resume, and cancel operations
|
|
262
|
+
|
|
263
|
+
## Streaming
|
|
264
|
+
|
|
265
|
+
Memory-efficient processing of large files:
|
|
266
|
+
|
|
267
|
+
```typescript
|
|
268
|
+
import { Convertit } from 'convertit';
|
|
269
|
+
|
|
270
|
+
// Create stream processor
|
|
271
|
+
const processor = await Convertit.createStreamProcessor({
|
|
272
|
+
chunkSize: 64 * 1024, // 64KB chunks
|
|
273
|
+
emitProgress: true,
|
|
274
|
+
progressInterval: 100,
|
|
275
|
+
});
|
|
276
|
+
|
|
277
|
+
// Handle streamed data
|
|
278
|
+
processor.onData(chunk => {
|
|
279
|
+
console.log(`Received chunk: ${chunk.size} bytes`);
|
|
280
|
+
});
|
|
281
|
+
|
|
282
|
+
processor.onProgress(progress => {
|
|
283
|
+
console.log(`Progress: ${progress.percentage}% (${progress.rate} bytes/sec)`);
|
|
284
|
+
});
|
|
285
|
+
|
|
286
|
+
processor.onEnd(() => {
|
|
287
|
+
console.log('Streaming complete');
|
|
288
|
+
});
|
|
289
|
+
|
|
290
|
+
// Process large file
|
|
291
|
+
await processor.process(largeFile, 'pdf');
|
|
292
|
+
```
|
|
293
|
+
|
|
294
|
+
### Streaming Features
|
|
295
|
+
|
|
296
|
+
- **Chunked Processing**: Process large files in configurable chunks
|
|
297
|
+
- **Backpressure Handling**: Automatic flow control
|
|
298
|
+
- **Progress Events**: Real-time progress reporting
|
|
299
|
+
- **Memory Efficient**: Constant memory usage regardless of file size
|
|
300
|
+
- **Pipeline Builder**: Chain transformations in a pipeline
|
|
301
|
+
- **Pause/Resume**: Control stream processing flow
|
|
302
|
+
|
|
88
303
|
## Excel Styling
|
|
89
304
|
|
|
90
305
|
### Conditional Row Formatting
|
|
@@ -0,0 +1,38 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Document Analysis Module
|
|
3
|
+
* Comprehensive document analysis, comparison, and intelligence
|
|
4
|
+
*/
|
|
5
|
+
import type { FileFormat, InputDataType, AnalysisOptions, AnalysisResult, ComparisonOptions, ComparisonResult } from '../core/types.js';
|
|
6
|
+
export declare class DocumentAnalyzer {
|
|
7
|
+
private registry;
|
|
8
|
+
constructor();
|
|
9
|
+
analyze(data: InputDataType, format: FileFormat, options?: AnalysisOptions): Promise<AnalysisResult>;
|
|
10
|
+
private analyzeStructure;
|
|
11
|
+
private analyzeContent;
|
|
12
|
+
private calculateTextStats;
|
|
13
|
+
private extractKeywords;
|
|
14
|
+
private extractEntities;
|
|
15
|
+
private detectLanguage;
|
|
16
|
+
private detectSentiment;
|
|
17
|
+
private analyzeStyle;
|
|
18
|
+
private analyzeConsistency;
|
|
19
|
+
private analyzeSecurity;
|
|
20
|
+
private analyzeAccessibility;
|
|
21
|
+
private analyzeQuality;
|
|
22
|
+
private generateSummary;
|
|
23
|
+
}
|
|
24
|
+
export declare class DocumentComparator {
|
|
25
|
+
compare(source: {
|
|
26
|
+
data: InputDataType;
|
|
27
|
+
format: FileFormat;
|
|
28
|
+
}, target: {
|
|
29
|
+
data: InputDataType;
|
|
30
|
+
format: FileFormat;
|
|
31
|
+
}, options?: ComparisonOptions): Promise<ComparisonResult>;
|
|
32
|
+
private compareText;
|
|
33
|
+
private compareTables;
|
|
34
|
+
private compareMetadata;
|
|
35
|
+
private calculateSimilarity;
|
|
36
|
+
}
|
|
37
|
+
export { DocumentAnalyzer as default };
|
|
38
|
+
//# sourceMappingURL=index.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../src/analysis/index.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAEH,OAAO,KAAK,EACV,UAAU,EACV,aAAa,EACb,eAAe,EACf,cAAc,EACd,iBAAiB,EACjB,gBAAgB,EAwBjB,MAAM,kBAAkB,CAAC;AAqB1B,qBAAa,gBAAgB;IAC3B,OAAO,CAAC,QAAQ,CAAoB;;IAM9B,OAAO,CACX,IAAI,EAAE,aAAa,EACnB,MAAM,EAAE,UAAU,EAClB,OAAO,GAAE,eAAoB,GAC5B,OAAO,CAAC,cAAc,CAAC;IAuD1B,OAAO,CAAC,gBAAgB;IA+CxB,OAAO,CAAC,cAAc;IAgCtB,OAAO,CAAC,kBAAkB;IA8B1B,OAAO,CAAC,eAAe;IAIvB,OAAO,CAAC,eAAe;IA4EvB,OAAO,CAAC,cAAc;IAsFtB,OAAO,CAAC,eAAe;IA4FvB,OAAO,CAAC,YAAY;IA0CpB,OAAO,CAAC,kBAAkB;IA+B1B,OAAO,CAAC,eAAe;IAgDvB,OAAO,CAAC,oBAAoB;IA6E5B,OAAO,CAAC,cAAc;IA4FtB,OAAO,CAAC,eAAe;CA4BxB;AAED,qBAAa,kBAAkB;IACvB,OAAO,CACX,MAAM,EAAE;QAAE,IAAI,EAAE,aAAa,CAAC;QAAC,MAAM,EAAE,UAAU,CAAA;KAAE,EACnD,MAAM,EAAE;QAAE,IAAI,EAAE,aAAa,CAAC;QAAC,MAAM,EAAE,UAAU,CAAA;KAAE,EACnD,OAAO,GAAE,iBAAsB,GAC9B,OAAO,CAAC,gBAAgB,CAAC;IA0F5B,OAAO,CAAC,WAAW;IA4EnB,OAAO,CAAC,aAAa;IAuBrB,OAAO,CAAC,eAAe;IA8BvB,OAAO,CAAC,mBAAmB;CAiB5B;AAED,OAAO,EAAE,gBAAgB,IAAI,OAAO,EAAE,CAAC"}
|
|
@@ -0,0 +1,116 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Batch Processing Module
|
|
3
|
+
* Queue-based batch processing for large-scale document operations
|
|
4
|
+
*/
|
|
5
|
+
import type { FileFormat, InputDataType, BatchJobConfig, BatchJobResult, BatchJobStatus } from '../core/types.js';
|
|
6
|
+
/**
|
|
7
|
+
* Job item in the batch queue
|
|
8
|
+
*/
|
|
9
|
+
export interface BatchJobItem {
|
|
10
|
+
/** Unique identifier */
|
|
11
|
+
id: string;
|
|
12
|
+
/** Input data */
|
|
13
|
+
data: InputDataType;
|
|
14
|
+
/** Input format */
|
|
15
|
+
inputFormat: FileFormat;
|
|
16
|
+
outputFormat?: FileFormat;
|
|
17
|
+
options?: Record<string, unknown>;
|
|
18
|
+
status: 'pending' | 'processing' | 'completed' | 'failed' | 'cancelled';
|
|
19
|
+
result?: unknown;
|
|
20
|
+
error?: Error;
|
|
21
|
+
startTime?: Date;
|
|
22
|
+
endTime?: Date;
|
|
23
|
+
retryCount: number;
|
|
24
|
+
}
|
|
25
|
+
export interface BatchJob {
|
|
26
|
+
id: string;
|
|
27
|
+
name: string;
|
|
28
|
+
type: 'conversion' | 'extraction' | 'analysis';
|
|
29
|
+
config: BatchJobConfig;
|
|
30
|
+
items: BatchJobItem[];
|
|
31
|
+
status: BatchJobStatus;
|
|
32
|
+
createdAt: Date;
|
|
33
|
+
startedAt?: Date;
|
|
34
|
+
completedAt?: Date;
|
|
35
|
+
onProgress?: (progress: BatchJobProgress) => void;
|
|
36
|
+
onItemComplete?: (item: BatchJobItem) => void;
|
|
37
|
+
onError?: (error: Error, item: BatchJobItem) => void;
|
|
38
|
+
}
|
|
39
|
+
export interface BatchJobProgress {
|
|
40
|
+
jobId: string;
|
|
41
|
+
total: number;
|
|
42
|
+
completed: number;
|
|
43
|
+
failed: number;
|
|
44
|
+
percentage: number;
|
|
45
|
+
estimatedTimeRemaining?: number;
|
|
46
|
+
processingRate?: number;
|
|
47
|
+
}
|
|
48
|
+
export interface BatchProcessorConfig {
|
|
49
|
+
maxConcurrentJobs: number;
|
|
50
|
+
maxConcurrentItems: number;
|
|
51
|
+
defaultTimeout: number;
|
|
52
|
+
maxRetries: number;
|
|
53
|
+
retryDelay: number;
|
|
54
|
+
memoryLimit?: number;
|
|
55
|
+
enableProgress: boolean;
|
|
56
|
+
}
|
|
57
|
+
export declare class BatchProcessor {
|
|
58
|
+
private config;
|
|
59
|
+
private jobs;
|
|
60
|
+
private activeJobs;
|
|
61
|
+
private extractorRegistry;
|
|
62
|
+
private converterRegistry;
|
|
63
|
+
constructor(config?: Partial<BatchProcessorConfig>);
|
|
64
|
+
createJob(name: string, type: BatchJob['type'], config: Partial<BatchJobConfig>): BatchJob;
|
|
65
|
+
addItems(jobId: string, items: Array<{
|
|
66
|
+
data: InputDataType;
|
|
67
|
+
inputFormat: FileFormat;
|
|
68
|
+
outputFormat?: FileFormat;
|
|
69
|
+
options?: Record<string, unknown>;
|
|
70
|
+
}>): BatchJobItem[];
|
|
71
|
+
onProgress(jobId: string, callback: (progress: BatchJobProgress) => void): void;
|
|
72
|
+
onItemComplete(jobId: string, callback: (item: BatchJobItem) => void): void;
|
|
73
|
+
onError(jobId: string, callback: (error: Error, item: BatchJobItem) => void): void;
|
|
74
|
+
startJob(jobId: string): Promise<BatchJobResult>;
|
|
75
|
+
pauseJob(jobId: string): void;
|
|
76
|
+
resumeJob(jobId: string): Promise<BatchJobResult>;
|
|
77
|
+
cancelJob(jobId: string): void;
|
|
78
|
+
getJobStatus(jobId: string): BatchJob | undefined;
|
|
79
|
+
getAllJobs(): BatchJob[];
|
|
80
|
+
deleteJob(jobId: string): boolean;
|
|
81
|
+
private processJob;
|
|
82
|
+
private processItem;
|
|
83
|
+
private extractItem;
|
|
84
|
+
private convertItem;
|
|
85
|
+
private analyzeItem;
|
|
86
|
+
}
|
|
87
|
+
export declare class BatchJobBuilder {
|
|
88
|
+
private processor;
|
|
89
|
+
private name;
|
|
90
|
+
private type;
|
|
91
|
+
private config;
|
|
92
|
+
private items;
|
|
93
|
+
constructor(processor: BatchProcessor);
|
|
94
|
+
setName(name: string): this;
|
|
95
|
+
forExtraction(): this;
|
|
96
|
+
forConversion(): this;
|
|
97
|
+
forAnalysis(): this;
|
|
98
|
+
withConcurrency(concurrency: number): this;
|
|
99
|
+
withTimeout(timeout: number): this;
|
|
100
|
+
withRetries(attempts: number): this;
|
|
101
|
+
continueOnError(value?: boolean): this;
|
|
102
|
+
withDefaultOptions(options: Record<string, unknown>): this;
|
|
103
|
+
outputTo(directory: string): this;
|
|
104
|
+
addItem(data: InputDataType, inputFormat: FileFormat, outputFormat?: FileFormat, options?: Record<string, unknown>): this;
|
|
105
|
+
addItems(items: Array<{
|
|
106
|
+
data: InputDataType;
|
|
107
|
+
inputFormat: FileFormat;
|
|
108
|
+
outputFormat?: FileFormat;
|
|
109
|
+
options?: Record<string, unknown>;
|
|
110
|
+
}>): this;
|
|
111
|
+
build(): BatchJob;
|
|
112
|
+
buildAndStart(): Promise<BatchJobResult>;
|
|
113
|
+
reset(): this;
|
|
114
|
+
}
|
|
115
|
+
export { BatchProcessor as default };
|
|
116
|
+
//# sourceMappingURL=index.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../src/batch/index.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAEH,OAAO,KAAK,EACV,UAAU,EACV,aAAa,EACb,cAAc,EACd,cAAc,EACd,cAAc,EAGf,MAAM,kBAAkB,CAAC;AAK1B;;GAEG;AACH,MAAM,WAAW,YAAY;IAC3B,wBAAwB;IACxB,EAAE,EAAE,MAAM,CAAC;IACX,iBAAiB;IACjB,IAAI,EAAE,aAAa,CAAC;IACpB,mBAAmB;IACnB,WAAW,EAAE,UAAU,CAAC;IACxB,YAAY,CAAC,EAAE,UAAU,CAAC;IAC1B,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;IAClC,MAAM,EAAE,SAAS,GAAG,YAAY,GAAG,WAAW,GAAG,QAAQ,GAAG,WAAW,CAAC;IACxE,MAAM,CAAC,EAAE,OAAO,CAAC;IACjB,KAAK,CAAC,EAAE,KAAK,CAAC;IACd,SAAS,CAAC,EAAE,IAAI,CAAC;IACjB,OAAO,CAAC,EAAE,IAAI,CAAC;IACf,UAAU,EAAE,MAAM,CAAC;CACpB;AAED,MAAM,WAAW,QAAQ;IACvB,EAAE,EAAE,MAAM,CAAC;IACX,IAAI,EAAE,MAAM,CAAC;IACb,IAAI,EAAE,YAAY,GAAG,YAAY,GAAG,UAAU,CAAC;IAC/C,MAAM,EAAE,cAAc,CAAC;IACvB,KAAK,EAAE,YAAY,EAAE,CAAC;IACtB,MAAM,EAAE,cAAc,CAAC;IACvB,SAAS,EAAE,IAAI,CAAC;IAChB,SAAS,CAAC,EAAE,IAAI,CAAC;IACjB,WAAW,CAAC,EAAE,IAAI,CAAC;IACnB,UAAU,CAAC,EAAE,CAAC,QAAQ,EAAE,gBAAgB,KAAK,IAAI,CAAC;IAClD,cAAc,CAAC,EAAE,CAAC,IAAI,EAAE,YAAY,KAAK,IAAI,CAAC;IAC9C,OAAO,CAAC,EAAE,CAAC,KAAK,EAAE,KAAK,EAAE,IAAI,EAAE,YAAY,KAAK,IAAI,CAAC;CACtD;AAED,MAAM,WAAW,gBAAgB;IAC/B,KAAK,EAAE,MAAM,CAAC;IACd,KAAK,EAAE,MAAM,CAAC;IACd,SAAS,EAAE,MAAM,CAAC;IAClB,MAAM,EAAE,MAAM,CAAC;IACf,UAAU,EAAE,MAAM,CAAC;IACnB,sBAAsB,CAAC,EAAE,MAAM,CAAC;IAChC,cAAc,CAAC,EAAE,MAAM,CAAC;CACzB;AAED,MAAM,WAAW,oBAAoB;IACnC,iBAAiB,EAAE,MAAM,CAAC;IAC1B,kBAAkB,EAAE,MAAM,CAAC;IAC3B,cAAc,EAAE,MAAM,CAAC;IACvB,UAAU,EAAE,MAAM,CAAC;IACnB,UAAU,EAAE,MAAM,CAAC;IACnB,WAAW,CAAC,EAAE,MAAM,CAAC;IACrB,cAAc,EAAE,OAAO,CAAC;CACzB;AAWD,qBAAa,cAAc;IACzB,OAAO,CAAC,MAAM,CAAuB;IACrC,OAAO,CAAC,IAAI,CAAwB;IACpC,OAAO,CAAC,UAAU,CAAc;IAChC,OAAO,CAAC,iBAAiB,CAAoB;IAC7C,OAAO,CAAC,iBAAiB,CAAoB;gBAEjC,MAAM,GAAE,OAAO,CAAC,oBAAoB,CAAM;IAQtD,SAAS,CAAC,IAAI,EAAE,MAAM,EAAE,IAAI,EAAE,QAAQ,CAAC,MAAM,CAAC,EAAE,MAAM,EAAE,OAAO,CAAC,cAAc,CAAC,GAAG,QAAQ;IAqB1F,QAAQ,CACN,KAAK,EAAE,MAAM,EACb,KAAK,EAAE,KAAK,CAAC;QACX,IAAI,EAAE,aAAa,CAAC;QACpB,WAAW,EAAE,UAAU,CAAC;QA
CxB,YAAY,CAAC,EAAE,UAAU,CAAC;QAC1B,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;KACnC,CAAC,GACD,YAAY,EAAE;IAwBjB,UAAU,CAAC,KAAK,EAAE,MAAM,EAAE,QAAQ,EAAE,CAAC,QAAQ,EAAE,gBAAgB,KAAK,IAAI,GAAG,IAAI;IAO/E,cAAc,CAAC,KAAK,EAAE,MAAM,EAAE,QAAQ,EAAE,CAAC,IAAI,EAAE,YAAY,KAAK,IAAI,GAAG,IAAI;IAO3E,OAAO,CAAC,KAAK,EAAE,MAAM,EAAE,QAAQ,EAAE,CAAC,KAAK,EAAE,KAAK,EAAE,IAAI,EAAE,YAAY,KAAK,IAAI,GAAG,IAAI;IAO5E,QAAQ,CAAC,KAAK,EAAE,MAAM,GAAG,OAAO,CAAC,cAAc,CAAC;IA4BtD,QAAQ,CAAC,KAAK,EAAE,MAAM,GAAG,IAAI;IAOvB,SAAS,CAAC,KAAK,EAAE,MAAM,GAAG,OAAO,CAAC,cAAc,CAAC;IAavD,SAAS,CAAC,KAAK,EAAE,MAAM,GAAG,IAAI;IAa9B,YAAY,CAAC,KAAK,EAAE,MAAM,GAAG,QAAQ,GAAG,SAAS;IAIjD,UAAU,IAAI,QAAQ,EAAE;IAIxB,SAAS,CAAC,KAAK,EAAE,MAAM,GAAG,OAAO;YAYnB,UAAU;YA6EV,WAAW;YA2DX,WAAW;YAkBX,WAAW;YAwBX,WAAW;CAgB1B;AAED,qBAAa,eAAe;IAC1B,OAAO,CAAC,SAAS,CAAiB;IAClC,OAAO,CAAC,IAAI,CAAc;IAC1B,OAAO,CAAC,IAAI,CAAkC;IAC9C,OAAO,CAAC,MAAM,CAAsB;IACpC,OAAO,CAAC,KAAK,CAKL;gBAEI,SAAS,EAAE,cAAc;IAIrC,OAAO,CAAC,IAAI,EAAE,MAAM,GAAG,IAAI;IAK3B,aAAa,IAAI,IAAI;IAKrB,aAAa,IAAI,IAAI;IAKrB,WAAW,IAAI,IAAI;IAKnB,eAAe,CAAC,WAAW,EAAE,MAAM,GAAG,IAAI;IAK1C,WAAW,CAAC,OAAO,EAAE,MAAM,GAAG,IAAI;IAKlC,WAAW,CAAC,QAAQ,EAAE,MAAM,GAAG,IAAI;IAKnC,eAAe,CAAC,KAAK,GAAE,OAAc,GAAG,IAAI;IAK5C,kBAAkB,CAAC,OAAO,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI;IAK1D,QAAQ,CAAC,SAAS,EAAE,MAAM,GAAG,IAAI;IAKjC,OAAO,CACL,IAAI,EAAE,aAAa,EACnB,WAAW,EAAE,UAAU,EACvB,YAAY,CAAC,EAAE,UAAU,EACzB,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAChC,IAAI;IAKP,QAAQ,CACN,KAAK,EAAE,KAAK,CAAC;QACX,IAAI,EAAE,aAAa,CAAC;QACpB,WAAW,EAAE,UAAU,CAAC;QACxB,YAAY,CAAC,EAAE,UAAU,CAAC;QAC1B,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;KACnC,CAAC,GACD,IAAI;IAKP,KAAK,IAAI,QAAQ;IAQX,aAAa,IAAI,OAAO,CAAC,cAAc,CAAC;IAK9C,KAAK,IAAI,IAAI;CAOd;AAED,OAAO,EAAE,cAAc,IAAI,OAAO,EAAE,CAAC"}
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"excel-styles.d.ts","sourceRoot":"","sources":["../../src/converters/excel-styles.ts"],"names":[],"mappings":"AAAA;;GAEG;AAEH,OAAO,KAAK,
|
|
1
|
+
{"version":3,"file":"excel-styles.d.ts","sourceRoot":"","sources":["../../src/converters/excel-styles.ts"],"names":[],"mappings":"AAAA;;GAEG;AAEH,OAAO,KAAK,EAAE,SAAS,EAAQ,MAAM,SAAS,CAAC;AAC/C,OAAO,KAAK,EACV,YAAY,EAEZ,YAAY,EAEZ,SAAS,EACT,kBAAkB,EACnB,MAAM,kBAAkB,CAAC;AAE1B,qBAAa,gBAAgB;IAC3B,OAAO,CAAC,SAAS,CAAY;IAC7B,OAAO,CAAC,OAAO,CAAe;IAE9B,OAAO,CAAC,IAAI,CAAQ;gBAGR,SAAS,EAAE,SAAS,EAAE,OAAO,EAAE,YAAY,EAAE,IAAI,EAAE,GAAG,EAAE;IAMpE,cAAc,IAAI,IAAI;IAYtB,OAAO,CAAC,cAAc;IAgBtB,OAAO,CAAC,oBAAoB;IA4B5B,OAAO,CAAC,uBAAuB;IAiB/B,OAAO,CAAC,aAAa;IAsCrB,OAAO,CAAC,eAAe;IAOvB,OAAO,CAAC,eAAe;IAkBvB,OAAO,CAAC,eAAe;IAiCvB,OAAO,CAAC,0BAA0B;IAiBlC,OAAO,CAAC,yBAAyB;IAajC,OAAO,CAAC,2BAA2B;IAenC,OAAO,CAAC,qBAAqB;IAU7B,OAAO,CAAC,cAAc;IAgGtB,OAAO,CAAC,cAAc;IAsBtB,OAAO,CAAC,cAAc;IAQtB,OAAO,CAAC,oBAAoB;IAQ5B,OAAO,CAAC,oBAAoB;CAS7B;AAED,eAAO,MAAM,YAAY;uBAIlB,SAAS;uBAKT,SAAS;sBAKT,SAAS;mBAKT,SAAS;mBAKT,SAAS;iBAMT,SAAS;uBAIT,SAAS;sBAIT,SAAS;mBAKT,SAAS;qBAKT,SAAS;eAKT,SAAS;CACf,CAAC;AAEF,wBAAgB,mBAAmB,CACjC,OAAO,EAAE,KAAK,CAAC;IACb,SAAS,EACL,MAAM,GACN,KAAK,GAEL;QAAE,MAAM,EAAE,MAAM,GAAG,MAAM,CAAC;QAAC,QAAQ,EAAE,kBAAkB,CAAC;QAAC,KAAK,EAAE,GAAG,CAAA;KAAE,CAAC;IAC1E,KAAK,EAAE,SAAS,CAAC;CAClB,CAAC,GACD,YAAY,EAAE,CAkBhB;AAED,eAAe,gBAAgB,CAAC"}
|
|
@@ -1,10 +1,14 @@
|
|
|
1
|
-
|
|
2
|
-
export {
|
|
1
|
+
import { ConverterRegistry } from './base.js';
|
|
2
|
+
export { ConverterRegistry } from './base.js';
|
|
3
|
+
export { PDFConverter } from './pdf.js';
|
|
3
4
|
export { WordConverter } from './word.js';
|
|
4
|
-
export { ExcelConverter
|
|
5
|
-
export {
|
|
6
|
-
export { CSVConverter, CSVUtils } from './csv.js';
|
|
5
|
+
export { ExcelConverter } from './excel.js';
|
|
6
|
+
export { CSVConverter } from './csv.js';
|
|
7
7
|
export { HTMLConverter } from './html.js';
|
|
8
|
-
export { ImageConverter
|
|
8
|
+
export { ImageConverter } from './image.js';
|
|
9
9
|
export { TextConverter, JSONConverter, XMLConverter, MarkdownConverter } from './text.js';
|
|
10
|
+
/**
|
|
11
|
+
* Initialize all converters and register them in the registry
|
|
12
|
+
*/
|
|
13
|
+
export declare function initializeConverters(): ConverterRegistry;
|
|
10
14
|
//# sourceMappingURL=index.d.ts.map
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../src/converters/index.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,
|
|
1
|
+
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../src/converters/index.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,iBAAiB,EAAE,MAAM,WAAW,CAAC;AAU9C,OAAO,EAAE,iBAAiB,EAAE,MAAM,WAAW,CAAC;AAC9C,OAAO,EAAE,YAAY,EAAE,MAAM,UAAU,CAAC;AACxC,OAAO,EAAE,aAAa,EAAE,MAAM,WAAW,CAAC;AAC1C,OAAO,EAAE,cAAc,EAAE,MAAM,YAAY,CAAC;AAC5C,OAAO,EAAE,YAAY,EAAE,MAAM,UAAU,CAAC;AACxC,OAAO,EAAE,aAAa,EAAE,MAAM,WAAW,CAAC;AAC1C,OAAO,EAAE,cAAc,EAAE,MAAM,YAAY,CAAC;AAC5C,OAAO,EAAE,aAAa,EAAE,aAAa,EAAE,YAAY,EAAE,iBAAiB,EAAE,MAAM,WAAW,CAAC;AAE1F;;GAEG;AACH,wBAAgB,oBAAoB,IAAI,iBAAiB,CA2BxD"}
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"pdf.d.ts","sourceRoot":"","sources":["../../src/converters/pdf.ts"],"names":[],"mappings":"AAAA;;GAEG;AAIH,OAAO,EAAE,aAAa,EAAE,MAAM,WAAW,CAAC;AAC1C,OAAO,KAAK,EACV,aAAa,EACb,kBAAkB,EAClB,UAAU,EAKX,MAAM,kBAAkB,CAAC;AAI1B,qBAAa,YAAa,SAAQ,aAAa;;IAK7C,wBAAwB,IAAI,UAAU,EAAE;IAIlC,OAAO,CAAC,IAAI,EAAE,aAAa,EAAE,OAAO,EAAE,kBAAkB,GAAG,OAAO,CAAC,MAAM,CAAC;IA6BhF,OAAO,CAAC,WAAW;YAOL,cAAc;
|
|
1
|
+
{"version":3,"file":"pdf.d.ts","sourceRoot":"","sources":["../../src/converters/pdf.ts"],"names":[],"mappings":"AAAA;;GAEG;AAIH,OAAO,EAAE,aAAa,EAAE,MAAM,WAAW,CAAC;AAC1C,OAAO,KAAK,EACV,aAAa,EACb,kBAAkB,EAClB,UAAU,EAKX,MAAM,kBAAkB,CAAC;AAI1B,qBAAa,YAAa,SAAQ,aAAa;;IAK7C,wBAAwB,IAAI,UAAU,EAAE;IAIlC,OAAO,CAAC,IAAI,EAAE,aAAa,EAAE,OAAO,EAAE,kBAAkB,GAAG,OAAO,CAAC,MAAM,CAAC;IA6BhF,OAAO,CAAC,WAAW;YAOL,cAAc;YAwFd,eAAe;YAoBf,gBAAgB;YAUhB,mBAAmB;YAkDnB,gBAAgB;IAU9B,OAAO,CAAC,SAAS;IAmDjB,OAAO,CAAC,SAAS;IAiBjB,OAAO,CAAC,SAAS;IAiBjB,OAAO,CAAC,cAAc;IAkBtB,OAAO,CAAC,OAAO;CAchB;AAED;;GAEG;AACH,qBAAa,cAAc;IACzB;;OAEG;WACU,KAAK,CAAC,KAAK,EAAE,MAAM,EAAE,GAAG,OAAO,CAAC,MAAM,CAAC;IAmBpD;;OAEG;WACU,KAAK,CAAC,IAAI,EAAE,MAAM,EAAE,KAAK,EAAE,MAAM,EAAE,GAAG,OAAO,CAAC,MAAM,EAAE,CAAC;IA2BpE;;OAEG;WACU,aAAa,CACxB,IAAI,EAAE,MAAM,EACZ,MAAM,EAAE,KAAK,CAAC;QAAE,KAAK,EAAE,MAAM,CAAC;QAAC,GAAG,EAAE,MAAM,CAAA;KAAE,CAAC,GAC5C,OAAO,CAAC,MAAM,EAAE,CAAC;IA+BpB;;OAEG;WACU,gBAAgB,CAC3B,IAAI,EAAE,MAAM,EACZ,IAAI,EAAE,MAAM,EACZ,OAAO,GAAE;QACP,OAAO,CAAC,EAAE,MAAM,CAAC;QACjB,QAAQ,CAAC,EAAE,MAAM,CAAC;QAClB,QAAQ,CAAC,EAAE,MAAM,CAAC;QAClB,KAAK,CAAC,EAAE;YAAE,CAAC,EAAE,MAAM,CAAC;YAAC,CAAC,EAAE,MAAM,CAAC;YAAC,CAAC,EAAE,MAAM,CAAA;SAAE,CAAC;KACxC,GACL,OAAO,CAAC,MAAM,CAAC;IAoClB;;OAEG;WACU,WAAW,CACtB,IAAI,EAAE,MAAM,EACZ,KAAK,EAAE,EAAE,GAAG,GAAG,GAAG,GAAG,EACrB,WAAW,CAAC,EAAE,MAAM,EAAE,GACrB,OAAO,CAAC,MAAM,CAAC;IAsBlB;;OAEG;WACU,YAAY,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC;IAKxD;;OAEG;WACU,YAAY,CAAC,IAAI,EAAE,MAAM,EAAE,WAAW,EAAE,MAAM,EAAE,GAAG,OAAO,CAAC,MAAM,CAAC;CAiBhF;AAED,eAAe,YAAY,CAAC"}
|
package/dist/core/converter.d.ts
CHANGED
|
@@ -1,15 +1,67 @@
|
|
|
1
1
|
/**
|
|
2
2
|
* convertit - Main Converter Class
|
|
3
|
-
* Core API for file conversion
|
|
3
|
+
* Core API for file conversion, extraction, analysis, and batch operations.
|
|
4
4
|
*/
|
|
5
|
-
import type { InputDataType, ConvertFileOptions, ConversionResult, BatchConversionResult, FileFormat, ProgressInfo, PDFOptions, WordOptions, ExcelOptions, CSVOptions, HTMLOptions, ImageOptions, WatermarkConfig, EncryptionConfig, CompressionConfig, PageNumberConfig, HeaderFooterConfig, SplitConfig, TableConfig } from './types.js';
|
|
5
|
+
import type { InputDataType, ConvertFileOptions, ConversionResult, BatchConversionResult, FileFormat, ProgressInfo, PDFOptions, WordOptions, ExcelOptions, CSVOptions, HTMLOptions, ImageOptions, WatermarkConfig, EncryptionConfig, CompressionConfig, PageNumberConfig, HeaderFooterConfig, SplitConfig, TableConfig, ExtractionResult, AnalysisResult, AnalysisOptions, SearchOptions, SearchResult } from './types.js';
|
|
6
6
|
import { BaseConverter } from '../converters/base.js';
|
|
7
7
|
export declare class Convertit {
|
|
8
8
|
private data;
|
|
9
9
|
private options;
|
|
10
10
|
private static registry;
|
|
11
|
+
private static extractorRegistry;
|
|
11
12
|
constructor(data: InputDataType, options: ConvertFileOptions);
|
|
12
13
|
private initializeConverters;
|
|
14
|
+
/**
|
|
15
|
+
* Extract content from a document
|
|
16
|
+
*/
|
|
17
|
+
static extract(data: InputDataType, format: FileFormat, options?: Record<string, unknown>): Promise<ExtractionResult>;
|
|
18
|
+
/**
|
|
19
|
+
* Analyze a document
|
|
20
|
+
*/
|
|
21
|
+
static analyze(data: InputDataType, format: FileFormat, options?: AnalysisOptions): Promise<AnalysisResult>;
|
|
22
|
+
/**
|
|
23
|
+
* Search within documents
|
|
24
|
+
*/
|
|
25
|
+
static search(documents: Array<{
|
|
26
|
+
data: InputDataType;
|
|
27
|
+
format: FileFormat;
|
|
28
|
+
name?: string;
|
|
29
|
+
}>, query: string, options?: Omit<SearchOptions, 'query'>): Promise<SearchResult>;
|
|
30
|
+
/**
|
|
31
|
+
* Create a search engine instance for multiple searches
|
|
32
|
+
*/
|
|
33
|
+
static createSearchEngine(): Promise<{
|
|
34
|
+
index: (data: InputDataType, format: FileFormat, options?: {
|
|
35
|
+
name?: string;
|
|
36
|
+
}) => Promise<void>;
|
|
37
|
+
search: (query: string, options?: Omit<SearchOptions, 'query'>) => SearchResult;
|
|
38
|
+
clear: () => void;
|
|
39
|
+
}>;
|
|
40
|
+
/**
|
|
41
|
+
* Process documents in batch
|
|
42
|
+
*/
|
|
43
|
+
static batchExtract(items: Array<{
|
|
44
|
+
data: InputDataType;
|
|
45
|
+
format: FileFormat;
|
|
46
|
+
options?: Record<string, unknown>;
|
|
47
|
+
}>, config?: {
|
|
48
|
+
concurrency?: number;
|
|
49
|
+
continueOnError?: boolean;
|
|
50
|
+
}): Promise<{
|
|
51
|
+
results: ExtractionResult[];
|
|
52
|
+
errors: Error[];
|
|
53
|
+
}>;
|
|
54
|
+
/**
|
|
55
|
+
* Create a stream processor for large files
|
|
56
|
+
*/
|
|
57
|
+
static createStreamProcessor(options?: {
|
|
58
|
+
chunkSize?: number;
|
|
59
|
+
}): Promise<{
|
|
60
|
+
process: (data: InputDataType, format: FileFormat) => Promise<void>;
|
|
61
|
+
onData: (callback: (chunk: unknown) => void) => void;
|
|
62
|
+
onEnd: (callback: () => void) => void;
|
|
63
|
+
onError: (callback: (error: Error) => void) => void;
|
|
64
|
+
}>;
|
|
13
65
|
convert(): Promise<ConversionResult>;
|
|
14
66
|
private applyTransformers;
|
|
15
67
|
private formatOutput;
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"converter.d.ts","sourceRoot":"","sources":["../../src/core/converter.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAEH,OAAO,KAAK,EACV,aAAa,EACb,kBAAkB,EAClB,gBAAgB,EAChB,qBAAqB,EACrB,UAAU,EACV,YAAY,EACZ,UAAU,EACV,WAAW,EACX,YAAY,EACZ,UAAU,EACV,WAAW,EACX,YAAY,EACZ,eAAe,EACf,gBAAgB,EAChB,iBAAiB,EACjB,gBAAgB,EAChB,kBAAkB,EAClB,WAAW,EACX,WAAW,
|
|
1
|
+
{"version":3,"file":"converter.d.ts","sourceRoot":"","sources":["../../src/core/converter.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAEH,OAAO,KAAK,EACV,aAAa,EACb,kBAAkB,EAClB,gBAAgB,EAChB,qBAAqB,EACrB,UAAU,EACV,YAAY,EACZ,UAAU,EACV,WAAW,EACX,YAAY,EACZ,UAAU,EACV,WAAW,EACX,YAAY,EACZ,eAAe,EACf,gBAAgB,EAChB,iBAAiB,EACjB,gBAAgB,EAChB,kBAAkB,EAClB,WAAW,EACX,WAAW,EACX,gBAAgB,EAChB,cAAc,EACd,eAAe,EACf,aAAa,EACb,YAAY,EACb,MAAM,YAAY,CAAC;AAEpB,OAAO,EAAE,aAAa,EAAqB,MAAM,uBAAuB,CAAC;AAiCzE,qBAAa,SAAS;IACpB,OAAO,CAAC,IAAI,CAAgB;IAC5B,OAAO,CAAC,OAAO,CAAqB;IACpC,OAAO,CAAC,MAAM,CAAC,QAAQ,CAAsD;IAC7E,OAAO,CAAC,MAAM,CAAC,iBAAiB,CAA6C;gBAEjE,IAAI,EAAE,aAAa,EAAE,OAAO,EAAE,kBAAkB;IAM5D,OAAO,CAAC,oBAAoB;IA0B5B;;OAEG;WACU,OAAO,CAClB,IAAI,EAAE,aAAa,EACnB,MAAM,EAAE,UAAU,EAClB,OAAO,GAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAM,GACpC,OAAO,CAAC,gBAAgB,CAAC;IAc5B;;OAEG;WACU,OAAO,CAClB,IAAI,EAAE,aAAa,EACnB,MAAM,EAAE,UAAU,EAClB,OAAO,GAAE,eAAoB,GAC5B,OAAO,CAAC,cAAc,CAAC;IAM1B;;OAEG;WACU,MAAM,CACjB,SAAS,EAAE,KAAK,CAAC;QAAE,IAAI,EAAE,aAAa,CAAC;QAAC,MAAM,EAAE,UAAU,CAAC;QAAC,IAAI,CAAC,EAAE,MAAM,CAAA;KAAE,CAAC,EAC5E,KAAK,EAAE,MAAM,EACb,OAAO,GAAE,IAAI,CAAC,aAAa,EAAE,OAAO,CAAM,GACzC,OAAO,CAAC,YAAY,CAAC;IAYxB;;OAEG;WACU,kBAAkB,IAAI,OAAO,CAAC;QACzC,KAAK,EAAE,CAAC,IAAI,EAAE,aAAa,EAAE,MAAM,EAAE,UAAU,EAAE,OAAO,CAAC,EAAE;YAAE,IAAI,CAAC,EAAE,MAAM,CAAA;SAAE,KAAK,OAAO,CAAC,IAAI,CAAC,CAAC;QAC/F,MAAM,EAAE,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,IAAI,CAAC,aAAa,EAAE,OAAO,CAAC,KAAK,YAAY,CAAC;QAChF,KAAK,EAAE,MAAM,IAAI,CAAC;KACnB,CAAC;IAaF;;OAEG;WACU,YAAY,CACvB,KAAK,EAAE,KAAK,CAAC;QAAE,IAAI,EAAE,aAAa,CAAC;QAAC,MAAM,EAAE,UAAU,CAAC;QAAC,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAA;KAAE,CAAC,EAC5F,MAAM,GAAE;QAAE,WAAW,CAAC,EAAE,MAAM,CAAC;QAAC,eAAe,CAAC,EAAE,OAAO,CAAA;KAAO,GAC/D,OAAO,CAAC;QAAE,OAAO,EAAE,gBAAgB,EAAE,CAAC;QAAC,MAAM,EAAE,KAAK,EAAE,CAAA;KAAE,CAAC;IA8B5D;;OAEG;WACU,qBAAqB,CAAC,OAAO,GAAE;QAAE,SAAS,CAAC,EAAE,MAAM,CAAA;KAAO,GAAG,OAAO,CAAC;QAChF,OAAO,EAAE,CAAC,IAAI,EAAE,aAAa,EAAE,MAAM,EAAE,UAAU,KAAK,OAAO,CAAC,IAAI,CAAC,CAAC;Q
ACpE,MAAM,EAAE,CAAC,QAAQ,EAAE,CAAC,KAAK,EAAE,OAAO,KAAK,IAAI,KAAK,IAAI,CAAC;QACrD,KAAK,EAAE,CAAC,QAAQ,EAAE,MAAM,IAAI,KAAK,IAAI,CAAC;QACtC,OAAO,EAAE,CAAC,QAAQ,EAAE,CAAC,KAAK,EAAE,KAAK,KAAK,IAAI,KAAK,IAAI,CAAC;KACrD,CAAC;IAcI,OAAO,IAAI,OAAO,CAAC,gBAAgB,CAAC;YA6D5B,iBAAiB;YA4BjB,YAAY;IAuCpB,QAAQ,IAAI,OAAO,CAAC,MAAM,CAAC;IAiB3B,QAAQ,IAAI,OAAO,CAAC,MAAM,CAAC;IAK3B,SAAS,IAAI,OAAO,CAAC,MAAM,CAAC;IAO5B,MAAM,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC;IAM3C,MAAM,CAAC,IAAI,CAAC,IAAI,EAAE,aAAa,GAAG,gBAAgB;WAIrC,KAAK,CAChB,KAAK,EAAE,KAAK,CAAC;QAAE,IAAI,EAAE,aAAa,CAAC;QAAC,OAAO,EAAE,kBAAkB,CAAA;KAAE,CAAC,EAClE,WAAW,GAAE,MAAU,GACtB,OAAO,CAAC,qBAAqB,CAAC;WAwCpB,KAAK,CAAC,KAAK,EAAE,KAAK,CAAC,MAAM,GAAG,MAAM,CAAC,EAAE,MAAM,EAAE,UAAU,GAAG,OAAO,CAAC,MAAM,CAAC;WAazE,KAAK,CAAC,IAAI,EAAE,MAAM,EAAE,MAAM,EAAE,UAAU,EAAE,MAAM,EAAE,WAAW,GAAG,OAAO,CAAC,MAAM,EAAE,CAAC;IAI5F,MAAM,CAAC,mBAAmB,IAAI,UAAU,EAAE;IAI1C,MAAM,CAAC,iBAAiB,CAAC,MAAM,EAAE,UAAU,EAAE,SAAS,EAAE,aAAa,GAAG,IAAI;CAG7E;AAED,qBAAa,gBAAgB;IAC3B,OAAO,CAAC,IAAI,CAAgB;IAC5B,OAAO,CAAC,OAAO,CAAmC;gBAEtC,IAAI,EAAE,aAAa;IAI/B,KAAK,CAAC,OAAO,CAAC,EAAE,UAAU,GAAG,IAAI;IAMjC,MAAM,CAAC,OAAO,CAAC,EAAE,WAAW,GAAG,IAAI;IAMnC,OAAO,CAAC,OAAO,CAAC,EAAE,YAAY,GAAG,IAAI;IAMrC,KAAK,CAAC,OAAO,CAAC,EAAE,UAAU,GAAG,IAAI;IAMjC,MAAM,CAAC,OAAO,CAAC,EAAE,WAAW,GAAG,IAAI;IAMnC,OAAO,CAAC,MAAM,GAAE,KAAK,GAAG,KAAK,GAAG,MAAM,GAAG,MAAM,GAAG,KAAa,EAAE,OAAO,CAAC,EAAE,YAAY,GAAG,IAAI;IAM9F,MAAM,IAAI,IAAI;IAKd,MAAM,IAAI,IAAI;IAKd,UAAU,IAAI,IAAI;IAKlB,KAAK,IAAI,IAAI;IAKb,aAAa,CAAC,MAAM,EAAE,eAAe,GAAG,IAAI;IAK5C,cAAc,CAAC,MAAM,EAAE,gBAAgB,GAAG,IAAI;IAK9C,eAAe,CAAC,MAAM,EAAE,iBAAiB,GAAG,IAAI;IAKhD,eAAe,CAAC,MAAM,EAAE,gBAAgB,GAAG,IAAI;IAS/C,UAAU,CAAC,MAAM,EAAE,kBAAkB,GAAG,IAAI;IAW5C,UAAU,CAAC,MAAM,EAAE,kBAAkB,GAAG,IAAI;IAW5C,SAAS,IAAI,IAAI;IAWjB,QAAQ,CAAC,IAAI,EAAE,IAAI,GAAG,IAAI,GAAG,IAAI,GAAG,QAAQ,GAAG,OAAO,GAAG,IAAI;IAW7D,SAAS,CAAC,MAAM,EAAE,WAAW,GAAG,IAAI;IAMpC,UAAU,CAAC,QAAQ,EAAE,CAAC,QAAQ,EAAE,YAAY,KAAK,IAAI,GAAG,IAAI;IAM5D,OAAO,CAAC,QAAQ,EAAE,CAAC,KAAK,EAAE,KAAK,KAAK,IAAI,
GAAG,IAAI;IAM/C,OAAO,CAAC,EAAE,EAAE,MAAM,GAAG,IAAI;IAKzB,OAAO,CAAC,KAAK,EAAE,MAAM,GAAG,IAAI;IAKtB,QAAQ,IAAI,OAAO,CAAC,MAAM,CAAC;IAM3B,QAAQ,IAAI,OAAO,CAAC,MAAM,CAAC;IAM3B,SAAS,IAAI,OAAO,CAAC,MAAM,CAAC;IAM5B,MAAM,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC;IAMrC,OAAO,IAAI,OAAO,CAAC,gBAAgB,CAAC;IAM1C,OAAO,CAAC,UAAU;CAQnB;AAED,eAAe,SAAS,CAAC"}
|
package/dist/core/errors.d.ts
CHANGED
|
@@ -15,6 +15,11 @@ export declare enum ErrorCode {
|
|
|
15
15
|
CONVERSION_FAILED = "CONVERSION_FAILED",
|
|
16
16
|
CONVERSION_TIMEOUT = "CONVERSION_TIMEOUT",
|
|
17
17
|
CONVERSION_CANCELLED = "CONVERSION_CANCELLED",
|
|
18
|
+
EXTRACTION_FAILED = "EXTRACTION_FAILED",
|
|
19
|
+
ANALYSIS_FAILED = "ANALYSIS_FAILED",
|
|
20
|
+
SEARCH_FAILED = "SEARCH_FAILED",
|
|
21
|
+
BATCH_FAILED = "BATCH_FAILED",
|
|
22
|
+
STREAM_FAILED = "STREAM_FAILED",
|
|
18
23
|
MERGE_FAILED = "MERGE_FAILED",
|
|
19
24
|
SPLIT_FAILED = "SPLIT_FAILED",
|
|
20
25
|
COMPRESSION_FAILED = "COMPRESSION_FAILED",
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"errors.d.ts","sourceRoot":"","sources":["../../src/core/errors.ts"],"names":[],"mappings":"AAAA;;GAEG;AAEH,oBAAY,SAAS;IACnB,aAAa,kBAAkB;IAC/B,cAAc,mBAAmB;IACjC,eAAe,oBAAoB;IACnC,kBAAkB,uBAAuB;IACzC,UAAU,eAAe;IAEzB,cAAc,mBAAmB;IACjC,eAAe,oBAAoB;IACnC,gBAAgB,qBAAqB;IACrC,kBAAkB,uBAAuB;IACzC,cAAc,mBAAmB;IAEjC,iBAAiB,sBAAsB;IACvC,kBAAkB,uBAAuB;IACzC,oBAAoB,yBAAyB;IAE7C,YAAY,iBAAiB;IAC7B,YAAY,iBAAiB;IAC7B,kBAAkB,uBAAuB;IACzC,iBAAiB,sBAAsB;IACvC,gBAAgB,qBAAqB;IACrC,UAAU,eAAe;IAEzB,eAAe,oBAAoB;IACnC,kBAAkB,uBAAuB;IACzC,YAAY,iBAAiB;IAC7B,cAAc,mBAAmB;IAEjC,aAAa,kBAAkB;IAC/B,aAAa,kBAAkB;IAC/B,eAAe,oBAAoB;CACpC;AAED,qBAAa,gBAAiB,SAAQ,KAAK;IACzC,SAAgB,IAAI,EAAE,SAAS,CAAC;IAEhC,SAAgB,OAAO,CAAC,EAAE,GAAG,CAAC;IAC9B,SAAgB,WAAW,EAAE,OAAO,CAAC;IACrC,SAAgB,SAAS,EAAE,IAAI,CAAC;IAChC,SAAgB,IAAI,CAAC,EAAE,MAAM,CAAC;gBAG5B,IAAI,EAAE,SAAS,EACf,OAAO,EAAE,MAAM,EACf,OAAO,CAAC,EAAE;QAER,OAAO,CAAC,EAAE,GAAG,CAAC;QACd,WAAW,CAAC,EAAE,OAAO,CAAC;QACtB,IAAI,CAAC,EAAE,MAAM,CAAC;QACd,KAAK,CAAC,EAAE,KAAK,CAAC;KACf;IAiBH,MAAM,IAAI,MAAM;IAahB,MAAM,CAAC,SAAS,CAAC,KAAK,EAAE,KAAK,EAAE,IAAI,GAAE,SAAoC,GAAG,gBAAgB;CAM7F;AAED,qBAAa,eAAgB,SAAQ,gBAAgB;gBAEvC,OAAO,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,GAAG;CAI3C;AAED,qBAAa,WAAY,SAAQ,gBAAgB;gBACnC,MAAM,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,MAAM;CAO7C;AAED,qBAAa,SAAU,SAAQ,gBAAgB;gBACjC,IAAI,EAAE,SAAS,EAAE,QAAQ,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,MAAM;CAOhE;AAED,qBAAa,qBAAsB,SAAQ,gBAAgB;gBAC7C,MAAM,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,MAAM,EAAE,KAAK,CAAC,EAAE,KAAK;CAQ5D;AAED,qBAAa,YAAa,SAAQ,gBAAgB;gBACpC,OAAO,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,MAAM;CAO9C;AAED,wBAAgB,kBAAkB,CAAC,KAAK,EAAE,OAAO,GAAG,KAAK,IAAI,gBAAgB,CAE5E;AAED,wBAAgB,WAAW,CAAC,KAAK,EAAE,OAAO,GAAG,gBAAgB,CAc5D"}
|
|
1
|
+
{"version":3,"file":"errors.d.ts","sourceRoot":"","sources":["../../src/core/errors.ts"],"names":[],"mappings":"AAAA;;GAEG;AAEH,oBAAY,SAAS;IACnB,aAAa,kBAAkB;IAC/B,cAAc,mBAAmB;IACjC,eAAe,oBAAoB;IACnC,kBAAkB,uBAAuB;IACzC,UAAU,eAAe;IAEzB,cAAc,mBAAmB;IACjC,eAAe,oBAAoB;IACnC,gBAAgB,qBAAqB;IACrC,kBAAkB,uBAAuB;IACzC,cAAc,mBAAmB;IAEjC,iBAAiB,sBAAsB;IACvC,kBAAkB,uBAAuB;IACzC,oBAAoB,yBAAyB;IAE7C,iBAAiB,sBAAsB;IACvC,eAAe,oBAAoB;IACnC,aAAa,kBAAkB;IAC/B,YAAY,iBAAiB;IAC7B,aAAa,kBAAkB;IAE/B,YAAY,iBAAiB;IAC7B,YAAY,iBAAiB;IAC7B,kBAAkB,uBAAuB;IACzC,iBAAiB,sBAAsB;IACvC,gBAAgB,qBAAqB;IACrC,UAAU,eAAe;IAEzB,eAAe,oBAAoB;IACnC,kBAAkB,uBAAuB;IACzC,YAAY,iBAAiB;IAC7B,cAAc,mBAAmB;IAEjC,aAAa,kBAAkB;IAC/B,aAAa,kBAAkB;IAC/B,eAAe,oBAAoB;CACpC;AAED,qBAAa,gBAAiB,SAAQ,KAAK;IACzC,SAAgB,IAAI,EAAE,SAAS,CAAC;IAEhC,SAAgB,OAAO,CAAC,EAAE,GAAG,CAAC;IAC9B,SAAgB,WAAW,EAAE,OAAO,CAAC;IACrC,SAAgB,SAAS,EAAE,IAAI,CAAC;IAChC,SAAgB,IAAI,CAAC,EAAE,MAAM,CAAC;gBAG5B,IAAI,EAAE,SAAS,EACf,OAAO,EAAE,MAAM,EACf,OAAO,CAAC,EAAE;QAER,OAAO,CAAC,EAAE,GAAG,CAAC;QACd,WAAW,CAAC,EAAE,OAAO,CAAC;QACtB,IAAI,CAAC,EAAE,MAAM,CAAC;QACd,KAAK,CAAC,EAAE,KAAK,CAAC;KACf;IAiBH,MAAM,IAAI,MAAM;IAahB,MAAM,CAAC,SAAS,CAAC,KAAK,EAAE,KAAK,EAAE,IAAI,GAAE,SAAoC,GAAG,gBAAgB;CAM7F;AAED,qBAAa,eAAgB,SAAQ,gBAAgB;gBAEvC,OAAO,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,GAAG;CAI3C;AAED,qBAAa,WAAY,SAAQ,gBAAgB;gBACnC,MAAM,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,MAAM;CAO7C;AAED,qBAAa,SAAU,SAAQ,gBAAgB;gBACjC,IAAI,EAAE,SAAS,EAAE,QAAQ,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,MAAM;CAOhE;AAED,qBAAa,qBAAsB,SAAQ,gBAAgB;gBAC7C,MAAM,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,MAAM,EAAE,KAAK,CAAC,EAAE,KAAK;CAQ5D;AAED,qBAAa,YAAa,SAAQ,gBAAgB;gBACpC,OAAO,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,MAAM;CAO9C;AAED,wBAAgB,kBAAkB,CAAC,KAAK,EAAE,OAAO,GAAG,KAAK,IAAI,gBAAgB,CAE5E;AAED,wBAAgB,WAAW,CAAC,KAAK,EAAE,OAAO,GAAG,gBAAgB,CAc5D"}
|