@kreuzberg/node 4.0.0-rc.6 → 4.0.0-rc.8
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +45 -14
- package/dist/cli.d.mts +9 -0
- package/dist/cli.d.ts +9 -0
- package/dist/cli.js +78 -0
- package/dist/cli.js.map +1 -0
- package/dist/cli.mjs +43 -0
- package/dist/cli.mjs.map +1 -0
- package/dist/errors.d.mts +358 -0
- package/dist/errors.d.ts +358 -0
- package/dist/errors.js +139 -0
- package/dist/errors.js.map +1 -0
- package/dist/errors.mjs +107 -0
- package/dist/errors.mjs.map +1 -0
- package/dist/index.d.mts +857 -0
- package/dist/index.d.ts +857 -0
- package/dist/index.js +815 -0
- package/dist/index.js.map +1 -0
- package/dist/index.mjs +754 -0
- package/dist/index.mjs.map +1 -0
- package/dist/ocr/guten-ocr.d.mts +193 -0
- package/dist/ocr/guten-ocr.d.ts +193 -0
- package/dist/ocr/guten-ocr.js +232 -0
- package/dist/ocr/guten-ocr.js.map +1 -0
- package/dist/ocr/guten-ocr.mjs +198 -0
- package/dist/ocr/guten-ocr.mjs.map +1 -0
- package/dist/types.d.mts +666 -0
- package/dist/types.d.ts +666 -0
- package/dist/types.js +17 -0
- package/dist/types.js.map +1 -0
- package/dist/types.mjs +1 -0
- package/dist/types.mjs.map +1 -0
- package/index.d.ts +11 -2
- package/index.js +52 -52
- package/package.json +30 -29
- package/LICENSE +0 -7
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../typescript/types.ts"],"sourcesContent":["/**\n * Type definitions for Kreuzberg extraction results.\n *\n * These types mirror the strongly-typed Rust metadata structures,\n * providing type safety for TypeScript users.\n */\n\n// ============================================================================\n// ============================================================================\n\nexport interface TesseractConfig {\n\tpsm?: number;\n\tenableTableDetection?: boolean;\n\ttesseditCharWhitelist?: string;\n}\n\nexport interface OcrConfig {\n\tbackend: string;\n\tlanguage?: string;\n\ttesseractConfig?: TesseractConfig;\n}\n\nexport interface ChunkingConfig {\n\tmaxChars?: number;\n\tmaxOverlap?: number;\n\tchunkSize?: number;\n\tchunkOverlap?: number;\n\tpreset?: string;\n\tembedding?: Record<string, unknown>;\n\tenabled?: boolean;\n}\n\nexport interface LanguageDetectionConfig {\n\tenabled?: boolean;\n\tminConfidence?: number;\n\tdetectMultiple?: boolean;\n}\n\nexport interface TokenReductionConfig {\n\tmode?: string;\n\tpreserveImportantWords?: boolean;\n}\n\nexport interface PdfConfig {\n\textractImages?: boolean;\n\tpasswords?: string[];\n\textractMetadata?: boolean;\n}\n\nexport interface ImageExtractionConfig {\n\textractImages?: boolean;\n\ttargetDpi?: number;\n\tmaxImageDimension?: number;\n\tautoAdjustDpi?: boolean;\n\tminDpi?: number;\n\tmaxDpi?: number;\n}\n\nexport interface PostProcessorConfig {\n\tenabled?: boolean;\n\tenabledProcessors?: string[];\n\tdisabledProcessors?: string[];\n}\n\nexport interface HtmlPreprocessingOptions {\n\tenabled?: boolean;\n\tpreset?: \"minimal\" | \"standard\" | \"aggressive\";\n\tremoveNavigation?: boolean;\n\tremoveForms?: boolean;\n}\n\nexport interface HtmlConversionOptions {\n\theadingStyle?: \"atx\" | \"underlined\" | \"atx_closed\";\n\tlistIndentType?: \"spaces\" | \"tabs\";\n\tlistIndentWidth?: number;\n\tbullets?: string;\n\tstrongEmSymbol?: string;\n\tescapeAsterisks?: boolean;\n\tescapeUnderscores?: boolean;\n\tescapeMisc?: boolean;\n\tescapeAscii?: boolean;\n\tcodeLanguage?: string;\n\tautolinks?: boolean;\n\tdefaultTitle?: boolean;\n\tbrInTables?: boolean;\n\thocrSpatialTables?: boolean;\n\thighlightStyle?: \"double_equal\" | \"html\" | \"bold\" | \"none\";\n\textractMetadata?: boolean;\n\twhitespaceMode?: \"normalized\" | \"strict\";\n\tstripNewlines?: boolean;\n\twrap?: boolean;\n\twrapWidth?: number;\n\tconvertAsInline?: boolean;\n\tsubSymbol?: string;\n\tsupSymbol?: string;\n\tnewlineStyle?: \"spaces\" | \"backslash\";\n\tcodeBlockStyle?: \"indented\" | \"backticks\" | \"tildes\";\n\tkeepInlineImagesIn?: string[];\n\tencoding?: string;\n\tdebug?: boolean;\n\tstripTags?: string[];\n\tpreserveTags?: string[];\n\tpreprocessing?: HtmlPreprocessingOptions;\n}\n\nexport type KeywordAlgorithm = \"yake\" | \"rake\";\n\nexport interface YakeParams {\n\twindowSize?: number;\n}\n\nexport interface RakeParams {\n\tminWordLength?: number;\n\tmaxWordsPerPhrase?: number;\n}\n\nexport interface KeywordConfig {\n\talgorithm?: KeywordAlgorithm;\n\tmaxKeywords?: number;\n\tminScore?: number;\n\tngramRange?: [number, number];\n\tlanguage?: string;\n\tyakeParams?: YakeParams;\n\trakeParams?: RakeParams;\n}\n\n/**\n * Page tracking and extraction configuration.\n *\n * Controls how pages/slides/sheets are extracted and tracked in the document.\n * Page range information in chunk metadata (first_page/last_page) is automatically\n * enabled when page boundaries are available and chunking is configured.\n */\nexport interface PageConfig {\n\t/** Extract pages as separate array (ExtractionResult.pages) */\n\textractPages?: boolean;\n\t/** Insert page markers in main content string */\n\tinsertPageMarkers?: boolean;\n\t/** Page marker format (use {page_num} placeholder) */\n\tmarkerFormat?: string;\n}\n\nexport interface ExtractionConfig {\n\tuseCache?: boolean;\n\tenableQualityProcessing?: boolean;\n\tocr?: OcrConfig;\n\tforceOcr?: boolean;\n\tchunking?: ChunkingConfig;\n\timages?: ImageExtractionConfig;\n\tpdfOptions?: PdfConfig;\n\ttokenReduction?: TokenReductionConfig;\n\tlanguageDetection?: LanguageDetectionConfig;\n\tpostprocessor?: PostProcessorConfig;\n\thtmlOptions?: HtmlConversionOptions;\n\tkeywords?: KeywordConfig;\n\tpages?: PageConfig;\n\tmaxConcurrentExtractions?: number;\n}\n\nexport interface Table {\n\tcells: string[][];\n\tmarkdown: string;\n\tpageNumber: number;\n}\n\nexport interface ExcelMetadata {\n\tsheetCount?: number;\n\tsheetNames?: string[];\n}\n\nexport interface EmailMetadata {\n\tfromEmail?: string | null;\n\tfromName?: string | null;\n\ttoEmails?: string[];\n\tccEmails?: string[];\n\tbccEmails?: string[];\n\tmessageId?: string | null;\n\tattachments?: string[];\n}\n\nexport interface ArchiveMetadata {\n\tformat?: string;\n\tfileCount?: number;\n\tfileList?: string[];\n\ttotalSize?: number;\n\tcompressedSize?: number | null;\n}\n\nexport interface ImageMetadata {\n\twidth?: number;\n\theight?: number;\n\tformat?: string;\n\texif?: Record<string, string>;\n}\n\nexport interface XmlMetadata {\n\telementCount?: number;\n\tuniqueElements?: string[];\n}\n\nexport interface TextMetadata {\n\tlineCount?: number;\n\twordCount?: number;\n\tcharacterCount?: number;\n\theaders?: string[] | null;\n\tlinks?: [string, string][] | null;\n\tcodeBlocks?: [string, string][] | null;\n}\n\nexport interface HtmlMetadata {\n\ttitle?: string | null;\n\tdescription?: string | null;\n\tkeywords?: string | null;\n\tauthor?: string | null;\n\tcanonical?: string | null;\n\tbaseHref?: string | null;\n\togTitle?: string | null;\n\togDescription?: string | null;\n\togImage?: string | null;\n\togUrl?: string | null;\n\togType?: string | null;\n\togSiteName?: string | null;\n\ttwitterCard?: string | null;\n\ttwitterTitle?: string | null;\n\ttwitterDescription?: string | null;\n\ttwitterImage?: string | null;\n\ttwitterSite?: string | null;\n\ttwitterCreator?: string | null;\n\tlinkAuthor?: string | null;\n\tlinkLicense?: string | null;\n\tlinkAlternate?: string | null;\n}\n\nexport interface PdfMetadata {\n\ttitle?: string | null;\n\tauthor?: string | null;\n\tsubject?: string | null;\n\tkeywords?: string | null;\n\tcreator?: string | null;\n\tproducer?: string | null;\n\tcreationDate?: string | null;\n\tmodificationDate?: string | null;\n\tpageCount?: number;\n}\n\nexport interface PptxMetadata {\n\ttitle?: string | null;\n\tauthor?: string | null;\n\tdescription?: string | null;\n\tsummary?: string | null;\n\tfonts?: string[];\n}\n\nexport interface OcrMetadata {\n\tlanguage?: string;\n\tpsm?: number;\n\toutputFormat?: string;\n\ttableCount?: number;\n\ttableRows?: number | null;\n\ttableCols?: number | null;\n}\n\nexport interface ImagePreprocessingMetadata {\n\toriginalDimensions?: [number, number];\n\toriginalDpi?: [number, number];\n\ttargetDpi?: number;\n\tscaleFactor?: number;\n\tautoAdjusted?: boolean;\n\tfinalDpi?: number;\n\tnewDimensions?: [number, number] | null;\n\tresampleMethod?: string;\n\tdimensionClamped?: boolean;\n\tcalculatedDpi?: number | null;\n\tskippedResize?: boolean;\n\tresizeError?: string | null;\n}\n\nexport interface ErrorMetadata {\n\terrorType?: string;\n\tmessage?: string;\n}\n\n/**\n * Page boundary information for chunk metadata.\n *\n * Tracks where a specific page's content starts and ends in the main content string,\n * enabling mapping from byte positions to page numbers. All offsets are guaranteed to be\n * at valid UTF-8 character boundaries.\n */\nexport interface PageBoundary {\n\t/** Byte offset where this page starts in the content string (UTF-8 valid boundary, inclusive) */\n\tbyteStart: number;\n\t/** Byte offset where this page ends in the content string (UTF-8 valid boundary, exclusive) */\n\tbyteEnd: number;\n\t/** Page number (1-indexed) */\n\tpageNumber: number;\n}\n\n/**\n * Type of paginated unit in a document.\n *\n * Distinguishes between different types of \"pages\":\n * - \"page\": Standard document pages (PDF, DOCX, images)\n * - \"slide\": Presentation slides (PPTX, ODP)\n * - \"sheet\": Spreadsheet sheets (XLSX, ODS)\n */\nexport type PageUnitType = \"page\" | \"slide\" | \"sheet\";\n\n/**\n * Detailed per-page metadata.\n *\n * Captures information about a single page/slide/sheet including dimensions,\n * content counts, and visibility state.\n */\nexport interface PageInfo {\n\t/** Page number (1-indexed) */\n\tnumber: number;\n\t/** Page title (usually for presentations) */\n\ttitle?: string | null;\n\t/** Dimensions in points (PDF) or pixels (images): [width, height] */\n\tdimensions?: [number, number] | null;\n\t/** Number of images on this page */\n\timageCount?: number | null;\n\t/** Number of tables on this page */\n\ttableCount?: number | null;\n\t/** Whether this page is hidden (e.g., in presentations) */\n\thidden?: boolean | null;\n}\n\n/**\n * Page structure metadata.\n *\n * Contains information about pages/slides/sheets in a document, including\n * boundaries for mapping chunks to pages and detailed per-page metadata.\n */\nexport interface PageStructure {\n\t/** Total number of pages/slides/sheets */\n\ttotalCount: number;\n\t/** Type of paginated unit (page, slide, or sheet) */\n\tunitType: PageUnitType;\n\t/** Byte offset boundaries for each page */\n\tboundaries?: PageBoundary[] | null;\n\t/** Detailed per-page metadata (optional, only when needed) */\n\tpages?: PageInfo[] | null;\n}\n\n/**\n * Metadata about a chunk's position and properties in the document.\n *\n * Tracks where a chunk appears in the original document, including byte offsets\n * and page ranges when page tracking is enabled.\n */\nexport interface ChunkMetadata {\n\t/** Byte offset where this chunk starts in the original text (UTF-8 valid boundary) */\n\tbyteStart: number;\n\t/** Byte offset where this chunk ends in the original text (UTF-8 valid boundary) */\n\tbyteEnd: number;\n\t/** Number of tokens in this chunk (if available from embedding model) */\n\ttokenCount?: number | null;\n\t/** Zero-based index of this chunk in the document */\n\tchunkIndex: number;\n\t/** Total number of chunks in the document */\n\ttotalChunks: number;\n\t/** First page number this chunk spans (1-indexed, only when page tracking enabled) */\n\tfirstPage?: number | null;\n\t/** Last page number this chunk spans (1-indexed, only when page tracking enabled) */\n\tlastPage?: number | null;\n}\n\nexport interface Chunk {\n\tcontent: string;\n\tembedding?: number[] | null;\n\tmetadata: ChunkMetadata;\n}\n\nexport interface ExtractedImage {\n\tdata: Uint8Array;\n\tformat: string;\n\timageIndex: number;\n\tpageNumber?: number | null;\n\twidth?: number | null;\n\theight?: number | null;\n\tcolorspace?: string | null;\n\tbitsPerComponent?: number | null;\n\tisMask: boolean;\n\tdescription?: string | null;\n\tocrResult?: ExtractionResult | null;\n}\n\n/**\n * Content for a single page/slide/sheet.\n *\n * When page extraction is enabled, documents are split into per-page content\n * with associated tables and images mapped to each page.\n */\nexport interface PageContent {\n\t/** Page number (1-indexed) */\n\tpageNumber: number;\n\t/** Text content for this page */\n\tcontent: string;\n\t/** Tables found on this page */\n\ttables: Table[];\n\t/** Images found on this page */\n\timages: ExtractedImage[];\n}\n\n/**\n * Extraction result metadata.\n *\n * Uses a flattened discriminated union approach with format_type as the discriminator.\n * When format_type is set (e.g., \"archive\"), the corresponding format-specific fields\n * are available at the root level of the metadata object.\n *\n * This structure matches the Rust serialization with serde's tagged enum flattening.\n */\nexport interface Metadata {\n\tlanguage?: string | null;\n\tdate?: string | null;\n\tsubject?: string | null;\n\n\tformat_type?: \"pdf\" | \"excel\" | \"email\" | \"pptx\" | \"archive\" | \"image\" | \"xml\" | \"text\" | \"html\" | \"ocr\";\n\n\ttitle?: string | null;\n\tauthor?: string | null;\n\tkeywords?: string | null;\n\tcreator?: string | null;\n\tproducer?: string | null;\n\tcreation_date?: string | null;\n\tmodification_date?: string | null;\n\tpage_count?: number;\n\n\tsheet_count?: number;\n\tsheet_names?: string[];\n\n\tfrom_email?: string | null;\n\tfrom_name?: string | null;\n\tto_emails?: string[];\n\tcc_emails?: string[];\n\tbcc_emails?: string[];\n\tmessage_id?: string | null;\n\tattachments?: string[];\n\n\tdescription?: string | null;\n\tsummary?: string | null;\n\tfonts?: string[];\n\n\tformat?: string;\n\tfile_count?: number;\n\tfile_list?: string[];\n\ttotal_size?: number;\n\tcompressed_size?: number | null;\n\n\twidth?: number;\n\theight?: number;\n\texif?: Record<string, string>;\n\n\telement_count?: number;\n\tunique_elements?: string[];\n\n\tline_count?: number;\n\tword_count?: number;\n\tcharacter_count?: number;\n\theaders?: string[] | null;\n\tlinks?: [string, string][] | null;\n\tcode_blocks?: [string, string][] | null;\n\n\tcanonical?: string | null;\n\tbase_href?: string | null;\n\tog_title?: string | null;\n\tog_description?: string | null;\n\tog_image?: string | null;\n\tog_url?: string | null;\n\tog_type?: string | null;\n\tog_site_name?: string | null;\n\ttwitter_card?: string | null;\n\ttwitter_title?: string | null;\n\ttwitter_description?: string | null;\n\ttwitter_image?: string | null;\n\ttwitter_site?: string | null;\n\ttwitter_creator?: string | null;\n\tlink_author?: string | null;\n\tlink_license?: string | null;\n\tlink_alternate?: string | null;\n\n\tpsm?: number;\n\toutput_format?: string;\n\ttable_count?: number;\n\ttable_rows?: number | null;\n\ttable_cols?: number | null;\n\n\timage_preprocessing?: ImagePreprocessingMetadata | null;\n\n\tjson_schema?: Record<string, unknown> | null;\n\n\tpage_structure?: PageStructure | null;\n\n\terror?: ErrorMetadata | null;\n\n\t// biome-ignore lint/suspicious/noExplicitAny: Postprocessors can add arbitrary metadata fields\n\t[key: string]: any;\n}\n\nexport interface ExtractionResult {\n\tcontent: string;\n\tmimeType: string;\n\tmetadata: Metadata;\n\ttables: Table[];\n\tdetectedLanguages: string[] | null;\n\tchunks: Chunk[] | null;\n\timages: ExtractedImage[] | null;\n\tpages?: PageContent[] | null;\n}\n\nexport type ProcessingStage = \"early\" | \"middle\" | \"late\";\n\nexport interface PostProcessorProtocol {\n\t/**\n\t * Return the unique name of this postprocessor.\n\t */\n\tname(): string;\n\n\t/**\n\t * Process and enrich an extraction result.\n\t *\n\t * @param result - ExtractionResult with extracted content, metadata, and tables\n\t * @returns Modified result with enriched metadata\n\t */\n\tprocess(result: ExtractionResult): ExtractionResult | Promise<ExtractionResult>;\n\n\t/**\n\t * Return the processing stage for this processor.\n\t *\n\t * @returns One of \"early\", \"middle\", or \"late\" (default: \"middle\")\n\t */\n\tprocessingStage?(): ProcessingStage;\n\n\t/**\n\t * Initialize the processor (e.g., load ML models).\n\t *\n\t * Called once when the processor is registered.\n\t */\n\tinitialize?(): void | Promise<void>;\n\n\t/**\n\t * Shutdown the processor and release resources.\n\t *\n\t * Called when the processor is unregistered.\n\t */\n\tshutdown?(): void | Promise<void>;\n}\n\nexport interface ValidatorProtocol {\n\t/**\n\t * Return the unique name of this validator.\n\t */\n\tname(): string;\n\n\t/**\n\t * Validate an extraction result.\n\t *\n\t * Throw an error if validation fails. The error message should explain why validation failed.\n\t * If validation passes, return without throwing.\n\t *\n\t * @param result - ExtractionResult to validate\n\t * @throws Error if validation fails (extraction will fail)\n\t */\n\tvalidate(result: ExtractionResult): void | Promise<void>;\n\n\t/**\n\t * Return the validation priority.\n\t *\n\t * Higher priority validators run first. Useful for running cheap validations before expensive ones.\n\t *\n\t * @returns Priority value (higher = runs earlier, default: 50)\n\t */\n\tpriority?(): number;\n\n\t/**\n\t * Check if this validator should run for a given result.\n\t *\n\t * Allows conditional validation based on MIME type, metadata, or content.\n\t *\n\t * @param result - ExtractionResult to check\n\t * @returns true if validator should run, false to skip (default: true)\n\t */\n\tshouldValidate?(result: ExtractionResult): boolean;\n\n\t/**\n\t * Initialize the validator.\n\t *\n\t * Called once when the validator is registered.\n\t */\n\tinitialize?(): void | Promise<void>;\n\n\t/**\n\t * Shutdown the validator and release resources.\n\t *\n\t * Called when the validator is unregistered.\n\t */\n\tshutdown?(): void | Promise<void>;\n}\n\n/**\n * OCR backend protocol for implementing custom OCR engines.\n *\n * This interface defines the contract for OCR backends that can be registered\n * with Kreuzberg's extraction pipeline.\n *\n * ## Implementation Requirements\n *\n * OCR backends must implement:\n * - `name()`: Return a unique backend identifier\n * - `supportedLanguages()`: Return list of supported ISO 639-1/2/3 language codes\n * - `processImage()`: Process image bytes and return extraction result\n *\n * ## Optional Methods\n *\n * - `initialize()`: Called when backend is registered (load models, etc.)\n * - `shutdown()`: Called when backend is unregistered (cleanup resources)\n *\n * @example\n * ```typescript\n * import { GutenOcrBackend } from '@kreuzberg/node/ocr/guten-ocr';\n * import { registerOcrBackend, extractFile } from '@kreuzberg/node';\n *\n * // Create and register the backend\n * const backend = new GutenOcrBackend();\n * await backend.initialize();\n * registerOcrBackend(backend);\n *\n * // Use with extraction\n * const result = await extractFile('scanned.pdf', null, {\n * ocr: { backend: 'guten-ocr', language: 'en' }\n * });\n * ```\n */\nexport interface OcrBackendProtocol {\n\t/**\n\t * Return the unique name of this OCR backend.\n\t *\n\t * This name is used in ExtractionConfig to select the backend:\n\t * ```typescript\n\t * { ocr: { backend: 'guten-ocr', language: 'en' } }\n\t * ```\n\t *\n\t * @returns Unique backend identifier (e.g., \"guten-ocr\", \"tesseract\")\n\t */\n\tname(): string;\n\n\t/**\n\t * Return list of supported language codes.\n\t *\n\t * Language codes should follow ISO 639-1 (2-letter) or ISO 639-2 (3-letter) standards.\n\t * Common codes: \"en\", \"eng\" (English), \"de\", \"deu\" (German), \"fr\", \"fra\" (French).\n\t *\n\t * @returns Array of supported language codes\n\t *\n\t * @example\n\t * ```typescript\n\t * supportedLanguages(): string[] {\n\t * return [\"en\", \"eng\", \"de\", \"deu\", \"fr\", \"fra\"];\n\t * }\n\t * ```\n\t */\n\tsupportedLanguages(): string[];\n\n\t/**\n\t * Process image bytes and extract text via OCR.\n\t *\n\t * This method receives raw image data and must return a result object with:\n\t * - `content`: Extracted text content\n\t * - `mime_type`: MIME type (usually \"text/plain\")\n\t * - `metadata`: Additional information (confidence, dimensions, etc.)\n\t * - `tables`: Optional array of detected tables\n\t *\n\t * @param imageBytes - Raw image data (Uint8Array) or Base64-encoded string (when called from Rust bindings)\n\t * @param language - Language code from supportedLanguages()\n\t * @returns Promise resolving to extraction result\n\t *\n\t * @example\n\t * ```typescript\n\t * async processImage(imageBytes: Uint8Array | string, language: string): Promise<{\n\t * content: string;\n\t * mime_type: string;\n\t * metadata: Record<string, unknown>;\n\t * tables: unknown[];\n\t * }> {\n\t * const buffer = typeof imageBytes === \"string\" ? Buffer.from(imageBytes, \"base64\") : Buffer.from(imageBytes);\n\t * const text = await myOcrEngine.recognize(buffer, language);\n\t * return {\n\t * content: text,\n\t * mime_type: \"text/plain\",\n\t * metadata: { confidence: 0.95, language },\n\t * tables: []\n\t * };\n\t * }\n\t * ```\n\t */\n\tprocessImage(\n\t\timageBytes: Uint8Array | string,\n\t\tlanguage: string,\n\t): Promise<{\n\t\tcontent: string;\n\t\tmime_type: string;\n\t\tmetadata: Record<string, unknown>;\n\t\ttables: unknown[];\n\t}>;\n\n\t/**\n\t * Initialize the OCR backend (optional).\n\t *\n\t * Called once when the backend is registered. Use this to:\n\t * - Load ML models\n\t * - Initialize libraries\n\t * - Validate dependencies\n\t *\n\t * @example\n\t * ```typescript\n\t * async initialize(): Promise<void> {\n\t * this.model = await loadModel('./path/to/model');\n\t * }\n\t * ```\n\t */\n\tinitialize?(): void | Promise<void>;\n\n\t/**\n\t * Shutdown the OCR backend and release resources (optional).\n\t *\n\t * Called when the backend is unregistered. Use this to:\n\t * - Free model memory\n\t * - Close file handles\n\t * - Cleanup temporary files\n\t *\n\t * @example\n\t * ```typescript\n\t * async shutdown(): Promise<void> {\n\t * await this.model.dispose();\n\t * this.model = null;\n\t * }\n\t * ```\n\t */\n\tshutdown?(): void | Promise<void>;\n}\n"],"mappings":";;;;;;;;;;;;;;AAAA;AAAA;","names":[]}
|
package/dist/types.mjs
ADDED
|
@@ -0,0 +1 @@
|
|
|
1
|
+
//# sourceMappingURL=types.mjs.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":[],"sourcesContent":[],"mappings":"","names":[]}
|
package/index.d.ts
CHANGED
|
@@ -596,11 +596,13 @@ export interface JsChunkingConfig {
|
|
|
596
596
|
}
|
|
597
597
|
|
|
598
598
|
export interface JsChunkMetadata {
|
|
599
|
-
|
|
600
|
-
|
|
599
|
+
byteStart: number
|
|
600
|
+
byteEnd: number
|
|
601
601
|
tokenCount?: number
|
|
602
602
|
chunkIndex: number
|
|
603
603
|
totalChunks: number
|
|
604
|
+
firstPage?: number
|
|
605
|
+
lastPage?: number
|
|
604
606
|
}
|
|
605
607
|
|
|
606
608
|
/** Embedding generation configuration for Node.js bindings. */
|
|
@@ -662,6 +664,7 @@ export interface JsExtractionConfig {
|
|
|
662
664
|
keywords?: JsKeywordConfig
|
|
663
665
|
htmlOptions?: JsHtmlOptions
|
|
664
666
|
maxConcurrentExtractions?: number
|
|
667
|
+
pages?: JsPageConfig
|
|
665
668
|
}
|
|
666
669
|
|
|
667
670
|
export interface JsExtractionResult {
|
|
@@ -746,6 +749,12 @@ export interface JsOcrConfig {
|
|
|
746
749
|
tesseractConfig?: JsTesseractConfig
|
|
747
750
|
}
|
|
748
751
|
|
|
752
|
+
export interface JsPageConfig {
|
|
753
|
+
extractPages?: boolean
|
|
754
|
+
insertPageMarkers?: boolean
|
|
755
|
+
markerFormat?: string
|
|
756
|
+
}
|
|
757
|
+
|
|
749
758
|
export interface JsPdfConfig {
|
|
750
759
|
extractImages?: boolean
|
|
751
760
|
passwords?: Array<string>
|
package/index.js
CHANGED
|
@@ -77,8 +77,8 @@ function requireNative() {
|
|
|
77
77
|
try {
|
|
78
78
|
const binding = require('@kreuzberg/node-android-arm64')
|
|
79
79
|
const bindingPackageVersion = require('@kreuzberg/node-android-arm64/package.json').version
|
|
80
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
81
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
80
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
81
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
82
82
|
}
|
|
83
83
|
return binding
|
|
84
84
|
} catch (e) {
|
|
@@ -93,8 +93,8 @@ function requireNative() {
|
|
|
93
93
|
try {
|
|
94
94
|
const binding = require('@kreuzberg/node-android-arm-eabi')
|
|
95
95
|
const bindingPackageVersion = require('@kreuzberg/node-android-arm-eabi/package.json').version
|
|
96
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
97
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
96
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
97
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
98
98
|
}
|
|
99
99
|
return binding
|
|
100
100
|
} catch (e) {
|
|
@@ -114,8 +114,8 @@ function requireNative() {
|
|
|
114
114
|
try {
|
|
115
115
|
const binding = require('@kreuzberg/node-win32-x64-gnu')
|
|
116
116
|
const bindingPackageVersion = require('@kreuzberg/node-win32-x64-gnu/package.json').version
|
|
117
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
118
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
117
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
118
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
119
119
|
}
|
|
120
120
|
return binding
|
|
121
121
|
} catch (e) {
|
|
@@ -130,8 +130,8 @@ function requireNative() {
|
|
|
130
130
|
try {
|
|
131
131
|
const binding = require('@kreuzberg/node-win32-x64-msvc')
|
|
132
132
|
const bindingPackageVersion = require('@kreuzberg/node-win32-x64-msvc/package.json').version
|
|
133
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
134
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
133
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
134
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
135
135
|
}
|
|
136
136
|
return binding
|
|
137
137
|
} catch (e) {
|
|
@@ -147,8 +147,8 @@ function requireNative() {
|
|
|
147
147
|
try {
|
|
148
148
|
const binding = require('@kreuzberg/node-win32-ia32-msvc')
|
|
149
149
|
const bindingPackageVersion = require('@kreuzberg/node-win32-ia32-msvc/package.json').version
|
|
150
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
151
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
150
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
151
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
152
152
|
}
|
|
153
153
|
return binding
|
|
154
154
|
} catch (e) {
|
|
@@ -163,8 +163,8 @@ function requireNative() {
|
|
|
163
163
|
try {
|
|
164
164
|
const binding = require('@kreuzberg/node-win32-arm64-msvc')
|
|
165
165
|
const bindingPackageVersion = require('@kreuzberg/node-win32-arm64-msvc/package.json').version
|
|
166
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
167
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
166
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
167
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
168
168
|
}
|
|
169
169
|
return binding
|
|
170
170
|
} catch (e) {
|
|
@@ -182,8 +182,8 @@ function requireNative() {
|
|
|
182
182
|
try {
|
|
183
183
|
const binding = require('@kreuzberg/node-darwin-universal')
|
|
184
184
|
const bindingPackageVersion = require('@kreuzberg/node-darwin-universal/package.json').version
|
|
185
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
186
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
185
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
186
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
187
187
|
}
|
|
188
188
|
return binding
|
|
189
189
|
} catch (e) {
|
|
@@ -198,8 +198,8 @@ function requireNative() {
|
|
|
198
198
|
try {
|
|
199
199
|
const binding = require('@kreuzberg/node-darwin-x64')
|
|
200
200
|
const bindingPackageVersion = require('@kreuzberg/node-darwin-x64/package.json').version
|
|
201
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
202
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
201
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
202
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
203
203
|
}
|
|
204
204
|
return binding
|
|
205
205
|
} catch (e) {
|
|
@@ -214,8 +214,8 @@ function requireNative() {
|
|
|
214
214
|
try {
|
|
215
215
|
const binding = require('@kreuzberg/node-darwin-arm64')
|
|
216
216
|
const bindingPackageVersion = require('@kreuzberg/node-darwin-arm64/package.json').version
|
|
217
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
218
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
217
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
218
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
219
219
|
}
|
|
220
220
|
return binding
|
|
221
221
|
} catch (e) {
|
|
@@ -234,8 +234,8 @@ function requireNative() {
|
|
|
234
234
|
try {
|
|
235
235
|
const binding = require('@kreuzberg/node-freebsd-x64')
|
|
236
236
|
const bindingPackageVersion = require('@kreuzberg/node-freebsd-x64/package.json').version
|
|
237
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
238
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
237
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
238
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
239
239
|
}
|
|
240
240
|
return binding
|
|
241
241
|
} catch (e) {
|
|
@@ -250,8 +250,8 @@ function requireNative() {
|
|
|
250
250
|
try {
|
|
251
251
|
const binding = require('@kreuzberg/node-freebsd-arm64')
|
|
252
252
|
const bindingPackageVersion = require('@kreuzberg/node-freebsd-arm64/package.json').version
|
|
253
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
254
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
253
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
254
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
255
255
|
}
|
|
256
256
|
return binding
|
|
257
257
|
} catch (e) {
|
|
@@ -271,8 +271,8 @@ function requireNative() {
|
|
|
271
271
|
try {
|
|
272
272
|
const binding = require('@kreuzberg/node-linux-x64-musl')
|
|
273
273
|
const bindingPackageVersion = require('@kreuzberg/node-linux-x64-musl/package.json').version
|
|
274
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
275
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
274
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
275
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
276
276
|
}
|
|
277
277
|
return binding
|
|
278
278
|
} catch (e) {
|
|
@@ -287,8 +287,8 @@ function requireNative() {
|
|
|
287
287
|
try {
|
|
288
288
|
const binding = require('@kreuzberg/node-linux-x64-gnu')
|
|
289
289
|
const bindingPackageVersion = require('@kreuzberg/node-linux-x64-gnu/package.json').version
|
|
290
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
291
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
290
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
291
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
292
292
|
}
|
|
293
293
|
return binding
|
|
294
294
|
} catch (e) {
|
|
@@ -305,8 +305,8 @@ function requireNative() {
|
|
|
305
305
|
try {
|
|
306
306
|
const binding = require('@kreuzberg/node-linux-arm64-musl')
|
|
307
307
|
const bindingPackageVersion = require('@kreuzberg/node-linux-arm64-musl/package.json').version
|
|
308
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
309
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
308
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
309
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
310
310
|
}
|
|
311
311
|
return binding
|
|
312
312
|
} catch (e) {
|
|
@@ -321,8 +321,8 @@ function requireNative() {
|
|
|
321
321
|
try {
|
|
322
322
|
const binding = require('@kreuzberg/node-linux-arm64-gnu')
|
|
323
323
|
const bindingPackageVersion = require('@kreuzberg/node-linux-arm64-gnu/package.json').version
|
|
324
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
325
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
324
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
325
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
326
326
|
}
|
|
327
327
|
return binding
|
|
328
328
|
} catch (e) {
|
|
@@ -339,8 +339,8 @@ function requireNative() {
|
|
|
339
339
|
try {
|
|
340
340
|
const binding = require('@kreuzberg/node-linux-arm-musleabihf')
|
|
341
341
|
const bindingPackageVersion = require('@kreuzberg/node-linux-arm-musleabihf/package.json').version
|
|
342
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
343
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
342
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
343
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
344
344
|
}
|
|
345
345
|
return binding
|
|
346
346
|
} catch (e) {
|
|
@@ -355,8 +355,8 @@ function requireNative() {
|
|
|
355
355
|
try {
|
|
356
356
|
const binding = require('@kreuzberg/node-linux-arm-gnueabihf')
|
|
357
357
|
const bindingPackageVersion = require('@kreuzberg/node-linux-arm-gnueabihf/package.json').version
|
|
358
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
359
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
358
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
359
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
360
360
|
}
|
|
361
361
|
return binding
|
|
362
362
|
} catch (e) {
|
|
@@ -373,8 +373,8 @@ function requireNative() {
|
|
|
373
373
|
try {
|
|
374
374
|
const binding = require('@kreuzberg/node-linux-loong64-musl')
|
|
375
375
|
const bindingPackageVersion = require('@kreuzberg/node-linux-loong64-musl/package.json').version
|
|
376
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
377
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
376
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
377
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
378
378
|
}
|
|
379
379
|
return binding
|
|
380
380
|
} catch (e) {
|
|
@@ -389,8 +389,8 @@ function requireNative() {
|
|
|
389
389
|
try {
|
|
390
390
|
const binding = require('@kreuzberg/node-linux-loong64-gnu')
|
|
391
391
|
const bindingPackageVersion = require('@kreuzberg/node-linux-loong64-gnu/package.json').version
|
|
392
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
393
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
392
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
393
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
394
394
|
}
|
|
395
395
|
return binding
|
|
396
396
|
} catch (e) {
|
|
@@ -407,8 +407,8 @@ function requireNative() {
|
|
|
407
407
|
try {
|
|
408
408
|
const binding = require('@kreuzberg/node-linux-riscv64-musl')
|
|
409
409
|
const bindingPackageVersion = require('@kreuzberg/node-linux-riscv64-musl/package.json').version
|
|
410
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
411
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
410
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
411
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
412
412
|
}
|
|
413
413
|
return binding
|
|
414
414
|
} catch (e) {
|
|
@@ -423,8 +423,8 @@ function requireNative() {
|
|
|
423
423
|
try {
|
|
424
424
|
const binding = require('@kreuzberg/node-linux-riscv64-gnu')
|
|
425
425
|
const bindingPackageVersion = require('@kreuzberg/node-linux-riscv64-gnu/package.json').version
|
|
426
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
427
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
426
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
427
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
428
428
|
}
|
|
429
429
|
return binding
|
|
430
430
|
} catch (e) {
|
|
@@ -440,8 +440,8 @@ function requireNative() {
|
|
|
440
440
|
try {
|
|
441
441
|
const binding = require('@kreuzberg/node-linux-ppc64-gnu')
|
|
442
442
|
const bindingPackageVersion = require('@kreuzberg/node-linux-ppc64-gnu/package.json').version
|
|
443
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
444
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
443
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
444
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
445
445
|
}
|
|
446
446
|
return binding
|
|
447
447
|
} catch (e) {
|
|
@@ -456,8 +456,8 @@ function requireNative() {
|
|
|
456
456
|
try {
|
|
457
457
|
const binding = require('@kreuzberg/node-linux-s390x-gnu')
|
|
458
458
|
const bindingPackageVersion = require('@kreuzberg/node-linux-s390x-gnu/package.json').version
|
|
459
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
460
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
459
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
460
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
461
461
|
}
|
|
462
462
|
return binding
|
|
463
463
|
} catch (e) {
|
|
@@ -476,8 +476,8 @@ function requireNative() {
|
|
|
476
476
|
try {
|
|
477
477
|
const binding = require('@kreuzberg/node-openharmony-arm64')
|
|
478
478
|
const bindingPackageVersion = require('@kreuzberg/node-openharmony-arm64/package.json').version
|
|
479
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
480
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
479
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
480
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
481
481
|
}
|
|
482
482
|
return binding
|
|
483
483
|
} catch (e) {
|
|
@@ -492,8 +492,8 @@ function requireNative() {
|
|
|
492
492
|
try {
|
|
493
493
|
const binding = require('@kreuzberg/node-openharmony-x64')
|
|
494
494
|
const bindingPackageVersion = require('@kreuzberg/node-openharmony-x64/package.json').version
|
|
495
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
496
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
495
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
496
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
497
497
|
}
|
|
498
498
|
return binding
|
|
499
499
|
} catch (e) {
|
|
@@ -508,8 +508,8 @@ function requireNative() {
|
|
|
508
508
|
try {
|
|
509
509
|
const binding = require('@kreuzberg/node-openharmony-arm')
|
|
510
510
|
const bindingPackageVersion = require('@kreuzberg/node-openharmony-arm/package.json').version
|
|
511
|
-
if (bindingPackageVersion !== '4.0.0-rc.
|
|
512
|
-
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.
|
|
511
|
+
if (bindingPackageVersion !== '4.0.0-rc.8' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
512
|
+
throw new Error(`Native binding package version mismatch, expected 4.0.0-rc.8 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
513
513
|
}
|
|
514
514
|
return binding
|
|
515
515
|
} catch (e) {
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@kreuzberg/node",
|
|
3
|
-
"version": "4.0.0-rc.
|
|
3
|
+
"version": "4.0.0-rc.8",
|
|
4
4
|
"description": "Kreuzberg document intelligence - Node.js native bindings",
|
|
5
5
|
"author": {
|
|
6
6
|
"name": "Na'aman Hirschfeld",
|
|
@@ -27,11 +27,11 @@
|
|
|
27
27
|
}
|
|
28
28
|
},
|
|
29
29
|
"bin": {
|
|
30
|
-
"kreuzberg": "
|
|
30
|
+
"kreuzberg": "dist/cli.js"
|
|
31
31
|
},
|
|
32
32
|
"repository": {
|
|
33
33
|
"type": "git",
|
|
34
|
-
"url": "https://github.com/kreuzberg-dev/kreuzberg.git"
|
|
34
|
+
"url": "git+https://github.com/kreuzberg-dev/kreuzberg.git"
|
|
35
35
|
},
|
|
36
36
|
"license": "MIT",
|
|
37
37
|
"keywords": [
|
|
@@ -82,31 +82,6 @@
|
|
|
82
82
|
"registry": "https://registry.npmjs.org/",
|
|
83
83
|
"access": "public"
|
|
84
84
|
},
|
|
85
|
-
"devDependencies": {
|
|
86
|
-
"@napi-rs/cli": "^3.5.0",
|
|
87
|
-
"@types/archiver": "^7.0.0",
|
|
88
|
-
"@types/node": "^24.10.2",
|
|
89
|
-
"@types/which": "^3.0.4",
|
|
90
|
-
"@vitest/coverage-v8": "^4.0.15",
|
|
91
|
-
"archiver": "^7.0.1",
|
|
92
|
-
"oxlint": "^1.32.0",
|
|
93
|
-
"tsup": "^8.5.1",
|
|
94
|
-
"typescript": "^5.9.3",
|
|
95
|
-
"vitest": "^4.0.15"
|
|
96
|
-
},
|
|
97
|
-
"dependencies": {
|
|
98
|
-
"@emnapi/runtime": "1.7.1",
|
|
99
|
-
"which": "^6.0.0"
|
|
100
|
-
},
|
|
101
|
-
"optionalDependencies": {
|
|
102
|
-
"@kreuzberg/node-darwin-x64": "4.0.0-rc.6",
|
|
103
|
-
"@kreuzberg/node-darwin-arm64": "4.0.0-rc.6",
|
|
104
|
-
"@kreuzberg/node-win32-x64-msvc": "4.0.0-rc.6",
|
|
105
|
-
"@kreuzberg/node-win32-arm64-msvc": "4.0.0-rc.6",
|
|
106
|
-
"@kreuzberg/node-linux-x64-gnu": "4.0.0-rc.6",
|
|
107
|
-
"@kreuzberg/node-linux-arm64-gnu": "4.0.0-rc.6",
|
|
108
|
-
"@kreuzberg/node-linux-arm-gnueabihf": "4.0.0-rc.6"
|
|
109
|
-
},
|
|
110
85
|
"scripts": {
|
|
111
86
|
"artifacts": "napi artifacts",
|
|
112
87
|
"build": "napi build --platform --release && tsup",
|
|
@@ -122,7 +97,33 @@
|
|
|
122
97
|
"lint": "biome check typescript && oxlint typescript",
|
|
123
98
|
"lint:fix": "biome check --write typescript",
|
|
124
99
|
"format": "biome format --write typescript",
|
|
100
|
+
"prepublishOnly": "napi prepublish -t npm",
|
|
125
101
|
"universal": "napi universal",
|
|
126
102
|
"version": "napi version"
|
|
103
|
+
},
|
|
104
|
+
"devDependencies": {
|
|
105
|
+
"@napi-rs/cli": "^3.5.0",
|
|
106
|
+
"@types/archiver": "^7.0.0",
|
|
107
|
+
"@types/node": "^25.0.2",
|
|
108
|
+
"@types/which": "^3.0.4",
|
|
109
|
+
"@vitest/coverage-v8": "^4.0.15",
|
|
110
|
+
"archiver": "^7.0.1",
|
|
111
|
+
"oxlint": "^1.32.0",
|
|
112
|
+
"tsup": "^8.5.1",
|
|
113
|
+
"typescript": "^5.9.3",
|
|
114
|
+
"vitest": "^4.0.15"
|
|
115
|
+
},
|
|
116
|
+
"dependencies": {
|
|
117
|
+
"@emnapi/runtime": "1.7.1",
|
|
118
|
+
"which": "^6.0.0"
|
|
119
|
+
},
|
|
120
|
+
"optionalDependencies": {
|
|
121
|
+
"@kreuzberg/node-darwin-arm64": "4.0.0-rc.8",
|
|
122
|
+
"@kreuzberg/node-darwin-x64": "4.0.0-rc.8",
|
|
123
|
+
"@kreuzberg/node-linux-arm-gnueabihf": "4.0.0-rc.8",
|
|
124
|
+
"@kreuzberg/node-linux-arm64-gnu": "4.0.0-rc.8",
|
|
125
|
+
"@kreuzberg/node-linux-x64-gnu": "4.0.0-rc.8",
|
|
126
|
+
"@kreuzberg/node-win32-arm64-msvc": "4.0.0-rc.8",
|
|
127
|
+
"@kreuzberg/node-win32-x64-msvc": "4.0.0-rc.8"
|
|
127
128
|
}
|
|
128
|
-
}
|
|
129
|
+
}
|
package/LICENSE
DELETED
|
@@ -1,7 +0,0 @@
|
|
|
1
|
-
Copyright 2025 Na'aman Hirschfeld
|
|
2
|
-
|
|
3
|
-
Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the “Software”), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:
|
|
4
|
-
|
|
5
|
-
The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.
|
|
6
|
-
|
|
7
|
-
THE SOFTWARE IS PROVIDED “AS IS”, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|