@kreuzberg/wasm 4.5.0 → 4.5.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/README.md
CHANGED
|
@@ -22,7 +22,7 @@
|
|
|
22
22
|
<img src="https://img.shields.io/maven-central/v/dev.kreuzberg/kreuzberg?label=Java&color=007ec6" alt="Java">
|
|
23
23
|
</a>
|
|
24
24
|
<a href="https://github.com/kreuzberg-dev/kreuzberg/releases">
|
|
25
|
-
<img src="https://img.shields.io/github/v/tag/kreuzberg-dev/kreuzberg?label=Go&color=007ec6&filter=v4.5.0" alt="Go">
|
|
25
|
+
<img src="https://img.shields.io/github/v/tag/kreuzberg-dev/kreuzberg?label=Go&color=007ec6&filter=v4.5.1" alt="Go">
|
|
26
26
|
</a>
|
|
27
27
|
<a href="https://www.nuget.org/packages/Kreuzberg/">
|
|
28
28
|
<img src="https://img.shields.io/nuget/v/Kreuzberg?label=C%23&color=007ec6" alt="C#">
|
|
@@ -488,6 +488,30 @@ For advanced configuration options including language detection, table extractio
|
|
|
488
488
|
|
|
489
489
|
**[Configuration Guide](https://kreuzberg.dev/guides/configuration/)**
|
|
490
490
|
|
|
491
|
+
## Platform Limitations
|
|
492
|
+
|
|
493
|
+
WASM runs in single-threaded environments without access to ONNX Runtime, which constrains some features:
|
|
494
|
+
|
|
495
|
+
### Unsupported Features
|
|
496
|
+
|
|
497
|
+
- **Layout Detection** – Requires RT-DETR model inference via ONNX Runtime, which is unavailable in WebAssembly
|
|
498
|
+
- **Hardware Acceleration** – No GPU support (AccelerationConfig is not applicable)
|
|
499
|
+
- **Concurrency Configuration** – Single-threaded WASM environment (ConcurrencyConfig does not apply)
|
|
500
|
+
- **Email Codepage Configuration** – EmailConfig is not supported in WASM
|
|
501
|
+
|
|
502
|
+
### Supported Features
|
|
503
|
+
|
|
504
|
+
- **Text Extraction** – Full text content from all supported formats
|
|
505
|
+
- **OCR via Tesseract WASM** – Scanned document and image OCR using browser-native Tesseract
|
|
506
|
+
- **Embeddings** – FastEmbed-based vector generation
|
|
507
|
+
- **Chunking** – Text segmentation for RAG pipelines
|
|
508
|
+
- **Metadata Extraction** – Document properties, creation dates, page counts
|
|
509
|
+
- **Table Extraction** – Structured table data from PDFs and spreadsheets
|
|
510
|
+
- **Language Detection** – Identify document language
|
|
511
|
+
- **Image Extraction** – Embedded images from documents
|
|
512
|
+
|
|
513
|
+
All 88+ file formats supported by Kreuzberg are available in WASM. The one exception is functionality that requires ONNX Runtime (layout detection), which fails gracefully with an unsupported error.
|
|
514
|
+
|
|
491
515
|
## Documentation
|
|
492
516
|
|
|
493
517
|
- **[Official Documentation](https://kreuzberg.dev/)**
|
package/dist/pkg/README.md
CHANGED
|
@@ -22,7 +22,7 @@
|
|
|
22
22
|
<img src="https://img.shields.io/maven-central/v/dev.kreuzberg/kreuzberg?label=Java&color=007ec6" alt="Java">
|
|
23
23
|
</a>
|
|
24
24
|
<a href="https://github.com/kreuzberg-dev/kreuzberg/releases">
|
|
25
|
-
<img src="https://img.shields.io/github/v/tag/kreuzberg-dev/kreuzberg?label=Go&color=007ec6&filter=v4.5.0" alt="Go">
|
|
25
|
+
<img src="https://img.shields.io/github/v/tag/kreuzberg-dev/kreuzberg?label=Go&color=007ec6&filter=v4.5.1" alt="Go">
|
|
26
26
|
</a>
|
|
27
27
|
<a href="https://www.nuget.org/packages/Kreuzberg/">
|
|
28
28
|
<img src="https://img.shields.io/nuget/v/Kreuzberg?label=C%23&color=007ec6" alt="C#">
|
|
@@ -488,6 +488,30 @@ For advanced configuration options including language detection, table extractio
|
|
|
488
488
|
|
|
489
489
|
**[Configuration Guide](https://kreuzberg.dev/guides/configuration/)**
|
|
490
490
|
|
|
491
|
+
## Platform Limitations
|
|
492
|
+
|
|
493
|
+
WASM runs in single-threaded environments without access to ONNX Runtime, which constrains some features:
|
|
494
|
+
|
|
495
|
+
### Unsupported Features
|
|
496
|
+
|
|
497
|
+
- **Layout Detection** – Requires RT-DETR model inference via ONNX Runtime, which is unavailable in WebAssembly
|
|
498
|
+
- **Hardware Acceleration** – No GPU support (AccelerationConfig is not applicable)
|
|
499
|
+
- **Concurrency Configuration** – Single-threaded WASM environment (ConcurrencyConfig does not apply)
|
|
500
|
+
- **Email Codepage Configuration** – EmailConfig is not supported in WASM
|
|
501
|
+
|
|
502
|
+
### Supported Features
|
|
503
|
+
|
|
504
|
+
- **Text Extraction** – Full text content from all supported formats
|
|
505
|
+
- **OCR via Tesseract WASM** – Scanned document and image OCR using browser-native Tesseract
|
|
506
|
+
- **Embeddings** – FastEmbed-based vector generation
|
|
507
|
+
- **Chunking** – Text segmentation for RAG pipelines
|
|
508
|
+
- **Metadata Extraction** – Document properties, creation dates, page counts
|
|
509
|
+
- **Table Extraction** – Structured table data from PDFs and spreadsheets
|
|
510
|
+
- **Language Detection** – Identify document language
|
|
511
|
+
- **Image Extraction** – Embedded images from documents
|
|
512
|
+
|
|
513
|
+
All 88+ file formats supported by Kreuzberg are available in WASM. The one exception is functionality that requires ONNX Runtime (layout detection), which fails gracefully with an unsupported error.
|
|
514
|
+
|
|
491
515
|
## Documentation
|
|
492
516
|
|
|
493
517
|
- **[Official Documentation](https://kreuzberg.dev/)**
|
|
@@ -1791,7 +1791,7 @@ function __wbg_get_imports() {
|
|
|
1791
1791
|
},
|
|
1792
1792
|
__wbindgen_cast_0000000000000002: function(arg0, arg1) {
|
|
1793
1793
|
// Cast intrinsic for `Closure(Closure { dtor_idx: 4, function: Function { arguments: [Externref], shim_idx: 5, ret: Unit, inner_ret: Some(Unit) }, mutable: true }) -> Externref`.
|
|
1794
|
-
const ret = makeMutClosure(arg0, arg1, wasm.
|
|
1794
|
+
const ret = makeMutClosure(arg0, arg1, wasm.wasm_bindgen__closure__destroy__h594455dbca0a1257, wasm_bindgen__convert__closures_____invoke__h56e58b9b796ad689);
|
|
1795
1795
|
return ret;
|
|
1796
1796
|
},
|
|
1797
1797
|
__wbindgen_cast_0000000000000003: function(arg0) {
|
|
@@ -1833,8 +1833,8 @@ function __wbg_get_imports() {
|
|
|
1833
1833
|
};
|
|
1834
1834
|
}
|
|
1835
1835
|
|
|
1836
|
-
function
|
|
1837
|
-
wasm.
|
|
1836
|
+
function wasm_bindgen__convert__closures_____invoke__h56e58b9b796ad689(arg0, arg1, arg2) {
|
|
1837
|
+
wasm.wasm_bindgen__convert__closures_____invoke__h56e58b9b796ad689(arg0, arg1, arg2);
|
|
1838
1838
|
}
|
|
1839
1839
|
|
|
1840
1840
|
function wasm_bindgen__convert__closures_____invoke__h240eec0b57535315(arg0, arg1, arg2) {
|
|
@@ -1697,7 +1697,7 @@ export function __wbindgen_cast_0000000000000001(arg0, arg1) {
|
|
|
1697
1697
|
}
|
|
1698
1698
|
export function __wbindgen_cast_0000000000000002(arg0, arg1) {
|
|
1699
1699
|
// Cast intrinsic for `Closure(Closure { dtor_idx: 4, function: Function { arguments: [Externref], shim_idx: 5, ret: Unit, inner_ret: Some(Unit) }, mutable: true }) -> Externref`.
|
|
1700
|
-
const ret = makeMutClosure(arg0, arg1, wasm.
|
|
1700
|
+
const ret = makeMutClosure(arg0, arg1, wasm.wasm_bindgen__closure__destroy__h594455dbca0a1257, wasm_bindgen__convert__closures_____invoke__h56e58b9b796ad689);
|
|
1701
1701
|
return ret;
|
|
1702
1702
|
}
|
|
1703
1703
|
export function __wbindgen_cast_0000000000000003(arg0) {
|
|
@@ -1730,8 +1730,8 @@ export function __wbindgen_init_externref_table() {
|
|
|
1730
1730
|
table.set(offset + 2, true);
|
|
1731
1731
|
table.set(offset + 3, false);
|
|
1732
1732
|
}
|
|
1733
|
-
function
|
|
1734
|
-
wasm.
|
|
1733
|
+
function wasm_bindgen__convert__closures_____invoke__h56e58b9b796ad689(arg0, arg1, arg2) {
|
|
1734
|
+
wasm.wasm_bindgen__convert__closures_____invoke__h56e58b9b796ad689(arg0, arg1, arg2);
|
|
1735
1735
|
}
|
|
1736
1736
|
|
|
1737
1737
|
function wasm_bindgen__convert__closures_____invoke__h240eec0b57535315(arg0, arg1, arg2) {
|
|
Binary file
|
|
@@ -46,10 +46,10 @@ export const write_block_from_callback_wasm: (a: number, b: number, c: number) =
|
|
|
46
46
|
export const compress: (a: number, b: number, c: number, d: number) => [number, number, number];
|
|
47
47
|
export const decompress: (a: any, b: number, c: number, d: any) => [number, number];
|
|
48
48
|
export const wasm_bindgen__closure__destroy__hcbea9f36b367d3d8: (a: number, b: number) => void;
|
|
49
|
-
export const
|
|
49
|
+
export const wasm_bindgen__closure__destroy__h594455dbca0a1257: (a: number, b: number) => void;
|
|
50
50
|
export const wasm_bindgen__convert__closures_____invoke__h240eec0b57535315: (a: number, b: number, c: any) => [number, number];
|
|
51
51
|
export const wasm_bindgen__convert__closures_____invoke__h8e9fc28c4e841be2: (a: number, b: number, c: any, d: any) => void;
|
|
52
|
-
export const
|
|
52
|
+
export const wasm_bindgen__convert__closures_____invoke__h56e58b9b796ad689: (a: number, b: number, c: any) => void;
|
|
53
53
|
export const __wbindgen_externrefs: WebAssembly.Table;
|
|
54
54
|
export const __wbindgen_malloc_command_export: (a: number, b: number) => number;
|
|
55
55
|
export const __wbindgen_realloc_command_export: (a: number, b: number, c: number, d: number) => number;
|