kreuzberg 4.0.0rc15__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- kreuzberg-4.0.0rc15/Cargo.lock +7947 -0
- kreuzberg-4.0.0rc15/Cargo.toml +85 -0
- kreuzberg-4.0.0rc15/PKG-INFO +563 -0
- kreuzberg-4.0.0rc15/README.md +514 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/Cargo.toml +248 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/README.md +230 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/benches/otel_overhead.rs +48 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/build.rs +887 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/api/error.rs +81 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/api/handlers.rs +199 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/api/mod.rs +79 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/api/server.rs +353 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/api/types.rs +170 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/cache/mod.rs +1167 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/chunking/mod.rs +1877 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/chunking/processor.rs +220 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/core/batch_mode.rs +95 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/core/config.rs +1080 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/core/extractor.rs +1156 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/core/io.rs +329 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/core/mime.rs +605 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/core/mod.rs +47 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/core/pipeline.rs +1184 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/embeddings.rs +500 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/error.rs +431 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/archive.rs +954 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/docx.rs +398 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/email.rs +854 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/excel.rs +688 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/html.rs +601 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/image.rs +491 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/libreoffice.rs +574 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/markdown.rs +213 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/mod.rs +81 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/office_metadata/app_properties.rs +398 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/office_metadata/core_properties.rs +247 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/office_metadata/custom_properties.rs +240 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/office_metadata/mod.rs +130 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/office_metadata/odt_properties.rs +284 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/pptx.rs +3100 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/structured.rs +490 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/table.rs +328 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/text.rs +269 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extraction/xml.rs +333 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/archive.rs +447 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/bibtex.rs +470 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/docbook.rs +504 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/docx.rs +400 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/email.rs +157 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/epub.rs +708 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/excel.rs +345 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/fictionbook.rs +492 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/html.rs +407 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/image.rs +219 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/jats.rs +1054 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/jupyter.rs +368 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/latex.rs +653 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/markdown.rs +701 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/mod.rs +429 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/odt.rs +628 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/opml.rs +635 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/orgmode.rs +529 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/pdf.rs +749 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/pptx.rs +267 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/rst.rs +577 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/rtf.rs +809 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/security.rs +484 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/security_tests.rs +367 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/structured.rs +142 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/text.rs +265 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/typst.rs +651 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/extractors/xml.rs +147 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/image/dpi.rs +164 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/image/mod.rs +6 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/image/preprocessing.rs +417 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/image/resize.rs +89 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/keywords/config.rs +154 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/keywords/mod.rs +237 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/keywords/processor.rs +275 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/keywords/rake.rs +293 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/keywords/types.rs +68 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/keywords/yake.rs +163 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/language_detection/mod.rs +985 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/language_detection/processor.rs +219 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/lib.rs +113 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/mcp/mod.rs +35 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/mcp/server.rs +2076 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/ocr/cache.rs +469 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/ocr/error.rs +37 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/ocr/hocr.rs +216 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/ocr/mod.rs +58 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/ocr/processor.rs +863 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/ocr/table/mod.rs +4 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/ocr/table/tsv_parser.rs +144 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/ocr/tesseract_backend.rs +452 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/ocr/types.rs +393 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/ocr/utils.rs +47 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/ocr/validation.rs +206 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/panic_context.rs +154 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/pdf/bindings.rs +44 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/pdf/bundled.rs +452 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/pdf/error.rs +130 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/pdf/images.rs +139 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/pdf/metadata.rs +489 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/pdf/mod.rs +68 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/pdf/rendering.rs +368 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/pdf/table.rs +420 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/pdf/text.rs +240 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/plugins/extractor.rs +1044 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/plugins/mod.rs +212 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/plugins/ocr.rs +639 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/plugins/processor.rs +650 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/plugins/registry.rs +1339 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/plugins/traits.rs +258 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/plugins/validator.rs +967 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/stopwords/mod.rs +1470 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/text/mod.rs +25 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/text/quality.rs +697 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/text/quality_processor.rs +219 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/text/string_utils.rs +217 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/text/token_reduction/cjk_utils.rs +164 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/text/token_reduction/config.rs +100 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/text/token_reduction/core.rs +796 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/text/token_reduction/filters.rs +902 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/text/token_reduction/mod.rs +160 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/text/token_reduction/semantic.rs +619 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/text/token_reduction/simd_text.rs +147 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/types.rs +1055 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/utils/mod.rs +17 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/utils/quality.rs +959 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/src/utils/string_utils.rs +381 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/af_stopwords.json +53 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/ar_stopwords.json +482 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/bg_stopwords.json +261 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/bn_stopwords.json +400 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/br_stopwords.json +1205 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/ca_stopwords.json +280 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/cs_stopwords.json +425 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/da_stopwords.json +172 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/de_stopwords.json +622 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/el_stopwords.json +849 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/en_stopwords.json +1300 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/eo_stopwords.json +175 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/es_stopwords.json +734 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/et_stopwords.json +37 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/eu_stopwords.json +100 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/fa_stopwords.json +801 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/fi_stopwords.json +849 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/fr_stopwords.json +693 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/ga_stopwords.json +111 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/gl_stopwords.json +162 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/gu_stopwords.json +226 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/ha_stopwords.json +41 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/he_stopwords.json +196 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/hi_stopwords.json +227 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/hr_stopwords.json +181 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/hu_stopwords.json +791 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/hy_stopwords.json +47 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/id_stopwords.json +760 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/it_stopwords.json +634 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/ja_stopwords.json +136 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/kn_stopwords.json +84 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/ko_stopwords.json +681 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/ku_stopwords.json +64 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/la_stopwords.json +51 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/lt_stopwords.json +476 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/lv_stopwords.json +163 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/ml_stopwords.json +1 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/mr_stopwords.json +101 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/ms_stopwords.json +477 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/ne_stopwords.json +490 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/nl_stopwords.json +415 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/no_stopwords.json +223 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/pl_stopwords.json +331 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/pt_stopwords.json +562 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/ro_stopwords.json +436 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/ru_stopwords.json +561 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/si_stopwords.json +193 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/sk_stopwords.json +420 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/sl_stopwords.json +448 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/so_stopwords.json +32 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/st_stopwords.json +33 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/sv_stopwords.json +420 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/sw_stopwords.json +76 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/ta_stopwords.json +129 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/te_stopwords.json +54 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/th_stopwords.json +118 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/tl_stopwords.json +149 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/tr_stopwords.json +506 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/uk_stopwords.json +75 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/ur_stopwords.json +519 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/vi_stopwords.json +647 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/yo_stopwords.json +62 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/zh_stopwords.json +796 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/stopwords/zu_stopwords.json +31 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/api_extract_multipart.rs +52 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/api_tests.rs +966 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/archive_integration.rs +545 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/batch_orchestration.rs +556 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/batch_processing.rs +318 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/bibtex_parity_test.rs +421 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/concurrency_stress.rs +533 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/config_features.rs +612 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/config_loading_tests.rs +416 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/core_integration.rs +510 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/csv_integration.rs +414 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/docbook_extractor_tests.rs +500 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/docx_metadata_extraction_test.rs +122 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/docx_vs_pandoc_comparison.rs +370 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/email_integration.rs +327 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/epub_native_extractor_tests.rs +275 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/error_handling.rs +402 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/fictionbook_extractor_tests.rs +228 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/format_integration.rs +164 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/helpers/mod.rs +142 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/html_table_test.rs +551 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/image_integration.rs +255 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/instrumentation_test.rs +139 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/jats_extractor_tests.rs +639 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/jupyter_extractor_tests.rs +704 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/keywords_integration.rs +479 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/keywords_quality.rs +509 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/latex_extractor_tests.rs +496 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/markdown_extractor_tests.rs +490 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/mime_detection.rs +429 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/ocr_configuration.rs +514 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/ocr_errors.rs +698 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/ocr_quality.rs +629 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/ocr_stress.rs +469 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/odt_extractor_tests.rs +674 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/opml_extractor_tests.rs +616 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/orgmode_extractor_tests.rs +822 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/pdf_integration.rs +45 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/pdfium_linking.rs +374 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/pipeline_integration.rs +1436 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/plugin_ocr_backend_test.rs +776 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/plugin_postprocessor_test.rs +560 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/plugin_system.rs +927 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/plugin_validator_test.rs +783 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/registry_integration_tests.rs +587 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/rst_extractor_tests.rs +694 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/rtf_extractor_tests.rs +775 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/security_validation.rs +416 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/stopwords_integration_test.rs +888 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/test_fastembed.rs +631 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/typst_behavioral_tests.rs +1260 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/typst_extractor_tests.rs +648 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg/tests/xlsx_metadata_extraction_test.rs +87 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg-py/Cargo.toml +33 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg-py/README.md +310 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg-py/benches/async_patterns_benchmark.py +98 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg-py/build.rs +15 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg-py/src/config.rs +2197 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg-py/src/core.rs +522 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg-py/src/error.rs +375 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg-py/src/ffi.rs +31 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg-py/src/lib.rs +360 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg-py/src/plugins.rs +1884 -0
- kreuzberg-4.0.0rc15/crates/kreuzberg-py/src/types.rs +415 -0
- kreuzberg-4.0.0rc15/kreuzberg/__init__.py +739 -0
- kreuzberg-4.0.0rc15/kreuzberg/__main__.py +160 -0
- kreuzberg-4.0.0rc15/kreuzberg/_internal_bindings.pyi +1298 -0
- kreuzberg-4.0.0rc15/kreuzberg/_setup_lib_path.py +143 -0
- kreuzberg-4.0.0rc15/kreuzberg/exceptions.py +254 -0
- kreuzberg-4.0.0rc15/kreuzberg/ocr/__init__.py +25 -0
- kreuzberg-4.0.0rc15/kreuzberg/ocr/easyocr.py +371 -0
- kreuzberg-4.0.0rc15/kreuzberg/ocr/paddleocr.py +284 -0
- kreuzberg-4.0.0rc15/kreuzberg/ocr/protocol.py +150 -0
- kreuzberg-4.0.0rc15/kreuzberg/postprocessors/__init__.py +61 -0
- kreuzberg-4.0.0rc15/kreuzberg/postprocessors/protocol.py +83 -0
- kreuzberg-4.0.0rc15/kreuzberg/py.typed +0 -0
- kreuzberg-4.0.0rc15/kreuzberg/types.py +480 -0
- kreuzberg-4.0.0rc15/pyproject.toml +110 -0
There are too many changes on this page to be displayed.
The number of changes on this page would crash your browser.
You can still verify the content by downloading the package file manually.