kreuzberg 3.13.1__tar.gz → 3.13.2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/PKG-INFO +1 -1
- kreuzberg-3.13.2/docker-logs/docker-info.txt +60 -0
- kreuzberg-3.13.2/docker-logs/docker-version.txt +27 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/cli.py +2 -2
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/pyproject.toml +1 -1
- kreuzberg-3.13.2/test_report.json +16 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/gmft_test.py +1 -1
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/uv.lock +2 -2
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/.commitlintrc +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/.deepsource.toml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/.docker/Dockerfile +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/.docker/README.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/.dockerignore +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/.github/dependabot.yaml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/.github/workflows/ci.yaml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/.github/workflows/docker-e2e-tests.yml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/.github/workflows/docs.yml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/.github/workflows/pr-title.yaml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/.github/workflows/publish-docker.yml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/.github/workflows/release.yaml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/.github/workflows/test-docker-builds.yml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/.gitignore +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/.markdownlint.yaml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/.pre-commit-config.yaml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/LICENSE +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/README.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/Taskfile.yml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/ai-rulez.yaml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/benchmarks/README.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/benchmarks/__init__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/benchmarks/pyproject.toml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/benchmarks/src/__init__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/benchmarks/src/__main__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/benchmarks/src/benchmarks.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/benchmarks/src/cli.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/benchmarks/src/models.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/benchmarks/src/profiler.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/benchmarks/src/runner.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docker-compose.example.yml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/advanced/custom-extractors.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/advanced/custom-hooks.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/advanced/error-handling.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/advanced/index.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/advanced/performance.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/api-reference/exceptions.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/api-reference/extraction-functions.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/api-reference/extractor-registry.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/api-reference/index.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/api-reference/ocr-configuration.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/api-reference/types.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/assets/favicon.png +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/assets/logo.png +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/cli.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/contributing.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/css/extra.css +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/examples/extraction-examples.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/examples/index.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/getting-started/index.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/getting-started/installation.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/getting-started/quick-start.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/index.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/user-guide/api-server.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/user-guide/basic-usage.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/user-guide/chunking.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/user-guide/docker.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/user-guide/document-classification.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/user-guide/extraction-configuration.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/user-guide/index.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/user-guide/mcp-server.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/user-guide/metadata-extraction.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/user-guide/ocr-backends.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/user-guide/ocr-configuration.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/docs/user-guide/supported-formats.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/__init__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/__main__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_api/__init__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_api/main.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_chunker.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_config.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_constants.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_document_classification.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_entity_extraction.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_extractors/__init__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_extractors/_base.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_extractors/_email.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_extractors/_html.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_extractors/_image.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_extractors/_pandoc.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_extractors/_pdf.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_extractors/_presentation.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_extractors/_spread_sheet.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_extractors/_structured.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_gmft.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_language_detection.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_mcp/__init__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_mcp/server.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_mime_types.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_ocr/__init__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_ocr/_base.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_ocr/_easyocr.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_ocr/_paddleocr.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_ocr/_table_extractor.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_ocr/_tesseract.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_playa.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_registry.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_types.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_utils/__init__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_utils/_cache.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_utils/_device.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_utils/_document_cache.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_utils/_errors.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_utils/_ocr_cache.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_utils/_pdf_lock.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_utils/_process_pool.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_utils/_quality.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_utils/_ref.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_utils/_serialization.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_utils/_string.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_utils/_sync.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_utils/_table.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/_utils/_tmp.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/exceptions.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/extraction.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/kreuzberg/py.typed +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/mkdocs.yaml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/output.txt +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/results/baseline.json +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/results/serialization.json +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/results/statistical.json +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/__init__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/api/__init__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/api/conftest.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/api/main_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/api/runtime_config_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/chunker_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/cli_command_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/cli_integration_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/cli_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/config_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/conftest.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/document_classification_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/e2e/__init__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/e2e/docker_e2e_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/entity_extraction_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/exceptions_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/extraction_batch_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/extraction_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/extractors/__init__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/extractors/email_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/extractors/html_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/extractors/image_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/extractors/pandoc_metadata_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/extractors/pandoc_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/extractors/pdf_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/extractors/presentation_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/extractors/spreed_sheet_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/extractors/structured_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/gmft_extended_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/hooks_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/html_to_markdown_config_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/language_detection_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/mcp_server_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/mime_types_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/multiprocessing/__init__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/multiprocessing/gmft_integration_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/multiprocessing/gmft_isolated_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/multiprocessing/process_manager_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/multiprocessing/tesseract_pool_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/ocr/__init__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/ocr/base_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/ocr/device_integration_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/ocr/easyocr_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/ocr/init_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/ocr/paddleocr_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/ocr/tesseract_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/ocr/tesseract_tsv_integration_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/ocr/tesseract_tsv_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/playa_helpers_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/playa_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/registry_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/tesseract_sync_formats_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/contract.txt +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/contract_test.txt +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/document.docx +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/email/sample-email.eml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/excel-multi-sheet.xlsx +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/excel.xlsx +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/flower-no-text.jpg +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/form_test.txt +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/french-text.txt +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/german-text.txt +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/html.html +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/images/test_hello_world.png +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/invoice_image.png +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/invoice_test.txt +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/json/sample-document.json +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/layout-parser-ocr.jpg +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/markdown.md +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/non-ascii-text.pdf +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/non-searchable.pdf +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/ocr-image.jpg +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/pdfs_with_tables/large.pdf +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/pdfs_with_tables/medium.pdf +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/pdfs_with_tables/tiny.pdf +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/pitch-deck-presentation.pptx +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/receipt_test.txt +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/report_test.txt +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/sample-contract.pdf +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/scanned.pdf +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/searchable.pdf +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/spanish-text.txt +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/tables/borderless_table.png +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/tables/complex_document.png +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/tables/simple_table.png +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/test-article.pdf +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/test_source_files/yaml/sample-config.yaml +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/types_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/utils/__init__.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/utils/cache_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/utils/device_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/utils/errors_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/utils/ocr_cache_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/utils/pdf_lock_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/utils/process_pool_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/utils/ref_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/utils/serialization_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/utils/string_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/utils/sync_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/utils/table_test.py +0 -0
- {kreuzberg-3.13.1 → kreuzberg-3.13.2}/tests/utils/tmp_test.py +0 -0
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: kreuzberg
|
3
|
-
Version: 3.13.1
|
3
|
+
Version: 3.13.2
|
4
4
|
Summary: Document intelligence framework for Python - Extract text, metadata, and structured data from diverse file formats
|
5
5
|
Project-URL: documentation, https://kreuzberg.dev
|
6
6
|
Project-URL: homepage, https://github.com/Goldziher/kreuzberg
|
@@ -0,0 +1,60 @@
|
|
1
|
+
Client: Docker Engine - Community
|
2
|
+
Version: 28.0.4
|
3
|
+
Context: default
|
4
|
+
Debug Mode: false
|
5
|
+
Plugins:
|
6
|
+
buildx: Docker Buildx (Docker Inc.)
|
7
|
+
Version: v0.27.0
|
8
|
+
Path: /usr/libexec/docker/cli-plugins/docker-buildx
|
9
|
+
compose: Docker Compose (Docker Inc.)
|
10
|
+
Version: v2.38.2
|
11
|
+
Path: /usr/libexec/docker/cli-plugins/docker-compose
|
12
|
+
|
13
|
+
Server:
|
14
|
+
Containers: 1
|
15
|
+
Running: 1
|
16
|
+
Paused: 0
|
17
|
+
Stopped: 0
|
18
|
+
Images: 2
|
19
|
+
Server Version: 28.0.4
|
20
|
+
Storage Driver: overlay2
|
21
|
+
Backing Filesystem: extfs
|
22
|
+
Supports d_type: true
|
23
|
+
Using metacopy: false
|
24
|
+
Native Overlay Diff: false
|
25
|
+
userxattr: false
|
26
|
+
Logging Driver: json-file
|
27
|
+
Cgroup Driver: systemd
|
28
|
+
Cgroup Version: 2
|
29
|
+
Plugins:
|
30
|
+
Volume: local
|
31
|
+
Network: bridge host ipvlan macvlan null overlay
|
32
|
+
Log: awslogs fluentd gcplogs gelf journald json-file local splunk syslog
|
33
|
+
Swarm: inactive
|
34
|
+
Runtimes: io.containerd.runc.v2 runc
|
35
|
+
Default Runtime: runc
|
36
|
+
Init Binary: docker-init
|
37
|
+
containerd version: 05044ec0a9a75232cad458027ca83437aae3f4da
|
38
|
+
runc version: v1.2.5-0-g59923ef
|
39
|
+
init version: de40ad0
|
40
|
+
Security Options:
|
41
|
+
apparmor
|
42
|
+
seccomp
|
43
|
+
Profile: builtin
|
44
|
+
cgroupns
|
45
|
+
Kernel Version: 6.11.0-1018-azure
|
46
|
+
Operating System: Ubuntu 24.04.3 LTS
|
47
|
+
OSType: linux
|
48
|
+
Architecture: x86_64
|
49
|
+
CPUs: 4
|
50
|
+
Total Memory: 15.62GiB
|
51
|
+
Name: pkrvm7jw40e0xgp
|
52
|
+
ID: 33a18c03-7dc8-4ab9-bfe1-99342b7c1aaf
|
53
|
+
Docker Root Dir: /var/lib/docker
|
54
|
+
Debug Mode: false
|
55
|
+
Username: githubactions
|
56
|
+
Experimental: false
|
57
|
+
Insecure Registries:
|
58
|
+
::1/128
|
59
|
+
127.0.0.0/8
|
60
|
+
Live Restore Enabled: false
|
@@ -0,0 +1,27 @@
|
|
1
|
+
Client: Docker Engine - Community
|
2
|
+
Version: 28.0.4
|
3
|
+
API version: 1.48
|
4
|
+
Go version: go1.23.7
|
5
|
+
Git commit: b8034c0
|
6
|
+
Built: Tue Mar 25 15:07:16 2025
|
7
|
+
OS/Arch: linux/amd64
|
8
|
+
Context: default
|
9
|
+
|
10
|
+
Server: Docker Engine - Community
|
11
|
+
Engine:
|
12
|
+
Version: 28.0.4
|
13
|
+
API version: 1.48 (minimum version 1.24)
|
14
|
+
Go version: go1.23.7
|
15
|
+
Git commit: 6430e49
|
16
|
+
Built: Tue Mar 25 15:07:16 2025
|
17
|
+
OS/Arch: linux/amd64
|
18
|
+
Experimental: false
|
19
|
+
containerd:
|
20
|
+
Version: 1.7.27
|
21
|
+
GitCommit: 05044ec0a9a75232cad458027ca83437aae3f4da
|
22
|
+
runc:
|
23
|
+
Version: 1.2.5
|
24
|
+
GitCommit: v1.2.5-0-g59923ef
|
25
|
+
docker-init:
|
26
|
+
Version: 0.19.0
|
27
|
+
GitCommit: de40ad0
|
@@ -265,7 +265,7 @@ def cli(ctx: click.Context) -> None:
|
|
265
265
|
@click.option("--easyocr-languages", help="EasyOCR language codes (comma-separated, e.g., 'en,de')")
|
266
266
|
@click.option("--paddleocr-languages", help="PaddleOCR language codes (comma-separated, e.g., 'en,german')")
|
267
267
|
@click.pass_context
|
268
|
-
def extract(ctx: click.Context) -> None:
|
268
|
+
def extract(ctx: click.Context, /, **kwargs: Any) -> None:
|
269
269
|
"""Extract text from a document.
|
270
270
|
|
271
271
|
FILE can be a path to a document or '-' to read from stdin.
|
@@ -279,7 +279,7 @@ def extract(ctx: click.Context) -> None:
|
|
279
279
|
|
280
280
|
extraction_config = build_extraction_config(file_config, cli_args)
|
281
281
|
|
282
|
-
result = _perform_extraction(
|
282
|
+
result = _perform_extraction(kwargs.get("file"), extraction_config, params["verbose"])
|
283
283
|
|
284
284
|
_write_output(result, params["output"], params["show_metadata"], params["output_format"], params["verbose"])
|
285
285
|
|
@@ -5,7 +5,7 @@ requires = [ "hatchling" ]
|
|
5
5
|
|
6
6
|
[project]
|
7
7
|
name = "kreuzberg"
|
8
|
-
version = "3.13.1"
|
8
|
+
version = "3.13.2"
|
9
9
|
description = "Document intelligence framework for Python - Extract text, metadata, and structured data from diverse file formats"
|
10
10
|
readme = "README.md"
|
11
11
|
keywords = [
|
@@ -0,0 +1,16 @@
|
|
1
|
+
{
|
2
|
+
"base": {
|
3
|
+
"exists": true,
|
4
|
+
"cli_help": true,
|
5
|
+
"cli_version": true,
|
6
|
+
"api_health": true,
|
7
|
+
"extract_txt": false,
|
8
|
+
"extract_pdf": false,
|
9
|
+
"extract_docx": false,
|
10
|
+
"ocr": false,
|
11
|
+
"api_extract": true,
|
12
|
+
"volume_security": true,
|
13
|
+
"resource_limits": true,
|
14
|
+
"malicious_input": true
|
15
|
+
}
|
16
|
+
}
|
@@ -621,7 +621,7 @@ def test_gmft_inline_extraction_edge_cases_sync_empty_cropped_tables(tiny_pdf_wi
|
|
621
621
|
pytest.skip("Testing inline extraction, but isolated mode is enabled")
|
622
622
|
|
623
623
|
try:
|
624
|
-
from gmft.auto import AutoTableDetector
|
624
|
+
from gmft.auto import AutoTableDetector # type: ignore[attr-defined]
|
625
625
|
|
626
626
|
with patch.object(AutoTableDetector, "extract", return_value=[]):
|
627
627
|
result = extract_tables_sync(tiny_pdf_with_tables, use_isolated_process=False)
|
@@ -957,7 +957,7 @@ name = "exceptiongroup"
|
|
957
957
|
version = "1.3.0"
|
958
958
|
source = { registry = "https://pypi.org/simple" }
|
959
959
|
dependencies = [
|
960
|
-
{ name = "typing-extensions", marker = "python_full_version < '3.
|
960
|
+
{ name = "typing-extensions", marker = "python_full_version < '3.11'" },
|
961
961
|
]
|
962
962
|
sdist = { url = "https://files.pythonhosted.org/packages/0b/9f/a65090624ecf468cdca03533906e7c69ed7588582240cfe7cc9e770b50eb/exceptiongroup-1.3.0.tar.gz", hash = "sha256:b241f5885f560bc56a59ee63ca4c6a8bfa46ae4ad651af316d4e81817bb9fd88", size = 29749, upload-time = "2025-05-10T17:42:51.123Z" }
|
963
963
|
wheels = [
|
@@ -1633,7 +1633,7 @@ wheels = [
|
|
1633
1633
|
|
1634
1634
|
[[package]]
|
1635
1635
|
name = "kreuzberg"
|
1636
|
-
version = "3.13.1"
|
1636
|
+
version = "3.13.2"
|
1637
1637
|
source = { editable = "." }
|
1638
1638
|
dependencies = [
|
1639
1639
|
{ name = "anyio" },
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|