nv-ingest-api 2025.10.9.dev20251009__tar.gz → 2025.10.11.dev20251011__tar.gz
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of nv-ingest-api might be problematic. Click here for more details.
- {nv_ingest_api-2025.10.9.dev20251009/src/nv_ingest_api.egg-info → nv_ingest_api-2025.10.11.dev20251011}/PKG-INFO +1 -1
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/image/chart_extractor.py +7 -3
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/image/infographic_extractor.py +7 -3
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/image/table_extractor.py +7 -3
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/ocr.py +9 -2
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/nim_client.py +0 -3
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/meta/ingest_job_schema.py +5 -1
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/service_clients/rest/rest_client.py +9 -2
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011/src/nv_ingest_api.egg-info}/PKG-INFO +1 -1
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/LICENSE +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/MANIFEST.in +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/README.md +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/pyproject.toml +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/setup.cfg +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/interface/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/interface/extract.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/interface/mutate.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/interface/store.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/interface/transform.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/interface/utility.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/enums/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/enums/common.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/audio/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/audio/audio_extraction.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/docx/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/docx/docx_extractor.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/docx/engines/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/docx/engines/docxreader_helpers/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/docx/engines/docxreader_helpers/docx_helper.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/docx/engines/docxreader_helpers/docxreader.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/html/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/html/html_extractor.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/image/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/image/image_extractor.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/image/image_helpers/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/image/image_helpers/common.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/engines/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/engines/adobe.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/engines/llama.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/engines/nemoretriever.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/engines/pdf_helpers/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/engines/pdfium.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/engines/tika.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/engines/unstructured_io.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/pdf_extractor.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pptx/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pptx/engines/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pptx/engines/pptx_helper.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pptx/pptx_extractor.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/meta/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/meta/udf.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/mutate/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/mutate/deduplicate.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/mutate/filter.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/control_message_task.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/ingest_control_message.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/default_values.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/cached.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/decorators.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/deplot.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/helpers.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/nemoretriever_parse.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/parakeet.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/text_embedding.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/vlm.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/yolox.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/nim_model_interface.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/tracing/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/tracing/latency.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/tracing/logging.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/tracing/tagging.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_audio_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_chart_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_docx_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_html_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_image_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_infographic_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_pdf_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_pptx_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_table_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/message_brokers/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/message_brokers/message_broker_client_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/message_brokers/request_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/message_brokers/response_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/meta/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/meta/base_model_noext.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/meta/metadata_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/meta/udf.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/mutate/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/mutate/mutate_image_dedup_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/store/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/store/store_embedding_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/store/store_image_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/transform/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/transform/transform_image_caption_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/transform/transform_image_filter_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/transform/transform_text_embedding_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/transform/transform_text_splitter_schema.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/store/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/store/embed_text_upload.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/store/image_upload.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/transform/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/transform/caption_image.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/transform/embed_text.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/transform/split_text.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/control_message/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/control_message/validators.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/converters/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/converters/bytetools.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/converters/containers.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/converters/datetools.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/converters/dftools.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/converters/formats.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/converters/type_mappings.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/dataloader/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/dataloader/dataloader.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/detectors/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/detectors/language.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/exception_handlers/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/exception_handlers/converters.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/exception_handlers/decorators.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/exception_handlers/detectors.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/exception_handlers/pdf.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/exception_handlers/schemas.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/image_processing/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/image_processing/clustering.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/image_processing/processing.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/image_processing/table_and_chart.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/image_processing/transforms.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/imports/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/imports/callable_signatures.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/imports/dynamic_resolvers.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/introspection/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/introspection/class_inspect.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/introspection/function_inspect.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/logging/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/logging/configuration.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/logging/sanitize.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/message_brokers/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/message_brokers/simple_message_broker/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/message_brokers/simple_message_broker/broker.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/message_brokers/simple_message_broker/ordered_message_queue.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/message_brokers/simple_message_broker/simple_client.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/metadata/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/metadata/aggregators.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/multi_processing/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/multi_processing/mp_pool_singleton.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/nim/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/pdf/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/pdf/pdfium.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/schema/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/schema/schema_validator.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/service_clients/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/service_clients/client_base.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/service_clients/kafka/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/service_clients/redis/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/service_clients/redis/redis_client.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/service_clients/rest/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/string_processing/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/string_processing/configuration.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/string_processing/yaml.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/system/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/system/hardware_info.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api.egg-info/SOURCES.txt +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api.egg-info/dependency_links.txt +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api.egg-info/requires.txt +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api.egg-info/top_level.txt +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/udfs/__init__.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/udfs/llm_summarizer_udf.py +0 -0
- {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/version.py +0 -0
|
@@ -97,7 +97,7 @@ def _run_chart_inference(
|
|
|
97
97
|
model_name="paddle",
|
|
98
98
|
max_batch_size=1 if ocr_client.protocol == "grpc" else 2,
|
|
99
99
|
)
|
|
100
|
-
elif ocr_model_name
|
|
100
|
+
elif ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"}:
|
|
101
101
|
future_ocr_kwargs.update(
|
|
102
102
|
model_name=ocr_model_name,
|
|
103
103
|
input_names=["INPUT_IMAGE_URLS", "MERGE_LEVELS"],
|
|
@@ -237,7 +237,9 @@ def _create_ocr_client(
|
|
|
237
237
|
auth_token: str,
|
|
238
238
|
) -> NimClient:
|
|
239
239
|
ocr_model_interface = (
|
|
240
|
-
NemoRetrieverOCRModelInterface()
|
|
240
|
+
NemoRetrieverOCRModelInterface()
|
|
241
|
+
if ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"}
|
|
242
|
+
else PaddleOCRModelInterface()
|
|
241
243
|
)
|
|
242
244
|
|
|
243
245
|
ocr_client = create_inference_client(
|
|
@@ -245,7 +247,9 @@ def _create_ocr_client(
|
|
|
245
247
|
model_interface=ocr_model_interface,
|
|
246
248
|
auth_token=auth_token,
|
|
247
249
|
infer_protocol=ocr_protocol,
|
|
248
|
-
enable_dynamic_batching=(
|
|
250
|
+
enable_dynamic_batching=(
|
|
251
|
+
True if ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"} else False
|
|
252
|
+
),
|
|
249
253
|
dynamic_batch_memory_budget_mb=32,
|
|
250
254
|
)
|
|
251
255
|
|
|
@@ -107,7 +107,7 @@ def _update_infographic_metadata(
|
|
|
107
107
|
model_name="paddle",
|
|
108
108
|
max_batch_size=1 if ocr_client.protocol == "grpc" else 2,
|
|
109
109
|
)
|
|
110
|
-
elif ocr_model_name
|
|
110
|
+
elif ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"}:
|
|
111
111
|
infer_kwargs.update(
|
|
112
112
|
model_name=ocr_model_name,
|
|
113
113
|
input_names=["INPUT_IMAGE_URLS", "MERGE_LEVELS"],
|
|
@@ -152,7 +152,9 @@ def _create_ocr_client(
|
|
|
152
152
|
auth_token: str,
|
|
153
153
|
) -> NimClient:
|
|
154
154
|
ocr_model_interface = (
|
|
155
|
-
NemoRetrieverOCRModelInterface()
|
|
155
|
+
NemoRetrieverOCRModelInterface()
|
|
156
|
+
if ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"}
|
|
157
|
+
else PaddleOCRModelInterface()
|
|
156
158
|
)
|
|
157
159
|
|
|
158
160
|
ocr_client = create_inference_client(
|
|
@@ -160,7 +162,9 @@ def _create_ocr_client(
|
|
|
160
162
|
model_interface=ocr_model_interface,
|
|
161
163
|
auth_token=auth_token,
|
|
162
164
|
infer_protocol=ocr_protocol,
|
|
163
|
-
enable_dynamic_batching=(
|
|
165
|
+
enable_dynamic_batching=(
|
|
166
|
+
True if ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"} else False
|
|
167
|
+
),
|
|
164
168
|
dynamic_batch_memory_budget_mb=32,
|
|
165
169
|
)
|
|
166
170
|
|
|
@@ -99,7 +99,7 @@ def _run_inference(
|
|
|
99
99
|
model_name="paddle",
|
|
100
100
|
max_batch_size=1 if ocr_client.protocol == "grpc" else 2,
|
|
101
101
|
)
|
|
102
|
-
elif ocr_model_name
|
|
102
|
+
elif ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"}:
|
|
103
103
|
future_ocr_kwargs.update(
|
|
104
104
|
model_name=ocr_model_name,
|
|
105
105
|
input_names=["INPUT_IMAGE_URLS", "MERGE_LEVELS"],
|
|
@@ -246,7 +246,9 @@ def _create_ocr_client(
|
|
|
246
246
|
auth_token: str,
|
|
247
247
|
) -> NimClient:
|
|
248
248
|
ocr_model_interface = (
|
|
249
|
-
NemoRetrieverOCRModelInterface()
|
|
249
|
+
NemoRetrieverOCRModelInterface()
|
|
250
|
+
if ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"}
|
|
251
|
+
else PaddleOCRModelInterface()
|
|
250
252
|
)
|
|
251
253
|
|
|
252
254
|
ocr_client = create_inference_client(
|
|
@@ -254,7 +256,9 @@ def _create_ocr_client(
|
|
|
254
256
|
model_interface=ocr_model_interface,
|
|
255
257
|
auth_token=auth_token,
|
|
256
258
|
infer_protocol=ocr_protocol,
|
|
257
|
-
enable_dynamic_batching=(
|
|
259
|
+
enable_dynamic_batching=(
|
|
260
|
+
True if ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"} else False
|
|
261
|
+
),
|
|
258
262
|
dynamic_batch_memory_budget_mb=32,
|
|
259
263
|
)
|
|
260
264
|
|
|
@@ -21,7 +21,10 @@ from nv_ingest_api.internal.primitives.nim.model_interface.helpers import prepro
|
|
|
21
21
|
from nv_ingest_api.util.image_processing.transforms import base64_to_numpy
|
|
22
22
|
|
|
23
23
|
DEFAULT_OCR_MODEL_NAME = "paddle"
|
|
24
|
-
NEMORETRIEVER_OCR_MODEL_NAME = "
|
|
24
|
+
NEMORETRIEVER_OCR_MODEL_NAME = "scene_text_wrapper"
|
|
25
|
+
NEMORETRIEVER_OCR_ENSEMBLE_MODEL_NAME = "scene_text_ensemble"
|
|
26
|
+
NEMORETRIEVER_OCR_BLS_MODEL_NAME = "scene_text_python"
|
|
27
|
+
|
|
25
28
|
|
|
26
29
|
logger = logging.getLogger(__name__)
|
|
27
30
|
|
|
@@ -231,7 +234,11 @@ class OCRModelInterfaceBase(ModelInterface):
|
|
|
231
234
|
if not isinstance(response, np.ndarray):
|
|
232
235
|
raise ValueError("Unexpected response format: response is not a NumPy array.")
|
|
233
236
|
|
|
234
|
-
if model_name
|
|
237
|
+
if model_name in [
|
|
238
|
+
NEMORETRIEVER_OCR_MODEL_NAME,
|
|
239
|
+
NEMORETRIEVER_OCR_ENSEMBLE_MODEL_NAME,
|
|
240
|
+
NEMORETRIEVER_OCR_BLS_MODEL_NAME,
|
|
241
|
+
]:
|
|
235
242
|
response = response.transpose((1, 0))
|
|
236
243
|
|
|
237
244
|
# If we have shape (3,), convert to (3, 1)
|
|
@@ -121,9 +121,6 @@ class NimClient:
|
|
|
121
121
|
if model_name == "yolox_ensemble":
|
|
122
122
|
model_name = "yolox"
|
|
123
123
|
|
|
124
|
-
if model_name == "scene_text_ensemble":
|
|
125
|
-
model_name = "scene_text_pre"
|
|
126
|
-
|
|
127
124
|
if model_name in self._max_batch_sizes:
|
|
128
125
|
return self._max_batch_sizes[model_name]
|
|
129
126
|
|
|
@@ -24,8 +24,12 @@ logger = logging.getLogger(__name__)
|
|
|
24
24
|
# Tracing Options Schema
|
|
25
25
|
class TracingOptionsSchema(BaseModelNoExt):
|
|
26
26
|
trace: bool = False
|
|
27
|
-
ts_send: int
|
|
27
|
+
ts_send: Optional[int] = None
|
|
28
28
|
trace_id: Optional[str] = None
|
|
29
|
+
# V2 PDF splitting support
|
|
30
|
+
parent_job_id: Optional[str] = None
|
|
31
|
+
page_num: Optional[int] = None
|
|
32
|
+
total_pages: Optional[int] = None
|
|
29
33
|
|
|
30
34
|
|
|
31
35
|
# Ingest Task Schemas
|
|
@@ -3,6 +3,7 @@
|
|
|
3
3
|
# SPDX-License-Identifier: Apache-2.0
|
|
4
4
|
|
|
5
5
|
import logging
|
|
6
|
+
import os
|
|
6
7
|
import re
|
|
7
8
|
import time
|
|
8
9
|
from typing import Any, Union, Tuple, Optional, Dict, Callable
|
|
@@ -137,13 +138,19 @@ class RestClient(MessageBrokerClientBase):
|
|
|
137
138
|
)
|
|
138
139
|
self._client = requests.Session()
|
|
139
140
|
|
|
140
|
-
|
|
141
|
-
|
|
141
|
+
# Allow API version override via environment variable or kwargs
|
|
142
|
+
api_version = kwargs.get("api_version") or os.getenv("NV_INGEST_API_VERSION", "v1")
|
|
143
|
+
self._api_version = api_version
|
|
144
|
+
self._submit_endpoint: str = f"/{api_version}/submit_job"
|
|
145
|
+
self._fetch_endpoint: str = f"/{api_version}/fetch_job"
|
|
142
146
|
self._base_url: str = kwargs.get("base_url") or self._generate_url(self._host, self._port)
|
|
143
147
|
self._headers = kwargs.get("headers", {})
|
|
144
148
|
self._auth = kwargs.get("auth", None)
|
|
145
149
|
|
|
146
150
|
logger.debug(f"RestClient base URL set to: {self._base_url}")
|
|
151
|
+
logger.info(
|
|
152
|
+
f"RestClient using API version: {api_version} (endpoints: {self._submit_endpoint}, {self._fetch_endpoint})"
|
|
153
|
+
)
|
|
147
154
|
|
|
148
155
|
@staticmethod
|
|
149
156
|
def _generate_url(host: str, port: int) -> str:
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/udfs/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|