nv-ingest-api 2025.10.15.dev20251015__tar.gz → 2025.10.17.dev20251017__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of nv-ingest-api might be problematic. Click here for more details.
- {nv_ingest_api-2025.10.15.dev20251015/src/nv_ingest_api.egg-info → nv_ingest_api-2025.10.17.dev20251017}/PKG-INFO +1 -1
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/nim/model_interface/ocr.py +2 -2
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017/src/nv_ingest_api.egg-info}/PKG-INFO +1 -1
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/udfs/llm_summarizer_udf.py +9 -8
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/LICENSE +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/MANIFEST.in +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/README.md +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/pyproject.toml +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/setup.cfg +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/interface/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/interface/extract.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/interface/mutate.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/interface/store.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/interface/transform.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/interface/utility.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/enums/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/enums/common.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/audio/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/audio/audio_extraction.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/docx/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/docx/docx_extractor.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/docx/engines/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/docx/engines/docxreader_helpers/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/docx/engines/docxreader_helpers/docx_helper.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/docx/engines/docxreader_helpers/docxreader.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/html/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/html/html_extractor.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/image/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/image/chart_extractor.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/image/image_extractor.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/image/image_helpers/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/image/image_helpers/common.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/image/infographic_extractor.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/image/table_extractor.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/pdf/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/pdf/engines/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/pdf/engines/adobe.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/pdf/engines/llama.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/pdf/engines/nemoretriever.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/pdf/engines/pdf_helpers/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/pdf/engines/pdfium.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/pdf/engines/tika.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/pdf/engines/unstructured_io.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/pdf/pdf_extractor.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/pptx/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/pptx/engines/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/pptx/engines/pptx_helper.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/extract/pptx/pptx_extractor.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/meta/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/meta/udf.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/mutate/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/mutate/deduplicate.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/mutate/filter.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/control_message_task.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/ingest_control_message.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/nim/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/nim/default_values.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/nim/model_interface/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/nim/model_interface/cached.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/nim/model_interface/decorators.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/nim/model_interface/deplot.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/nim/model_interface/helpers.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/nim/model_interface/nemoretriever_parse.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/nim/model_interface/parakeet.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/nim/model_interface/text_embedding.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/nim/model_interface/vlm.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/nim/model_interface/yolox.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/nim/nim_client.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/nim/nim_model_interface.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/tracing/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/tracing/latency.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/tracing/logging.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/primitives/tracing/tagging.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/extract/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/extract/extract_audio_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/extract/extract_chart_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/extract/extract_docx_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/extract/extract_html_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/extract/extract_image_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/extract/extract_infographic_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/extract/extract_pdf_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/extract/extract_pptx_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/extract/extract_table_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/message_brokers/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/message_brokers/message_broker_client_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/message_brokers/request_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/message_brokers/response_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/meta/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/meta/base_model_noext.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/meta/ingest_job_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/meta/metadata_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/meta/udf.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/mutate/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/mutate/mutate_image_dedup_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/store/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/store/store_embedding_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/store/store_image_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/transform/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/transform/transform_image_caption_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/transform/transform_image_filter_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/transform/transform_text_embedding_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/schemas/transform/transform_text_splitter_schema.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/store/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/store/embed_text_upload.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/store/image_upload.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/transform/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/transform/caption_image.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/transform/embed_text.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/internal/transform/split_text.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/control_message/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/control_message/validators.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/converters/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/converters/bytetools.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/converters/containers.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/converters/datetools.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/converters/dftools.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/converters/formats.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/converters/type_mappings.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/dataloader/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/dataloader/dataloader.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/detectors/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/detectors/language.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/exception_handlers/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/exception_handlers/converters.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/exception_handlers/decorators.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/exception_handlers/detectors.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/exception_handlers/pdf.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/exception_handlers/schemas.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/image_processing/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/image_processing/clustering.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/image_processing/processing.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/image_processing/table_and_chart.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/image_processing/transforms.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/imports/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/imports/callable_signatures.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/imports/dynamic_resolvers.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/introspection/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/introspection/class_inspect.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/introspection/function_inspect.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/logging/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/logging/configuration.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/logging/sanitize.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/message_brokers/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/message_brokers/simple_message_broker/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/message_brokers/simple_message_broker/broker.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/message_brokers/simple_message_broker/ordered_message_queue.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/message_brokers/simple_message_broker/simple_client.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/metadata/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/metadata/aggregators.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/multi_processing/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/multi_processing/mp_pool_singleton.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/nim/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/pdf/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/pdf/pdfium.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/schema/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/schema/schema_validator.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/service_clients/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/service_clients/client_base.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/service_clients/kafka/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/service_clients/redis/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/service_clients/redis/redis_client.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/service_clients/rest/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/service_clients/rest/rest_client.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/string_processing/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/string_processing/configuration.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/string_processing/yaml.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/system/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api/util/system/hardware_info.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api.egg-info/SOURCES.txt +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api.egg-info/dependency_links.txt +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api.egg-info/requires.txt +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/nv_ingest_api.egg-info/top_level.txt +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/udfs/__init__.py +0 -0
- {nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/version.py +0 -0
|
@@ -758,8 +758,8 @@ def get_ocr_model_name(ocr_grpc_endpoint=None, default_model_name=DEFAULT_OCR_MO
|
|
|
758
758
|
if ocr_model_name is not None:
|
|
759
759
|
return ocr_model_name
|
|
760
760
|
|
|
761
|
-
# 2. If no gRPC endpoint is provided, fall back to the default immediately.
|
|
762
|
-
if not ocr_grpc_endpoint:
|
|
761
|
+
# 2. If no gRPC endpoint is provided or the endpoint is an NVCF endpoint, fall back to the default immediately.
|
|
762
|
+
if (not ocr_grpc_endpoint) or ("grpc.nvcf.nvidia.com" in ocr_grpc_endpoint):
|
|
763
763
|
logger.debug(f"No OCR gRPC endpoint provided. Falling back to default model name '{default_model_name}'.")
|
|
764
764
|
return default_model_name
|
|
765
765
|
|
|
@@ -2,8 +2,9 @@
|
|
|
2
2
|
"""
|
|
3
3
|
LLM Content Summarizer UDF for NV-Ingest Pipeline
|
|
4
4
|
|
|
5
|
-
|
|
6
|
-
|
|
5
|
+
Generates document summaries using NVIDIA-hosted LLMs. This production UDF demonstrates how to extract the pipeline
|
|
6
|
+
payload, run custom code (summarization), and inject results into the metadata for downstream use cases (such as
|
|
7
|
+
retrieval).
|
|
7
8
|
|
|
8
9
|
These variables can be set in the environment before running the pipeline. These can be treated as kwargs.
|
|
9
10
|
- NVIDIA_API_KEY: API key for NVIDIA NIM endpoints (required)
|
|
@@ -14,16 +15,14 @@ These variables can be set in the environment before running the pipeline. These
|
|
|
14
15
|
- MAX_CONTENT_LENGTH: Maximum content length to send to API (default: 12000)
|
|
15
16
|
TODO: Implement this
|
|
16
17
|
- NUM_CHUNKS: (Optional) Number of first and last pages to summarize. default=1
|
|
18
|
+
|
|
19
|
+
More info can be found in `examples/udfs/README.md`
|
|
17
20
|
"""
|
|
18
21
|
|
|
19
22
|
import logging
|
|
20
23
|
import os
|
|
21
24
|
import time
|
|
22
25
|
|
|
23
|
-
# REMOVE BEFORE MERGING
|
|
24
|
-
# import yaml
|
|
25
|
-
# from pathlib import Path
|
|
26
|
-
|
|
27
26
|
|
|
28
27
|
logger = logging.getLogger(__name__)
|
|
29
28
|
|
|
@@ -85,6 +84,7 @@ def content_summarizer(control_message: "IngestControlMessage") -> "IngestContro
|
|
|
85
84
|
# According to docs/docs/extraction/user_defined_functions.md#understanding-the-dataframe-payload
|
|
86
85
|
# the rows are not necessarily pages. they are chunks of data extracted from the document. in order to select
|
|
87
86
|
# pages, it must require parsing the payload to see which chunks correspond to which pages
|
|
87
|
+
original_df = df.copy()
|
|
88
88
|
if len(df) > 1:
|
|
89
89
|
# TODO: add feature to select N first and last chunks
|
|
90
90
|
df = df.iloc[[0, -1]]
|
|
@@ -108,10 +108,11 @@ def content_summarizer(control_message: "IngestControlMessage") -> "IngestContro
|
|
|
108
108
|
if not stats["failed"]:
|
|
109
109
|
stats["tokens"] = _estimate_tokens(content)
|
|
110
110
|
logger.info("Summarized %d tokens in %f seconds using %s", stats["tokens"], stats["duration"], model_name)
|
|
111
|
-
_store_summary(
|
|
111
|
+
_store_summary(original_df, summary, model_name)
|
|
112
112
|
|
|
113
113
|
# Update the control message with modified DataFrame
|
|
114
|
-
control_message.payload(
|
|
114
|
+
control_message.payload(original_df)
|
|
115
|
+
|
|
115
116
|
else:
|
|
116
117
|
logger.warning("%s failed to summarize content", model_name)
|
|
117
118
|
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/pyproject.toml
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/udfs/__init__.py
RENAMED
|
File without changes
|
{nv_ingest_api-2025.10.15.dev20251015 → nv_ingest_api-2025.10.17.dev20251017}/src/version.py
RENAMED
|
File without changes
|