nv-ingest-api 2025.10.9.dev20251009__tar.gz → 2025.10.11.dev20251011__tar.gz

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of nv-ingest-api might be problematic. Click here for more details.

Files changed (180)
  1. {nv_ingest_api-2025.10.9.dev20251009/src/nv_ingest_api.egg-info → nv_ingest_api-2025.10.11.dev20251011}/PKG-INFO +1 -1
  2. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/image/chart_extractor.py +7 -3
  3. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/image/infographic_extractor.py +7 -3
  4. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/image/table_extractor.py +7 -3
  5. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/ocr.py +9 -2
  6. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/nim_client.py +0 -3
  7. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/meta/ingest_job_schema.py +5 -1
  8. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/service_clients/rest/rest_client.py +9 -2
  9. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011/src/nv_ingest_api.egg-info}/PKG-INFO +1 -1
  10. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/LICENSE +0 -0
  11. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/MANIFEST.in +0 -0
  12. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/README.md +0 -0
  13. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/pyproject.toml +0 -0
  14. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/setup.cfg +0 -0
  15. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/__init__.py +0 -0
  16. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/interface/__init__.py +0 -0
  17. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/interface/extract.py +0 -0
  18. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/interface/mutate.py +0 -0
  19. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/interface/store.py +0 -0
  20. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/interface/transform.py +0 -0
  21. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/interface/utility.py +0 -0
  22. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/__init__.py +0 -0
  23. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/enums/__init__.py +0 -0
  24. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/enums/common.py +0 -0
  25. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/__init__.py +0 -0
  26. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/audio/__init__.py +0 -0
  27. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/audio/audio_extraction.py +0 -0
  28. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/docx/__init__.py +0 -0
  29. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/docx/docx_extractor.py +0 -0
  30. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/docx/engines/__init__.py +0 -0
  31. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/docx/engines/docxreader_helpers/__init__.py +0 -0
  32. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/docx/engines/docxreader_helpers/docx_helper.py +0 -0
  33. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/docx/engines/docxreader_helpers/docxreader.py +0 -0
  34. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/html/__init__.py +0 -0
  35. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/html/html_extractor.py +0 -0
  36. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/image/__init__.py +0 -0
  37. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/image/image_extractor.py +0 -0
  38. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/image/image_helpers/__init__.py +0 -0
  39. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/image/image_helpers/common.py +0 -0
  40. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/__init__.py +0 -0
  41. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/engines/__init__.py +0 -0
  42. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/engines/adobe.py +0 -0
  43. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/engines/llama.py +0 -0
  44. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/engines/nemoretriever.py +0 -0
  45. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/engines/pdf_helpers/__init__.py +0 -0
  46. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/engines/pdfium.py +0 -0
  47. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/engines/tika.py +0 -0
  48. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/engines/unstructured_io.py +0 -0
  49. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pdf/pdf_extractor.py +0 -0
  50. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pptx/__init__.py +0 -0
  51. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pptx/engines/__init__.py +0 -0
  52. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pptx/engines/pptx_helper.py +0 -0
  53. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/extract/pptx/pptx_extractor.py +0 -0
  54. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/meta/__init__.py +0 -0
  55. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/meta/udf.py +0 -0
  56. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/mutate/__init__.py +0 -0
  57. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/mutate/deduplicate.py +0 -0
  58. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/mutate/filter.py +0 -0
  59. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/__init__.py +0 -0
  60. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/control_message_task.py +0 -0
  61. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/ingest_control_message.py +0 -0
  62. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/__init__.py +0 -0
  63. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/default_values.py +0 -0
  64. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/__init__.py +0 -0
  65. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/cached.py +0 -0
  66. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/decorators.py +0 -0
  67. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/deplot.py +0 -0
  68. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/helpers.py +0 -0
  69. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/nemoretriever_parse.py +0 -0
  70. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/parakeet.py +0 -0
  71. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/text_embedding.py +0 -0
  72. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/vlm.py +0 -0
  73. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/model_interface/yolox.py +0 -0
  74. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/nim/nim_model_interface.py +0 -0
  75. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/tracing/__init__.py +0 -0
  76. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/tracing/latency.py +0 -0
  77. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/tracing/logging.py +0 -0
  78. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/primitives/tracing/tagging.py +0 -0
  79. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/__init__.py +0 -0
  80. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/__init__.py +0 -0
  81. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_audio_schema.py +0 -0
  82. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_chart_schema.py +0 -0
  83. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_docx_schema.py +0 -0
  84. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_html_schema.py +0 -0
  85. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_image_schema.py +0 -0
  86. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_infographic_schema.py +0 -0
  87. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_pdf_schema.py +0 -0
  88. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_pptx_schema.py +0 -0
  89. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/extract/extract_table_schema.py +0 -0
  90. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/message_brokers/__init__.py +0 -0
  91. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/message_brokers/message_broker_client_schema.py +0 -0
  92. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/message_brokers/request_schema.py +0 -0
  93. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/message_brokers/response_schema.py +0 -0
  94. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/meta/__init__.py +0 -0
  95. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/meta/base_model_noext.py +0 -0
  96. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/meta/metadata_schema.py +0 -0
  97. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/meta/udf.py +0 -0
  98. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/mutate/__init__.py +0 -0
  99. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/mutate/mutate_image_dedup_schema.py +0 -0
  100. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/store/__init__.py +0 -0
  101. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/store/store_embedding_schema.py +0 -0
  102. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/store/store_image_schema.py +0 -0
  103. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/transform/__init__.py +0 -0
  104. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/transform/transform_image_caption_schema.py +0 -0
  105. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/transform/transform_image_filter_schema.py +0 -0
  106. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/transform/transform_text_embedding_schema.py +0 -0
  107. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/schemas/transform/transform_text_splitter_schema.py +0 -0
  108. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/store/__init__.py +0 -0
  109. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/store/embed_text_upload.py +0 -0
  110. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/store/image_upload.py +0 -0
  111. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/transform/__init__.py +0 -0
  112. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/transform/caption_image.py +0 -0
  113. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/transform/embed_text.py +0 -0
  114. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/internal/transform/split_text.py +0 -0
  115. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/__init__.py +0 -0
  116. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/control_message/__init__.py +0 -0
  117. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/control_message/validators.py +0 -0
  118. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/converters/__init__.py +0 -0
  119. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/converters/bytetools.py +0 -0
  120. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/converters/containers.py +0 -0
  121. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/converters/datetools.py +0 -0
  122. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/converters/dftools.py +0 -0
  123. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/converters/formats.py +0 -0
  124. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/converters/type_mappings.py +0 -0
  125. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/dataloader/__init__.py +0 -0
  126. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/dataloader/dataloader.py +0 -0
  127. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/detectors/__init__.py +0 -0
  128. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/detectors/language.py +0 -0
  129. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/exception_handlers/__init__.py +0 -0
  130. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/exception_handlers/converters.py +0 -0
  131. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/exception_handlers/decorators.py +0 -0
  132. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/exception_handlers/detectors.py +0 -0
  133. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/exception_handlers/pdf.py +0 -0
  134. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/exception_handlers/schemas.py +0 -0
  135. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/image_processing/__init__.py +0 -0
  136. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/image_processing/clustering.py +0 -0
  137. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/image_processing/processing.py +0 -0
  138. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/image_processing/table_and_chart.py +0 -0
  139. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/image_processing/transforms.py +0 -0
  140. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/imports/__init__.py +0 -0
  141. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/imports/callable_signatures.py +0 -0
  142. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/imports/dynamic_resolvers.py +0 -0
  143. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/introspection/__init__.py +0 -0
  144. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/introspection/class_inspect.py +0 -0
  145. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/introspection/function_inspect.py +0 -0
  146. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/logging/__init__.py +0 -0
  147. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/logging/configuration.py +0 -0
  148. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/logging/sanitize.py +0 -0
  149. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/message_brokers/__init__.py +0 -0
  150. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/message_brokers/simple_message_broker/__init__.py +0 -0
  151. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/message_brokers/simple_message_broker/broker.py +0 -0
  152. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/message_brokers/simple_message_broker/ordered_message_queue.py +0 -0
  153. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/message_brokers/simple_message_broker/simple_client.py +0 -0
  154. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/metadata/__init__.py +0 -0
  155. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/metadata/aggregators.py +0 -0
  156. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/multi_processing/__init__.py +0 -0
  157. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/multi_processing/mp_pool_singleton.py +0 -0
  158. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/nim/__init__.py +0 -0
  159. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/pdf/__init__.py +0 -0
  160. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/pdf/pdfium.py +0 -0
  161. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/schema/__init__.py +0 -0
  162. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/schema/schema_validator.py +0 -0
  163. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/service_clients/__init__.py +0 -0
  164. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/service_clients/client_base.py +0 -0
  165. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/service_clients/kafka/__init__.py +0 -0
  166. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/service_clients/redis/__init__.py +0 -0
  167. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/service_clients/redis/redis_client.py +0 -0
  168. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/service_clients/rest/__init__.py +0 -0
  169. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/string_processing/__init__.py +0 -0
  170. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/string_processing/configuration.py +0 -0
  171. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/string_processing/yaml.py +0 -0
  172. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/system/__init__.py +0 -0
  173. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api/util/system/hardware_info.py +0 -0
  174. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api.egg-info/SOURCES.txt +0 -0
  175. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api.egg-info/dependency_links.txt +0 -0
  176. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api.egg-info/requires.txt +0 -0
  177. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/nv_ingest_api.egg-info/top_level.txt +0 -0
  178. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/udfs/__init__.py +0 -0
  179. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/udfs/llm_summarizer_udf.py +0 -0
  180. {nv_ingest_api-2025.10.9.dev20251009 → nv_ingest_api-2025.10.11.dev20251011}/src/version.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: nv-ingest-api
3
- Version: 2025.10.9.dev20251009
3
+ Version: 2025.10.11.dev20251011
4
4
  Summary: Python module with core document ingestion functions.
5
5
  Author-email: Jeremy Dyer <jdyer@nvidia.com>
6
6
  License: Apache License
@@ -97,7 +97,7 @@ def _run_chart_inference(
97
97
  model_name="paddle",
98
98
  max_batch_size=1 if ocr_client.protocol == "grpc" else 2,
99
99
  )
100
- elif ocr_model_name == "scene_text_ensemble":
100
+ elif ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"}:
101
101
  future_ocr_kwargs.update(
102
102
  model_name=ocr_model_name,
103
103
  input_names=["INPUT_IMAGE_URLS", "MERGE_LEVELS"],
@@ -237,7 +237,9 @@ def _create_ocr_client(
237
237
  auth_token: str,
238
238
  ) -> NimClient:
239
239
  ocr_model_interface = (
240
- NemoRetrieverOCRModelInterface() if ocr_model_name == "scene_text_ensemble" else PaddleOCRModelInterface()
240
+ NemoRetrieverOCRModelInterface()
241
+ if ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"}
242
+ else PaddleOCRModelInterface()
241
243
  )
242
244
 
243
245
  ocr_client = create_inference_client(
@@ -245,7 +247,9 @@ def _create_ocr_client(
245
247
  model_interface=ocr_model_interface,
246
248
  auth_token=auth_token,
247
249
  infer_protocol=ocr_protocol,
248
- enable_dynamic_batching=(True if ocr_model_name == "scene_text_ensemble" else False),
250
+ enable_dynamic_batching=(
251
+ True if ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"} else False
252
+ ),
249
253
  dynamic_batch_memory_budget_mb=32,
250
254
  )
251
255
 
@@ -107,7 +107,7 @@ def _update_infographic_metadata(
107
107
  model_name="paddle",
108
108
  max_batch_size=1 if ocr_client.protocol == "grpc" else 2,
109
109
  )
110
- elif ocr_model_name == "scene_text_ensemble":
110
+ elif ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"}:
111
111
  infer_kwargs.update(
112
112
  model_name=ocr_model_name,
113
113
  input_names=["INPUT_IMAGE_URLS", "MERGE_LEVELS"],
@@ -152,7 +152,9 @@ def _create_ocr_client(
152
152
  auth_token: str,
153
153
  ) -> NimClient:
154
154
  ocr_model_interface = (
155
- NemoRetrieverOCRModelInterface() if ocr_model_name == "scene_text_ensemble" else PaddleOCRModelInterface()
155
+ NemoRetrieverOCRModelInterface()
156
+ if ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"}
157
+ else PaddleOCRModelInterface()
156
158
  )
157
159
 
158
160
  ocr_client = create_inference_client(
@@ -160,7 +162,9 @@ def _create_ocr_client(
160
162
  model_interface=ocr_model_interface,
161
163
  auth_token=auth_token,
162
164
  infer_protocol=ocr_protocol,
163
- enable_dynamic_batching=(True if ocr_model_name == "scene_text_ensemble" else False),
165
+ enable_dynamic_batching=(
166
+ True if ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"} else False
167
+ ),
164
168
  dynamic_batch_memory_budget_mb=32,
165
169
  )
166
170
 
@@ -99,7 +99,7 @@ def _run_inference(
99
99
  model_name="paddle",
100
100
  max_batch_size=1 if ocr_client.protocol == "grpc" else 2,
101
101
  )
102
- elif ocr_model_name == "scene_text_ensemble":
102
+ elif ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"}:
103
103
  future_ocr_kwargs.update(
104
104
  model_name=ocr_model_name,
105
105
  input_names=["INPUT_IMAGE_URLS", "MERGE_LEVELS"],
@@ -246,7 +246,9 @@ def _create_ocr_client(
246
246
  auth_token: str,
247
247
  ) -> NimClient:
248
248
  ocr_model_interface = (
249
- NemoRetrieverOCRModelInterface() if ocr_model_name == "scene_text_ensemble" else PaddleOCRModelInterface()
249
+ NemoRetrieverOCRModelInterface()
250
+ if ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"}
251
+ else PaddleOCRModelInterface()
250
252
  )
251
253
 
252
254
  ocr_client = create_inference_client(
@@ -254,7 +256,9 @@ def _create_ocr_client(
254
256
  model_interface=ocr_model_interface,
255
257
  auth_token=auth_token,
256
258
  infer_protocol=ocr_protocol,
257
- enable_dynamic_batching=(True if ocr_model_name == "scene_text_ensemble" else False),
259
+ enable_dynamic_batching=(
260
+ True if ocr_model_name in {"scene_text_ensemble", "scene_text_wrapper", "scene_text_python"} else False
261
+ ),
258
262
  dynamic_batch_memory_budget_mb=32,
259
263
  )
260
264
 
@@ -21,7 +21,10 @@ from nv_ingest_api.internal.primitives.nim.model_interface.helpers import prepro
21
21
  from nv_ingest_api.util.image_processing.transforms import base64_to_numpy
22
22
 
23
23
  DEFAULT_OCR_MODEL_NAME = "paddle"
24
- NEMORETRIEVER_OCR_MODEL_NAME = "scene_text_ensemble"
24
+ NEMORETRIEVER_OCR_MODEL_NAME = "scene_text_wrapper"
25
+ NEMORETRIEVER_OCR_ENSEMBLE_MODEL_NAME = "scene_text_ensemble"
26
+ NEMORETRIEVER_OCR_BLS_MODEL_NAME = "scene_text_python"
27
+
25
28
 
26
29
  logger = logging.getLogger(__name__)
27
30
 
@@ -231,7 +234,11 @@ class OCRModelInterfaceBase(ModelInterface):
231
234
  if not isinstance(response, np.ndarray):
232
235
  raise ValueError("Unexpected response format: response is not a NumPy array.")
233
236
 
234
- if model_name == NEMORETRIEVER_OCR_MODEL_NAME:
237
+ if model_name in [
238
+ NEMORETRIEVER_OCR_MODEL_NAME,
239
+ NEMORETRIEVER_OCR_ENSEMBLE_MODEL_NAME,
240
+ NEMORETRIEVER_OCR_BLS_MODEL_NAME,
241
+ ]:
235
242
  response = response.transpose((1, 0))
236
243
 
237
244
  # If we have shape (3,), convert to (3, 1)
@@ -121,9 +121,6 @@ class NimClient:
121
121
  if model_name == "yolox_ensemble":
122
122
  model_name = "yolox"
123
123
 
124
- if model_name == "scene_text_ensemble":
125
- model_name = "scene_text_pre"
126
-
127
124
  if model_name in self._max_batch_sizes:
128
125
  return self._max_batch_sizes[model_name]
129
126
 
@@ -24,8 +24,12 @@ logger = logging.getLogger(__name__)
24
24
  # Tracing Options Schema
25
25
  class TracingOptionsSchema(BaseModelNoExt):
26
26
  trace: bool = False
27
- ts_send: int
27
+ ts_send: Optional[int] = None
28
28
  trace_id: Optional[str] = None
29
+ # V2 PDF splitting support
30
+ parent_job_id: Optional[str] = None
31
+ page_num: Optional[int] = None
32
+ total_pages: Optional[int] = None
29
33
 
30
34
 
31
35
  # Ingest Task Schemas
@@ -3,6 +3,7 @@
3
3
  # SPDX-License-Identifier: Apache-2.0
4
4
 
5
5
  import logging
6
+ import os
6
7
  import re
7
8
  import time
8
9
  from typing import Any, Union, Tuple, Optional, Dict, Callable
@@ -137,13 +138,19 @@ class RestClient(MessageBrokerClientBase):
137
138
  )
138
139
  self._client = requests.Session()
139
140
 
140
- self._submit_endpoint: str = "/v1/submit_job"
141
- self._fetch_endpoint: str = "/v1/fetch_job"
141
+ # Allow API version override via environment variable or kwargs
142
+ api_version = kwargs.get("api_version") or os.getenv("NV_INGEST_API_VERSION", "v1")
143
+ self._api_version = api_version
144
+ self._submit_endpoint: str = f"/{api_version}/submit_job"
145
+ self._fetch_endpoint: str = f"/{api_version}/fetch_job"
142
146
  self._base_url: str = kwargs.get("base_url") or self._generate_url(self._host, self._port)
143
147
  self._headers = kwargs.get("headers", {})
144
148
  self._auth = kwargs.get("auth", None)
145
149
 
146
150
  logger.debug(f"RestClient base URL set to: {self._base_url}")
151
+ logger.info(
152
+ f"RestClient using API version: {api_version} (endpoints: {self._submit_endpoint}, {self._fetch_endpoint})"
153
+ )
147
154
 
148
155
  @staticmethod
149
156
  def _generate_url(host: str, port: int) -> str:
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: nv-ingest-api
3
- Version: 2025.10.9.dev20251009
3
+ Version: 2025.10.11.dev20251011
4
4
  Summary: Python module with core document ingestion functions.
5
5
  Author-email: Jeremy Dyer <jdyer@nvidia.com>
6
6
  License: Apache License