nv-ingest-api 2025.8.18.dev20250818__tar.gz → 2025.8.20.dev20250820__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of nv-ingest-api might be problematic. Click here for more details.

Files changed (176)
  1. {nv_ingest_api-2025.8.18.dev20250818/src/nv_ingest_api.egg-info → nv_ingest_api-2025.8.20.dev20250820}/PKG-INFO +1 -1
  2. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/pdf/engines/llama.py +4 -1
  3. nv_ingest_api-2025.8.20.dev20250820/src/nv_ingest_api/internal/schemas/transform/transform_image_caption_schema.py +33 -0
  4. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/transform/transform_text_embedding_schema.py +15 -2
  5. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/transform/embed_text.py +4 -1
  6. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820/src/nv_ingest_api.egg-info}/PKG-INFO +1 -1
  7. nv_ingest_api-2025.8.18.dev20250818/src/nv_ingest_api/internal/schemas/transform/transform_image_caption_schema.py +0 -15
  8. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/LICENSE +0 -0
  9. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/MANIFEST.in +0 -0
  10. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/README.md +0 -0
  11. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/pyproject.toml +0 -0
  12. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/setup.cfg +0 -0
  13. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/__init__.py +0 -0
  14. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/interface/__init__.py +0 -0
  15. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/interface/extract.py +0 -0
  16. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/interface/mutate.py +0 -0
  17. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/interface/store.py +0 -0
  18. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/interface/transform.py +0 -0
  19. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/interface/utility.py +0 -0
  20. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/__init__.py +0 -0
  21. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/enums/__init__.py +0 -0
  22. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/enums/common.py +0 -0
  23. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/__init__.py +0 -0
  24. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/audio/__init__.py +0 -0
  25. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/audio/audio_extraction.py +0 -0
  26. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/docx/__init__.py +0 -0
  27. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/docx/docx_extractor.py +0 -0
  28. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/docx/engines/__init__.py +0 -0
  29. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/docx/engines/docxreader_helpers/__init__.py +0 -0
  30. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/docx/engines/docxreader_helpers/docx_helper.py +0 -0
  31. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/docx/engines/docxreader_helpers/docxreader.py +0 -0
  32. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/html/__init__.py +0 -0
  33. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/html/html_extractor.py +0 -0
  34. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/image/__init__.py +0 -0
  35. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/image/chart_extractor.py +0 -0
  36. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/image/image_extractor.py +0 -0
  37. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/image/image_helpers/__init__.py +0 -0
  38. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/image/image_helpers/common.py +0 -0
  39. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/image/infographic_extractor.py +0 -0
  40. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/image/table_extractor.py +0 -0
  41. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/pdf/__init__.py +0 -0
  42. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/pdf/engines/__init__.py +0 -0
  43. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/pdf/engines/adobe.py +0 -0
  44. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/pdf/engines/nemoretriever.py +0 -0
  45. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/pdf/engines/pdf_helpers/__init__.py +0 -0
  46. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/pdf/engines/pdfium.py +0 -0
  47. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/pdf/engines/tika.py +0 -0
  48. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/pdf/engines/unstructured_io.py +0 -0
  49. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/pdf/pdf_extractor.py +0 -0
  50. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/pptx/__init__.py +0 -0
  51. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/pptx/engines/__init__.py +0 -0
  52. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/pptx/engines/pptx_helper.py +0 -0
  53. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/extract/pptx/pptx_extractor.py +0 -0
  54. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/meta/__init__.py +0 -0
  55. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/meta/udf.py +0 -0
  56. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/mutate/__init__.py +0 -0
  57. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/mutate/deduplicate.py +0 -0
  58. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/mutate/filter.py +0 -0
  59. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/__init__.py +0 -0
  60. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/control_message_task.py +0 -0
  61. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/ingest_control_message.py +0 -0
  62. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/nim/__init__.py +0 -0
  63. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/nim/default_values.py +0 -0
  64. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/nim/model_interface/__init__.py +0 -0
  65. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/nim/model_interface/cached.py +0 -0
  66. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/nim/model_interface/decorators.py +0 -0
  67. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/nim/model_interface/deplot.py +0 -0
  68. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/nim/model_interface/helpers.py +0 -0
  69. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/nim/model_interface/nemoretriever_parse.py +0 -0
  70. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/nim/model_interface/ocr.py +0 -0
  71. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/nim/model_interface/parakeet.py +0 -0
  72. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/nim/model_interface/text_embedding.py +0 -0
  73. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/nim/model_interface/vlm.py +0 -0
  74. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/nim/model_interface/yolox.py +0 -0
  75. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/nim/nim_client.py +0 -0
  76. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/nim/nim_model_interface.py +0 -0
  77. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/tracing/__init__.py +0 -0
  78. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/tracing/latency.py +0 -0
  79. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/tracing/logging.py +0 -0
  80. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/primitives/tracing/tagging.py +0 -0
  81. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/__init__.py +0 -0
  82. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/extract/__init__.py +0 -0
  83. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/extract/extract_audio_schema.py +0 -0
  84. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/extract/extract_chart_schema.py +0 -0
  85. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/extract/extract_docx_schema.py +0 -0
  86. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/extract/extract_html_schema.py +0 -0
  87. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/extract/extract_image_schema.py +0 -0
  88. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/extract/extract_infographic_schema.py +0 -0
  89. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/extract/extract_pdf_schema.py +0 -0
  90. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/extract/extract_pptx_schema.py +0 -0
  91. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/extract/extract_table_schema.py +0 -0
  92. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/message_brokers/__init__.py +0 -0
  93. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/message_brokers/message_broker_client_schema.py +0 -0
  94. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/message_brokers/request_schema.py +0 -0
  95. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/message_brokers/response_schema.py +0 -0
  96. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/meta/__init__.py +0 -0
  97. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/meta/base_model_noext.py +0 -0
  98. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/meta/ingest_job_schema.py +0 -0
  99. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/meta/metadata_schema.py +0 -0
  100. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/meta/udf.py +0 -0
  101. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/mutate/__init__.py +0 -0
  102. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/mutate/mutate_image_dedup_schema.py +0 -0
  103. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/store/__init__.py +0 -0
  104. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/store/store_embedding_schema.py +0 -0
  105. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/store/store_image_schema.py +0 -0
  106. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/transform/__init__.py +0 -0
  107. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/transform/transform_image_filter_schema.py +0 -0
  108. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/schemas/transform/transform_text_splitter_schema.py +0 -0
  109. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/store/__init__.py +0 -0
  110. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/store/embed_text_upload.py +0 -0
  111. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/store/image_upload.py +0 -0
  112. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/transform/__init__.py +0 -0
  113. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/transform/caption_image.py +0 -0
  114. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/internal/transform/split_text.py +0 -0
  115. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/__init__.py +0 -0
  116. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/control_message/__init__.py +0 -0
  117. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/control_message/validators.py +0 -0
  118. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/converters/__init__.py +0 -0
  119. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/converters/bytetools.py +0 -0
  120. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/converters/containers.py +0 -0
  121. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/converters/datetools.py +0 -0
  122. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/converters/dftools.py +0 -0
  123. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/converters/formats.py +0 -0
  124. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/converters/type_mappings.py +0 -0
  125. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/detectors/__init__.py +0 -0
  126. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/detectors/language.py +0 -0
  127. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/exception_handlers/__init__.py +0 -0
  128. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/exception_handlers/converters.py +0 -0
  129. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/exception_handlers/decorators.py +0 -0
  130. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/exception_handlers/detectors.py +0 -0
  131. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/exception_handlers/pdf.py +0 -0
  132. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/exception_handlers/schemas.py +0 -0
  133. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/image_processing/__init__.py +0 -0
  134. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/image_processing/clustering.py +0 -0
  135. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/image_processing/processing.py +0 -0
  136. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/image_processing/table_and_chart.py +0 -0
  137. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/image_processing/transforms.py +0 -0
  138. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/imports/__init__.py +0 -0
  139. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/imports/callable_signatures.py +0 -0
  140. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/imports/dynamic_resolvers.py +0 -0
  141. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/introspection/__init__.py +0 -0
  142. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/introspection/class_inspect.py +0 -0
  143. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/introspection/function_inspect.py +0 -0
  144. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/logging/__init__.py +0 -0
  145. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/logging/configuration.py +0 -0
  146. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/message_brokers/__init__.py +0 -0
  147. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/message_brokers/simple_message_broker/__init__.py +0 -0
  148. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/message_brokers/simple_message_broker/broker.py +0 -0
  149. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/message_brokers/simple_message_broker/ordered_message_queue.py +0 -0
  150. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/message_brokers/simple_message_broker/simple_client.py +0 -0
  151. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/metadata/__init__.py +0 -0
  152. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/metadata/aggregators.py +0 -0
  153. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/multi_processing/__init__.py +0 -0
  154. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/multi_processing/mp_pool_singleton.py +0 -0
  155. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/nim/__init__.py +0 -0
  156. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/pdf/__init__.py +0 -0
  157. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/pdf/pdfium.py +0 -0
  158. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/schema/__init__.py +0 -0
  159. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/schema/schema_validator.py +0 -0
  160. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/service_clients/__init__.py +0 -0
  161. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/service_clients/client_base.py +0 -0
  162. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/service_clients/kafka/__init__.py +0 -0
  163. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/service_clients/redis/__init__.py +0 -0
  164. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/service_clients/redis/redis_client.py +0 -0
  165. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/service_clients/rest/__init__.py +0 -0
  166. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/service_clients/rest/rest_client.py +0 -0
  167. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/string_processing/__init__.py +0 -0
  168. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/string_processing/configuration.py +0 -0
  169. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/string_processing/yaml.py +0 -0
  170. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/system/__init__.py +0 -0
  171. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api/util/system/hardware_info.py +0 -0
  172. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api.egg-info/SOURCES.txt +0 -0
  173. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api.egg-info/dependency_links.txt +0 -0
  174. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api.egg-info/requires.txt +0 -0
  175. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/nv_ingest_api.egg-info/top_level.txt +0 -0
  176. {nv_ingest_api-2025.8.18.dev20250818 → nv_ingest_api-2025.8.20.dev20250820}/src/version.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: nv-ingest-api
3
- Version: 2025.8.18.dev20250818
3
+ Version: 2025.8.20.dev20250820
4
4
  Summary: Python module with core document ingestion functions.
5
5
  Author-email: Jeremy Dyer <jdyer@nvidia.com>
6
6
  License: Apache License
@@ -193,7 +193,10 @@ async def async_llama_parse(
193
193
  A string of extracted text.
194
194
  """
195
195
  base_url = "https://api.cloud.llamaindex.ai/api/parsing"
196
- headers = {"Authorization": f"Bearer {api_key}"}
196
+ # Normalize in case api_key contains only whitespace; avoid sending an empty bearer token
197
+ _token = (api_key or "").strip()
198
+ _auth_value = f"Bearer {_token}" if _token else "Bearer <no key provided>"
199
+ headers = {"Authorization": _auth_value}
197
200
  mime_type = "application/pdf"
198
201
 
199
202
  try:
@@ -0,0 +1,33 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2024, NVIDIA CORPORATION & AFFILIATES.
2
+ # All rights reserved.
3
+ # SPDX-License-Identifier: Apache-2.0
4
+
5
+
6
+ from pydantic import ConfigDict, BaseModel, model_validator, field_validator
7
+
8
+
9
+ class ImageCaptionExtractionSchema(BaseModel):
10
+ api_key: str = ""
11
+ endpoint_url: str = "https://integrate.api.nvidia.com/v1/chat/completions"
12
+ prompt: str = "Caption the content of this image:"
13
+ model_name: str = "nvidia/llama-3.1-nemotron-nano-vl-8b-v1"
14
+ raise_on_failure: bool = False
15
+ model_config = ConfigDict(extra="forbid")
16
+
17
+ @field_validator("api_key", mode="before")
18
+ @classmethod
19
+ def _coerce_api_key_none(cls, v):
20
+ return "" if v is None else v
21
+
22
+ @model_validator(mode="before")
23
+ @classmethod
24
+ def _coerce_none_to_empty(cls, values):
25
+ """Allow None for string fields where empty string is acceptable.
26
+
27
+ Specifically, convert api_key=None to api_key="" so validation passes
28
+ when no API key is supplied.
29
+ """
30
+ if isinstance(values, dict):
31
+ if values.get("api_key") is None:
32
+ values["api_key"] = ""
33
+ return values
@@ -5,7 +5,7 @@
5
5
 
6
6
  import logging
7
7
 
8
- from pydantic import ConfigDict, BaseModel, Field
8
+ from pydantic import ConfigDict, BaseModel, Field, model_validator, field_validator
9
9
 
10
10
  from nv_ingest_api.util.logging.configuration import LogLevel
11
11
 
@@ -13,7 +13,7 @@ logger = logging.getLogger(__name__)
13
13
 
14
14
 
15
15
  class TextEmbeddingSchema(BaseModel):
16
- api_key: str = Field(default="api_key")
16
+ api_key: str = Field(default="")
17
17
  batch_size: int = Field(default=4)
18
18
  embedding_model: str = Field(default="nvidia/llama-3.2-nv-embedqa-1b-v2")
19
19
  embedding_nim_endpoint: str = Field(default="http://embedding:8000/v1")
@@ -28,3 +28,16 @@ class TextEmbeddingSchema(BaseModel):
28
28
  audio_elements_modality: str = Field(default="text")
29
29
 
30
30
  model_config = ConfigDict(extra="forbid")
31
+
32
+ @field_validator("api_key", mode="before")
33
+ @classmethod
34
+ def _coerce_api_key_none(cls, v):
35
+ return "" if v is None else v
36
+
37
+ @model_validator(mode="before")
38
+ @classmethod
39
+ def _coerce_none_to_empty(cls, values):
40
+ """Convert api_key=None to empty string so validation passes when key is omitted."""
41
+ if isinstance(values, dict) and values.get("api_key") is None:
42
+ values["api_key"] = ""
43
+ return values
@@ -75,8 +75,11 @@ def _make_async_request(
75
75
  response = {}
76
76
 
77
77
  try:
78
+ # Normalize API key to avoid sending an empty bearer token via SDK internals
79
+ _token = (api_key or "").strip()
80
+ _api_key = _token if _token else "<no key provided>"
78
81
  client = OpenAI(
79
- api_key=api_key,
82
+ api_key=_api_key,
80
83
  base_url=embedding_nim_endpoint,
81
84
  )
82
85
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: nv-ingest-api
3
- Version: 2025.8.18.dev20250818
3
+ Version: 2025.8.20.dev20250820
4
4
  Summary: Python module with core document ingestion functions.
5
5
  Author-email: Jeremy Dyer <jdyer@nvidia.com>
6
6
  License: Apache License
@@ -1,15 +0,0 @@
1
- # SPDX-FileCopyrightText: Copyright (c) 2024, NVIDIA CORPORATION & AFFILIATES.
2
- # All rights reserved.
3
- # SPDX-License-Identifier: Apache-2.0
4
-
5
-
6
- from pydantic import ConfigDict, BaseModel
7
-
8
-
9
- class ImageCaptionExtractionSchema(BaseModel):
10
- api_key: str = "api_key"
11
- endpoint_url: str = "https://integrate.api.nvidia.com/v1/chat/completions"
12
- prompt: str = "Caption the content of this image:"
13
- model_name: str = "nvidia/llama-3.1-nemotron-nano-vl-8b-v1"
14
- raise_on_failure: bool = False
15
- model_config = ConfigDict(extra="forbid")