nv-ingest-api 2025.5.11.dev20250511__tar.gz → 2025.5.12.dev20250512__tar.gz

This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Potentially problematic release.


This version of nv-ingest-api might be problematic. Click here for more details.

Files changed (159)
  1. {nv_ingest_api-2025.5.11.dev20250511/src/nv_ingest_api.egg-info → nv_ingest_api-2025.5.12.dev20250512}/PKG-INFO +1 -1
  2. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/nim/model_interface/text_embedding.py +35 -37
  3. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/nim/nim_client.py +17 -9
  4. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512/src/nv_ingest_api.egg-info}/PKG-INFO +1 -1
  5. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/LICENSE +0 -0
  6. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/MANIFEST.in +0 -0
  7. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/README.md +0 -0
  8. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/pyproject.toml +0 -0
  9. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/setup.cfg +0 -0
  10. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/__init__.py +0 -0
  11. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/interface/__init__.py +0 -0
  12. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/interface/extract.py +0 -0
  13. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/interface/mutate.py +0 -0
  14. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/interface/store.py +0 -0
  15. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/interface/transform.py +0 -0
  16. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/interface/utility.py +0 -0
  17. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/__init__.py +0 -0
  18. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/enums/__init__.py +0 -0
  19. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/enums/common.py +0 -0
  20. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/__init__.py +0 -0
  21. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/audio/__init__.py +0 -0
  22. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/audio/audio_extraction.py +0 -0
  23. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/docx/__init__.py +0 -0
  24. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/docx/docx_extractor.py +0 -0
  25. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/docx/engines/__init__.py +0 -0
  26. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/docx/engines/docxreader_helpers/__init__.py +0 -0
  27. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/docx/engines/docxreader_helpers/docx_helper.py +0 -0
  28. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/docx/engines/docxreader_helpers/docxreader.py +0 -0
  29. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/image/__init__.py +0 -0
  30. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/image/chart_extractor.py +0 -0
  31. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/image/image_extractor.py +0 -0
  32. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/image/image_helpers/__init__.py +0 -0
  33. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/image/image_helpers/common.py +0 -0
  34. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/image/infographic_extractor.py +0 -0
  35. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/image/table_extractor.py +0 -0
  36. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/pdf/__init__.py +0 -0
  37. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/pdf/engines/__init__.py +0 -0
  38. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/pdf/engines/adobe.py +0 -0
  39. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/pdf/engines/llama.py +0 -0
  40. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/pdf/engines/nemoretriever.py +0 -0
  41. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/pdf/engines/pdf_helpers/__init__.py +0 -0
  42. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/pdf/engines/pdfium.py +0 -0
  43. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/pdf/engines/tika.py +0 -0
  44. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/pdf/engines/unstructured_io.py +0 -0
  45. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/pdf/pdf_extractor.py +0 -0
  46. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/pptx/__init__.py +0 -0
  47. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/pptx/engines/__init__.py +0 -0
  48. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/pptx/engines/pptx_helper.py +0 -0
  49. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/extract/pptx/pptx_extractor.py +0 -0
  50. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/mutate/__init__.py +0 -0
  51. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/mutate/deduplicate.py +0 -0
  52. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/mutate/filter.py +0 -0
  53. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/__init__.py +0 -0
  54. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/control_message_task.py +0 -0
  55. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/ingest_control_message.py +0 -0
  56. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/nim/__init__.py +0 -0
  57. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/nim/default_values.py +0 -0
  58. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/nim/model_interface/__init__.py +0 -0
  59. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/nim/model_interface/cached.py +0 -0
  60. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/nim/model_interface/decorators.py +0 -0
  61. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/nim/model_interface/deplot.py +0 -0
  62. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/nim/model_interface/helpers.py +0 -0
  63. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/nim/model_interface/nemoretriever_parse.py +0 -0
  64. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/nim/model_interface/paddle.py +0 -0
  65. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/nim/model_interface/parakeet.py +0 -0
  66. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/nim/model_interface/vlm.py +0 -0
  67. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/nim/model_interface/yolox.py +0 -0
  68. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/nim/nim_model_interface.py +0 -0
  69. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/tracing/__init__.py +0 -0
  70. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/tracing/latency.py +0 -0
  71. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/tracing/logging.py +0 -0
  72. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/primitives/tracing/tagging.py +0 -0
  73. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/__init__.py +0 -0
  74. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/extract/__init__.py +0 -0
  75. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/extract/extract_audio_schema.py +0 -0
  76. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/extract/extract_chart_schema.py +0 -0
  77. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/extract/extract_docx_schema.py +0 -0
  78. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/extract/extract_image_schema.py +0 -0
  79. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/extract/extract_infographic_schema.py +0 -0
  80. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/extract/extract_pdf_schema.py +0 -0
  81. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/extract/extract_pptx_schema.py +0 -0
  82. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/extract/extract_table_schema.py +0 -0
  83. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/message_brokers/__init__.py +0 -0
  84. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/message_brokers/message_broker_client_schema.py +0 -0
  85. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/message_brokers/request_schema.py +0 -0
  86. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/message_brokers/response_schema.py +0 -0
  87. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/meta/__init__.py +0 -0
  88. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/meta/base_model_noext.py +0 -0
  89. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/meta/ingest_job_schema.py +0 -0
  90. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/meta/metadata_schema.py +0 -0
  91. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/mutate/__init__.py +0 -0
  92. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/mutate/mutate_image_dedup_schema.py +0 -0
  93. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/store/__init__.py +0 -0
  94. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/store/store_embedding_schema.py +0 -0
  95. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/store/store_image_schema.py +0 -0
  96. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/transform/__init__.py +0 -0
  97. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/transform/transform_image_caption_schema.py +0 -0
  98. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/transform/transform_image_filter_schema.py +0 -0
  99. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/transform/transform_text_embedding_schema.py +0 -0
  100. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/schemas/transform/transform_text_splitter_schema.py +0 -0
  101. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/store/__init__.py +0 -0
  102. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/store/embed_text_upload.py +0 -0
  103. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/store/image_upload.py +0 -0
  104. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/transform/__init__.py +0 -0
  105. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/transform/caption_image.py +0 -0
  106. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/transform/embed_text.py +0 -0
  107. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/internal/transform/split_text.py +0 -0
  108. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/__init__.py +0 -0
  109. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/control_message/__init__.py +0 -0
  110. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/control_message/validators.py +0 -0
  111. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/converters/__init__.py +0 -0
  112. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/converters/bytetools.py +0 -0
  113. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/converters/containers.py +0 -0
  114. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/converters/datetools.py +0 -0
  115. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/converters/dftools.py +0 -0
  116. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/converters/formats.py +0 -0
  117. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/converters/type_mappings.py +0 -0
  118. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/detectors/__init__.py +0 -0
  119. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/detectors/language.py +0 -0
  120. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/exception_handlers/__init__.py +0 -0
  121. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/exception_handlers/converters.py +0 -0
  122. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/exception_handlers/decorators.py +0 -0
  123. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/exception_handlers/detectors.py +0 -0
  124. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/exception_handlers/pdf.py +0 -0
  125. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/exception_handlers/schemas.py +0 -0
  126. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/image_processing/__init__.py +0 -0
  127. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/image_processing/clustering.py +0 -0
  128. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/image_processing/processing.py +0 -0
  129. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/image_processing/table_and_chart.py +0 -0
  130. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/image_processing/transforms.py +0 -0
  131. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/logging/__init__.py +0 -0
  132. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/logging/configuration.py +0 -0
  133. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/message_brokers/__init__.py +0 -0
  134. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/message_brokers/simple_message_broker/__init__.py +0 -0
  135. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/message_brokers/simple_message_broker/broker.py +0 -0
  136. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/message_brokers/simple_message_broker/ordered_message_queue.py +0 -0
  137. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/message_brokers/simple_message_broker/simple_client.py +0 -0
  138. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/metadata/__init__.py +0 -0
  139. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/metadata/aggregators.py +0 -0
  140. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/multi_processing/__init__.py +0 -0
  141. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/multi_processing/mp_pool_singleton.py +0 -0
  142. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/nim/__init__.py +0 -0
  143. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/pdf/__init__.py +0 -0
  144. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/pdf/pdfium.py +0 -0
  145. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/schema/__init__.py +0 -0
  146. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/schema/schema_validator.py +0 -0
  147. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/service_clients/__init__.py +0 -0
  148. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/service_clients/client_base.py +0 -0
  149. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/service_clients/kafka/__init__.py +0 -0
  150. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/service_clients/redis/__init__.py +0 -0
  151. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/service_clients/redis/redis_client.py +0 -0
  152. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/service_clients/rest/__init__.py +0 -0
  153. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/service_clients/rest/rest_client.py +0 -0
  154. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api/util/string_processing/__init__.py +0 -0
  155. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api.egg-info/SOURCES.txt +0 -0
  156. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api.egg-info/dependency_links.txt +0 -0
  157. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api.egg-info/requires.txt +0 -0
  158. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/nv_ingest_api.egg-info/top_level.txt +0 -0
  159. {nv_ingest_api-2025.5.11.dev20250511 → nv_ingest_api-2025.5.12.dev20250512}/src/version.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: nv-ingest-api
3
- Version: 2025.5.11.dev20250511
3
+ Version: 2025.5.12.dev20250512
4
4
  Summary: Python module with core document ingestion functions.
5
5
  Author-email: Jeremy Dyer <jdyer@nvidia.com>
6
6
  License: Apache License
@@ -5,6 +5,7 @@
5
5
  from typing import Any, Dict, List, Optional, Tuple
6
6
 
7
7
  from nv_ingest_api.internal.primitives.nim import ModelInterface
8
+ import numpy as np
8
9
 
9
10
 
10
11
  # Assume ModelInterface is defined elsewhere in the project.
@@ -22,20 +23,13 @@ class EmbeddingModelInterface(ModelInterface):
22
23
 
23
24
  def prepare_data_for_inference(self, data: Dict[str, Any]) -> Dict[str, Any]:
24
25
  """
25
- Prepare input data for embedding inference. Ensures that a 'prompts' key is provided
26
- and that its value is a list.
27
-
28
- Raises
29
- ------
30
- KeyError
31
- If the 'prompts' key is missing.
26
+ Prepare input data for embedding inference. Returns a list of strings representing the text to be embedded.
32
27
  """
33
28
  if "prompts" not in data:
34
29
  raise KeyError("Input data must include 'prompts'.")
35
- # Ensure the prompts are in list format.
36
30
  if not isinstance(data["prompts"], list):
37
31
  data["prompts"] = [data["prompts"]]
38
- return data
32
+ return {"prompts": data["prompts"]}
39
33
 
40
34
  def format_input(
41
35
  self, data: Dict[str, Any], protocol: str, max_batch_size: int, **kwargs
@@ -63,29 +57,32 @@ class EmbeddingModelInterface(ModelInterface):
63
57
  - payloads is a list of JSON-serializable payload dictionaries.
64
58
  - batch_data_list is a list of dictionaries containing the key "prompts" corresponding to each batch.
65
59
  """
66
- if protocol != "http":
67
- raise ValueError("EmbeddingModelInterface only supports HTTP protocol.")
68
-
69
- prompts = data.get("prompts", [])
70
60
 
71
61
  def chunk_list(lst, chunk_size):
62
+ lst = lst["prompts"]
72
63
  return [lst[i : i + chunk_size] for i in range(0, len(lst), chunk_size)]
73
64
 
74
- batches = chunk_list(prompts, max_batch_size)
75
- payloads = []
76
- batch_data_list = []
77
- for batch in batches:
78
- payload = {
79
- "model": kwargs.get("model_name"),
80
- "input": batch,
81
- "encoding_format": kwargs.get("encoding_format", "float"),
82
- "extra_body": {
83
- "input_type": kwargs.get("input_type", "query"),
65
+ batches = chunk_list(data, max_batch_size)
66
+ if protocol == "http":
67
+ payloads = []
68
+ batch_data_list = []
69
+ for batch in batches:
70
+ payload = {
71
+ "model": kwargs.get("model_name"),
72
+ "input": batch,
73
+ "encoding_format": kwargs.get("encoding_format", "float"),
74
+ "input_type": kwargs.get("input_type", "passage"),
84
75
  "truncate": kwargs.get("truncate", "NONE"),
85
- },
86
- }
87
- payloads.append(payload)
88
- batch_data_list.append({"prompts": batch})
76
+ }
77
+ payloads.append(payload)
78
+ batch_data_list.append({"prompts": batch})
79
+ elif protocol == "grpc":
80
+ payloads = []
81
+ batch_data_list = []
82
+ for batch in batches:
83
+ text_np = np.array([[text.encode("utf-8")] for text in batch], dtype=np.object_)
84
+ payloads.append(text_np)
85
+ batch_data_list.append({"prompts": batch})
89
86
  return payloads, batch_data_list
90
87
 
91
88
  def parse_output(self, response: Any, protocol: str, data: Optional[Dict[str, Any]] = None, **kwargs) -> Any:
@@ -108,16 +105,17 @@ class EmbeddingModelInterface(ModelInterface):
108
105
  list
109
106
  A list of generated embeddings extracted from the response.
110
107
  """
111
- if protocol != "http":
112
- raise ValueError("EmbeddingModelInterface only supports HTTP protocol.")
113
- if isinstance(response, dict):
114
- embeddings = response.get("data")
115
- if not embeddings:
116
- raise RuntimeError("Unexpected response format: 'data' key is missing or empty.")
117
- # Each item in embeddings is expected to have an 'embedding' field.
118
- return [item.get("embedding", None) for item in embeddings]
119
- else:
120
- return [str(response)]
108
+ if protocol == "http":
109
+ if isinstance(response, dict):
110
+ embeddings = response.get("data")
111
+ if not embeddings:
112
+ raise RuntimeError("Unexpected response format: 'data' key is missing or empty.")
113
+ # Each item in embeddings is expected to have an 'embedding' field.
114
+ return [item.get("embedding", None) for item in embeddings]
115
+ else:
116
+ return [str(response)]
117
+ elif protocol == "grpc":
118
+ return [res.flatten() for res in response]
121
119
 
122
120
  def process_inference_results(self, output: Any, protocol: str, **kwargs) -> Any:
123
121
  """
@@ -129,7 +129,7 @@ class NimClient:
129
129
  """
130
130
  if self.protocol == "grpc":
131
131
  logger.debug("Performing gRPC inference for a batch...")
132
- response = self._grpc_infer(batch_input, model_name)
132
+ response = self._grpc_infer(batch_input, model_name, **kwargs)
133
133
  logger.debug("gRPC inference received response for a batch")
134
134
  elif self.protocol == "http":
135
135
  logger.debug("Performing HTTP inference for a batch...")
@@ -221,7 +221,7 @@ class NimClient:
221
221
 
222
222
  return all_results
223
223
 
224
- def _grpc_infer(self, formatted_input: np.ndarray, model_name: str) -> np.ndarray:
224
+ def _grpc_infer(self, formatted_input: np.ndarray, model_name: str, **kwargs) -> np.ndarray:
225
225
  """
226
226
  Perform inference using the gRPC protocol.
227
227
 
@@ -238,16 +238,24 @@ class NimClient:
238
238
  The output of the model as a numpy array.
239
239
  """
240
240
 
241
- input_tensors = [grpcclient.InferInput("input", formatted_input.shape, datatype="FP32")]
242
- input_tensors[0].set_data_from_numpy(formatted_input)
241
+ parameters = kwargs.get("parameters", {})
242
+ output_names = kwargs.get("outputs", ["output"])
243
+ dtype = kwargs.get("dtype", "FP32")
244
+ input_name = kwargs.get("input_name", "input")
243
245
 
244
- outputs = [grpcclient.InferRequestedOutput("output")]
245
- response = self.client.infer(model_name=model_name, inputs=input_tensors, outputs=outputs)
246
- logger.debug(f"gRPC inference response: {response}")
246
+ input_tensors = grpcclient.InferInput(input_name, formatted_input.shape, datatype=dtype)
247
+ input_tensors.set_data_from_numpy(formatted_input)
247
248
 
249
+ outputs = [grpcclient.InferRequestedOutput(output_name) for output_name in output_names]
250
+ response = self.client.infer(
251
+ model_name=model_name, parameters=parameters, inputs=[input_tensors], outputs=outputs
252
+ )
253
+ logger.debug(f"gRPC inference response: {response}")
248
254
  # TODO(self.client.has_error(response)) => raise error
249
-
250
- return response.as_numpy("output")
255
+ if len(outputs) == 1:
256
+ return response.as_numpy(outputs[0].name())
257
+ else:
258
+ return [response.as_numpy(output.name()) for output in outputs]
251
259
 
252
260
  def _http_infer(self, formatted_input: dict) -> dict:
253
261
  """
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: nv-ingest-api
3
- Version: 2025.5.11.dev20250511
3
+ Version: 2025.5.12.dev20250512
4
4
  Summary: Python module with core document ingestion functions.
5
5
  Author-email: Jeremy Dyer <jdyer@nvidia.com>
6
6
  License: Apache License