nv-ingest-client 2025.8.10.dev20250810__tar.gz → 2025.8.11.dev20250811__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of nv-ingest-client might be problematic. Click here for more details.

Files changed (61)
  1. {nv_ingest_client-2025.8.10.dev20250810/src/nv_ingest_client.egg-info → nv_ingest_client-2025.8.11.dev20250811}/PKG-INFO +1 -1
  2. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/util/transport.py +2 -2
  3. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/util/vdb/milvus.py +23 -17
  4. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811/src/nv_ingest_client.egg-info}/PKG-INFO +1 -1
  5. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/LICENSE +0 -0
  6. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/MANIFEST.in +0 -0
  7. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/README.md +0 -0
  8. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/pyproject.toml +0 -0
  9. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/setup.cfg +0 -0
  10. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/__init__.py +0 -0
  11. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/cli/__init__.py +0 -0
  12. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/cli/util/__init__.py +0 -0
  13. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/cli/util/click.py +0 -0
  14. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/cli/util/processing.py +0 -0
  15. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/cli/util/system.py +0 -0
  16. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/cli/util/tasks.py +0 -0
  17. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/client/__init__.py +0 -0
  18. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/client/client.py +0 -0
  19. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/client/interface.py +0 -0
  20. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/client/util/processing.py +0 -0
  21. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/nv_ingest_cli.py +0 -0
  22. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/__init__.py +0 -0
  23. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/exceptions.py +0 -0
  24. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/jobs/__init__.py +0 -0
  25. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/jobs/job_spec.py +0 -0
  26. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/jobs/job_state.py +0 -0
  27. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/tasks/__init__.py +0 -0
  28. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/tasks/audio_extraction.py +0 -0
  29. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/tasks/caption.py +0 -0
  30. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/tasks/chart_extraction.py +0 -0
  31. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/tasks/dedup.py +0 -0
  32. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/tasks/embed.py +0 -0
  33. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/tasks/extract.py +0 -0
  34. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/tasks/filter.py +0 -0
  35. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/tasks/infographic_extraction.py +0 -0
  36. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/tasks/split.py +0 -0
  37. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/tasks/store.py +0 -0
  38. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/tasks/table_extraction.py +0 -0
  39. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/tasks/task_base.py +0 -0
  40. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/tasks/task_factory.py +0 -0
  41. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/tasks/transform.py +0 -0
  42. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/primitives/tasks/vdb_upload.py +0 -0
  43. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/util/__init__.py +0 -0
  44. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/util/dataset.py +0 -0
  45. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/util/file_processing/__init__.py +0 -0
  46. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/util/file_processing/extract.py +0 -0
  47. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/util/milvus.py +0 -0
  48. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/util/process_json_files.py +0 -0
  49. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/util/processing.py +0 -0
  50. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/util/system.py +0 -0
  51. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/util/util.py +0 -0
  52. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/util/vdb/__init__.py +0 -0
  53. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/util/vdb/adt_vdb.py +0 -0
  54. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/util/vdb/opensearch.py +0 -0
  55. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client/util/zipkin.py +0 -0
  56. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client.egg-info/SOURCES.txt +0 -0
  57. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client.egg-info/dependency_links.txt +0 -0
  58. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client.egg-info/entry_points.txt +0 -0
  59. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client.egg-info/requires.txt +0 -0
  60. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/nv_ingest_client.egg-info/top_level.txt +0 -0
  61. {nv_ingest_client-2025.8.10.dev20250810 → nv_ingest_client-2025.8.11.dev20250811}/src/version.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: nv-ingest-client
3
- Version: 2025.8.10.dev20250810
3
+ Version: 2025.8.11.dev20250811
4
4
  Summary: Python client for the nv-ingest service
5
5
  Author-email: Jeremy Dyer <jdyer@nvidia.com>
6
6
  License: Apache License
@@ -26,7 +26,7 @@ def infer_microservice(
26
26
  client = NimClient(
27
27
  model_interface=EmbeddingModelInterface(),
28
28
  protocol="grpc",
29
- endpoints=(embedding_endpoint, embedding_endpoint),
29
+ endpoints=(embedding_endpoint, None),
30
30
  auth_token=nvidia_api_key,
31
31
  )
32
32
  return client.infer(
@@ -43,7 +43,7 @@ def infer_microservice(
43
43
  client = NimClient(
44
44
  model_interface=EmbeddingModelInterface(),
45
45
  protocol="http",
46
- endpoints=(embedding_endpoint, embedding_endpoint),
46
+ endpoints=(None, embedding_endpoint),
47
47
  auth_token=nvidia_api_key,
48
48
  )
49
49
  return client.infer(data, model_name, input_type=input_type, truncate=truncate, batch_size=batch_size)
@@ -757,25 +757,31 @@ def bulk_insert_milvus(
757
757
 
758
758
  connections.connect(uri=milvus_uri)
759
759
  t_bulk_start = time.time()
760
- files_to_upload = [_file for file_set in writer.batch_files for _file in file_set]
761
- task_id = utility.do_bulk_insert(
762
- collection_name=collection_name,
763
- files=files_to_upload,
764
- consistency_level=CONSISTENCY,
765
- )
760
+ task_ids = []
761
+ for files in writer.batch_files:
762
+ task_id = utility.do_bulk_insert(
763
+ collection_name=collection_name,
764
+ files=files,
765
+ consistency_level=CONSISTENCY,
766
+ )
767
+ task_ids.append(task_id)
766
768
  # list_bulk_insert_tasks = utility.list_bulk_insert_tasks(collection_name=collection_name)
767
- state = "Pending"
768
- while state != "Completed":
769
- task = utility.get_bulk_insert_state(task_id=task_id)
770
- state = task.state_name
771
- if state == "Completed":
772
- t_bulk_end = time.time()
773
- logger.info("Start time:", task.create_time_str)
774
- logger.info("Imported row count:", task.row_count)
775
- logger.info(f"Bulk {collection_name} upload took {t_bulk_end - t_bulk_start} s")
776
- if task.state == BulkInsertState.ImportFailed:
777
- logger.error("Failed reason:", task.failed_reason)
769
+ while len(task_ids) > 0:
778
770
  time.sleep(1)
771
+ for task_id in task_ids:
772
+ task = utility.get_bulk_insert_state(task_id=task_id)
773
+ state = task.state_name
774
+ if state == "Completed":
775
+ logger.info(f"Task: {task_id}")
776
+ logger.info(f"Start time: {task.create_time_str}")
777
+ logger.info(f"Imported row count: {task.row_count}")
778
+ task_ids.remove(task_id)
779
+ if task.state == BulkInsertState.ImportFailed:
780
+ logger.error(f"Task: {task_id}")
781
+ logger.error(f"Failed reason: {task.failed_reason}")
782
+ task_ids.remove(task_id)
783
+ t_bulk_end = time.time()
784
+ logger.info(f"Bulk {collection_name} upload took {t_bulk_end - t_bulk_start} s")
779
785
 
780
786
 
781
787
  def create_bm25_model(
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: nv-ingest-client
3
- Version: 2025.8.10.dev20250810
3
+ Version: 2025.8.11.dev20250811
4
4
  Summary: Python client for the nv-ingest service
5
5
  Author-email: Jeremy Dyer <jdyer@nvidia.com>
6
6
  License: Apache License