nv-ingest 2025.7.19.dev20250719__py3-none-any.whl → 2025.7.21.dev20250721__py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of nv-ingest might be problematic. Click here for more details.

@@ -215,7 +215,6 @@ def add_pdf_extractor_stage(pipeline, default_cpu_count, stage_name="pdf_extract
215
215
  min_replicas=0,
216
216
  max_replicas=max_replicas,
217
217
  )
218
-
219
218
  return stage_name
220
219
 
221
220
 
@@ -242,7 +241,7 @@ def add_table_extractor_stage(pipeline, default_cpu_count, stage_name="table_ext
242
241
  stage_actor=TableExtractorStage,
243
242
  config=table_extractor_config,
244
243
  min_replicas=0,
245
- max_replicas=2,
244
+ max_replicas=_get_max_replicas(default_cpu_count, percentage_of_cpu=0.20),
246
245
  )
247
246
 
248
247
  return stage_name
@@ -271,7 +270,7 @@ def add_chart_extractor_stage(pipeline, default_cpu_count, stage_name="chart_ext
271
270
  stage_actor=ChartExtractorStage,
272
271
  config=chart_extractor_config,
273
272
  min_replicas=0,
274
- max_replicas=2,
273
+ max_replicas=_get_max_replicas(default_cpu_count, percentage_of_cpu=0.20),
275
274
  )
276
275
 
277
276
  return stage_name
@@ -295,7 +294,7 @@ def add_infographic_extractor_stage(pipeline, default_cpu_count, stage_name="inf
295
294
  stage_actor=InfographicExtractorStage,
296
295
  config=infographic_content_extractor_config,
297
296
  min_replicas=0,
298
- max_replicas=1,
297
+ max_replicas=2,
299
298
  )
300
299
 
301
300
  return stage_name
@@ -317,7 +316,7 @@ def add_image_extractor_stage(pipeline, default_cpu_count, stage_name="image_ext
317
316
  stage_actor=ImageExtractorStage,
318
317
  config=image_extractor_config,
319
318
  min_replicas=0,
320
- max_replicas=1,
319
+ max_replicas=2,
321
320
  )
322
321
 
323
322
  return stage_name
@@ -383,11 +382,7 @@ def add_audio_extractor_stage(pipeline, default_cpu_count, stage_name="audio_ext
383
382
  )
384
383
 
385
384
  pipeline.add_stage(
386
- name=stage_name,
387
- stage_actor=AudioExtractorStage,
388
- config=audio_extractor_config,
389
- min_replicas=0,
390
- max_replicas=1,
385
+ name=stage_name, stage_actor=AudioExtractorStage, config=audio_extractor_config, min_replicas=0, max_replicas=2
391
386
  )
392
387
 
393
388
  return stage_name
@@ -400,7 +395,7 @@ def add_html_extractor_stage(pipeline, default_cpu_count, stage_name="html_extra
400
395
  stage_actor=HtmlExtractorStage,
401
396
  config=HtmlExtractorSchema(),
402
397
  min_replicas=0,
403
- max_replicas=1,
398
+ max_replicas=2,
404
399
  )
405
400
 
406
401
  return stage_name
@@ -630,3 +625,10 @@ def add_source_stage(pipeline, default_cpu_count, source_name="pipeline_source")
630
625
  start_simple_message_broker(source_config.broker_client.model_dump())
631
626
 
632
627
  return source_name
628
+
629
+
630
+ def _get_max_replicas(default_cpu_count=None, percentage_of_cpu=0.14):
631
+ if default_cpu_count is None:
632
+ default_cpu_count = _system_resource_probe.get_cpu_count()
633
+
634
+ return int(max(1, (default_cpu_count * percentage_of_cpu)))
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: nv-ingest
3
- Version: 2025.7.19.dev20250719
3
+ Version: 2025.7.21.dev20250721
4
4
  Summary: Python module for multimodal document ingestion
5
5
  Author-email: Jeremy Dyer <jdyer@nvidia.com>
6
6
  License: Apache License
@@ -67,7 +67,7 @@ nv_ingest/framework/orchestration/ray/util/pipeline/__init__.py,sha256=wQSlVx3T1
67
67
  nv_ingest/framework/orchestration/ray/util/pipeline/pid_controller.py,sha256=flRLS7yc5n6gheykayuL3prC7O-ZhcVY2s9Wc14SGWE,47377
68
68
  nv_ingest/framework/orchestration/ray/util/pipeline/pipeline_builders.py,sha256=d2-GS2tqk6JOFdw65CL1AwfjdUbkC_XxUuJH8Dy-aQ0,10456
69
69
  nv_ingest/framework/orchestration/ray/util/pipeline/pipeline_runners.py,sha256=dlz83vEFKcvrwsPFP1M0Md1lOYbuOVX2MeyCPq43RGg,14392
70
- nv_ingest/framework/orchestration/ray/util/pipeline/stage_builders.py,sha256=rlMqLtuaI-VdVlAT_7-9HSIgX6YfsxWsBzKe3fBvYl0,21136
70
+ nv_ingest/framework/orchestration/ray/util/pipeline/stage_builders.py,sha256=bnhnrl6Yp39txWoLCB9os9PEzHs5WVJlbW4aE6_yNFo,21459
71
71
  nv_ingest/framework/orchestration/ray/util/pipeline/tools.py,sha256=LQVb8k9jURaxh2Ga44Js_XuYFCbeN4_nLgDmtExovQg,8026
72
72
  nv_ingest/framework/orchestration/ray/util/system_tools/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
73
73
  nv_ingest/framework/orchestration/ray/util/system_tools/memory.py,sha256=ICqY0LLB3hFTZk03iX5yffMSKFH2q_aQomtDVzS_mKw,2228
@@ -96,8 +96,8 @@ nv_ingest/framework/util/service/meta/ingest/__init__.py,sha256=wQSlVx3T14ZgQAt-
96
96
  nv_ingest/framework/util/service/meta/ingest/ingest_service_meta.py,sha256=QS3uNxWBl5dIcmIpJKNe8_TLcTUuN2vcKyHeAwa-eSo,1589
97
97
  nv_ingest/framework/util/telemetry/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
98
98
  nv_ingest/framework/util/telemetry/global_stats.py,sha256=nq65pEEdiwjAfGiqsxG1CeQMC96O3CfQxsZuGFCY-ds,4554
99
- nv_ingest-2025.7.19.dev20250719.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
100
- nv_ingest-2025.7.19.dev20250719.dist-info/METADATA,sha256=mWq6HM-znacym6NTDg4UsUXcxQ8OYKNMlrSQsweU3C0,15142
101
- nv_ingest-2025.7.19.dev20250719.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
102
- nv_ingest-2025.7.19.dev20250719.dist-info/top_level.txt,sha256=sjb0ajIsgn3YgftSjZHlYO0HjYAIIhNuXG_AmywCvaU,10
103
- nv_ingest-2025.7.19.dev20250719.dist-info/RECORD,,
99
+ nv_ingest-2025.7.21.dev20250721.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
100
+ nv_ingest-2025.7.21.dev20250721.dist-info/METADATA,sha256=5pQ5u5URCsxzHsroY3_BNcc9ziLzke-HsWH1gOuqT9A,15142
101
+ nv_ingest-2025.7.21.dev20250721.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
102
+ nv_ingest-2025.7.21.dev20250721.dist-info/top_level.txt,sha256=sjb0ajIsgn3YgftSjZHlYO0HjYAIIhNuXG_AmywCvaU,10
103
+ nv_ingest-2025.7.21.dev20250721.dist-info/RECORD,,