nv-ingest 25.6.4rc4__py3-none-any.whl → 25.6.4rc6__py3-none-any.whl

This diff shows the changes between two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Potentially problematic release.


This version of nv-ingest might be problematic. Click here for more details.

@@ -230,11 +230,7 @@ def add_table_extractor_stage(pipeline, default_cpu_count, stage_name="table_ext
230
230
  )
231
231
 
232
232
  pipeline.add_stage(
233
- name=stage_name,
234
- stage_actor=TableExtractorStage,
235
- config=table_extractor_config,
236
- min_replicas=0,
237
- max_replicas=int(max(1, (default_cpu_count // 7))), # 14% of available CPU cores
233
+ name=stage_name, stage_actor=TableExtractorStage, config=table_extractor_config, min_replicas=1, max_replicas=1
238
234
  )
239
235
 
240
236
  return stage_name
@@ -262,8 +258,8 @@ def add_chart_extractor_stage(pipeline, default_cpu_count, stage_name="chart_ext
262
258
  name=stage_name,
263
259
  stage_actor=ChartExtractorStage,
264
260
  config=chart_extractor_config,
265
- min_replicas=0,
266
- max_replicas=int(max(1, (default_cpu_count // 7))), # 14% of available CPU cores
261
+ min_replicas=1,
262
+ max_replicas=1,
267
263
  )
268
264
 
269
265
  return stage_name
@@ -286,8 +282,8 @@ def add_infographic_extractor_stage(pipeline, default_cpu_count, stage_name="inf
286
282
  name=stage_name,
287
283
  stage_actor=InfographicExtractorStage,
288
284
  config=infographic_content_extractor_config,
289
- min_replicas=0,
290
- max_replicas=int(max(1, (default_cpu_count // 14))), # 7% of available CPU cores
285
+ min_replicas=1,
286
+ max_replicas=1,
291
287
  )
292
288
 
293
289
  return stage_name
@@ -308,8 +304,8 @@ def add_image_extractor_stage(pipeline, default_cpu_count, stage_name="image_ext
308
304
  name=stage_name,
309
305
  stage_actor=ImageExtractorStage,
310
306
  config=image_extractor_config,
311
- min_replicas=0,
312
- max_replicas=int(max(1, (default_cpu_count // 14))), # 7% of available CPU cores
307
+ min_replicas=1,
308
+ max_replicas=1,
313
309
  )
314
310
 
315
311
  return stage_name
@@ -330,8 +326,8 @@ def add_docx_extractor_stage(pipeline, default_cpu_count, stage_name="docx_extra
330
326
  name=stage_name,
331
327
  stage_actor=DocxExtractorStage,
332
328
  config=DocxExtractorSchema(**docx_extractor_config),
333
- min_replicas=0,
334
- max_replicas=int(max(1, (default_cpu_count // 14))), # 7% of available CPU cores
329
+ min_replicas=1,
330
+ max_replicas=1,
335
331
  )
336
332
 
337
333
  return stage_name
@@ -352,8 +348,8 @@ def add_pptx_extractor_stage(pipeline, default_cpu_count, stage_name="pptx_extra
352
348
  name=stage_name,
353
349
  stage_actor=PPTXExtractorStage,
354
350
  config=PPTXExtractorSchema(**pptx_extractor_config),
355
- min_replicas=0,
356
- max_replicas=int(max(1, (default_cpu_count // 14))), # 7% of available CPU cores
351
+ min_replicas=1,
352
+ max_replicas=1,
357
353
  )
358
354
 
359
355
  return stage_name
@@ -378,7 +374,7 @@ def add_audio_extractor_stage(pipeline, default_cpu_count, stage_name="audio_ext
378
374
  name=stage_name,
379
375
  stage_actor=AudioExtractorStage,
380
376
  config=audio_extractor_config,
381
- min_replicas=0,
377
+ min_replicas=1,
382
378
  max_replicas=1, # Audio extraction is a heavy IO bound operation with minimal CPU usage
383
379
  )
384
380
 
@@ -391,8 +387,8 @@ def add_html_extractor_stage(pipeline, default_cpu_count, stage_name="html_extra
391
387
  name=stage_name,
392
388
  stage_actor=HtmlExtractorStage,
393
389
  config=HtmlExtractorSchema(),
394
- min_replicas=0,
395
- max_replicas=int(max(1, (default_cpu_count // 14))), # 7% of available CPU cores
390
+ min_replicas=1,
391
+ max_replicas=1,
396
392
  )
397
393
 
398
394
  return stage_name
@@ -412,8 +408,8 @@ def add_otel_tracer_stage(pipeline, default_cpu_count, stage_name="otel_tracer")
412
408
  name=stage_name,
413
409
  stage_actor=OpenTelemetryTracerStage,
414
410
  config=otel_tracer_config,
415
- min_replicas=0,
416
- max_replicas=2,
411
+ min_replicas=1,
412
+ max_replicas=1,
417
413
  )
418
414
 
419
415
  return stage_name
@@ -426,7 +422,7 @@ def add_image_dedup_stage(pipeline, default_cpu_count, stage_name="image_dedup")
426
422
  name=stage_name,
427
423
  stage_actor=ImageDedupStage,
428
424
  config=config,
429
- min_replicas=0,
425
+ min_replicas=1,
430
426
  max_replicas=1,
431
427
  )
432
428
 
@@ -440,7 +436,7 @@ def add_image_filter_stage(pipeline, default_cpu_count, stage_name="image_filter
440
436
  name=stage_name,
441
437
  stage_actor=ImageFilterStage,
442
438
  config=config,
443
- min_replicas=0,
439
+ min_replicas=1,
444
440
  max_replicas=1,
445
441
  )
446
442
 
@@ -456,8 +452,8 @@ def add_text_splitter_stage(pipeline, default_cpu_count, stage_name="text_splitt
456
452
  name=stage_name,
457
453
  stage_actor=TextSplitterStage,
458
454
  config=config,
459
- min_replicas=0,
460
- max_replicas=int(max(1, (default_cpu_count // 14))), # 7% of available CPU cores
455
+ min_replicas=1,
456
+ max_replicas=1,
461
457
  )
462
458
 
463
459
  return stage_name
@@ -488,7 +484,7 @@ def add_image_caption_stage(pipeline, default_cpu_count, stage_name="image_capti
488
484
  name=stage_name,
489
485
  stage_actor=ImageCaptionTransformStage,
490
486
  config=config,
491
- min_replicas=0,
487
+ min_replicas=1,
492
488
  max_replicas=1,
493
489
  )
494
490
 
@@ -515,11 +511,7 @@ def add_text_embedding_stage(pipeline, default_cpu_count, stage_name="text_embed
515
511
  )
516
512
 
517
513
  pipeline.add_stage(
518
- name=stage_name,
519
- stage_actor=TextEmbeddingTransformStage,
520
- config=config,
521
- min_replicas=0,
522
- max_replicas=int(max(1, (default_cpu_count // 14))), # 7% of available CPU cores
514
+ name=stage_name, stage_actor=TextEmbeddingTransformStage, config=config, min_replicas=1, max_replicas=1
523
515
  )
524
516
 
525
517
  return stage_name
@@ -532,7 +524,7 @@ def add_embedding_storage_stage(pipeline, default_cpu_count, stage_name="embeddi
532
524
  name=stage_name,
533
525
  stage_actor=EmbeddingStorageStage,
534
526
  config=config,
535
- min_replicas=0,
527
+ min_replicas=1,
536
528
  max_replicas=1,
537
529
  )
538
530
 
@@ -545,7 +537,7 @@ def add_image_storage_stage(pipeline, default_cpu_count, stage_name="image_stora
545
537
  name=stage_name,
546
538
  stage_actor=ImageStorageStage,
547
539
  config=config,
548
- min_replicas=0,
540
+ min_replicas=1,
549
541
  max_replicas=1,
550
542
  )
551
543
 
@@ -583,8 +575,8 @@ def add_message_broker_response_stage(pipeline, default_cpu_count, stage_name="b
583
575
  name=stage_name,
584
576
  stage_actor=MessageBrokerTaskSinkStage,
585
577
  config=sink_config,
586
- min_replicas=0,
587
- max_replicas=2,
578
+ min_replicas=1,
579
+ max_replicas=1,
588
580
  )
589
581
 
590
582
  return stage_name
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: nv-ingest
3
- Version: 25.6.4rc4
3
+ Version: 25.6.4rc6
4
4
  Summary: Python module for multimodal document ingestion
5
5
  Author-email: Jeremy Dyer <jdyer@nvidia.com>
6
6
  License: Apache License
@@ -67,7 +67,7 @@ nv_ingest/framework/orchestration/ray/util/pipeline/__init__.py,sha256=wQSlVx3T1
67
67
  nv_ingest/framework/orchestration/ray/util/pipeline/pid_controller.py,sha256=AWyCFPP41vp1NOkO2urqm7vh-sTGKypJxwhdq8HxK6Q,50681
68
68
  nv_ingest/framework/orchestration/ray/util/pipeline/pipeline_builders.py,sha256=jMYnVe_0rb1OIO9mlB4LH3uXtgaXBbUG-rDPx6fe6J8,10456
69
69
  nv_ingest/framework/orchestration/ray/util/pipeline/pipeline_runners.py,sha256=IKQHlEwe0xsjr4MgQJVL0UtnKha1qaoPFc08DF5QzMM,14351
70
- nv_ingest/framework/orchestration/ray/util/pipeline/stage_builders.py,sha256=ZFJkeJNbDM_GsedUlfk2B8kI93L_MNK6gxPgeryZM6I,21463
70
+ nv_ingest/framework/orchestration/ray/util/pipeline/stage_builders.py,sha256=rE1azhkVh5Gk_j4GdmUArSM76SByR44YRNFar4-BSkw,20803
71
71
  nv_ingest/framework/orchestration/ray/util/system_tools/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
72
72
  nv_ingest/framework/orchestration/ray/util/system_tools/memory.py,sha256=ICqY0LLB3hFTZk03iX5yffMSKFH2q_aQomtDVzS_mKw,2228
73
73
  nv_ingest/framework/orchestration/ray/util/system_tools/visualizers.py,sha256=2oHZdO_3L1LGuzpyNmZBDh19n0E-APAaHk4MEwBwSHs,12895
@@ -95,8 +95,8 @@ nv_ingest/framework/util/service/meta/ingest/__init__.py,sha256=wQSlVx3T14ZgQAt-
95
95
  nv_ingest/framework/util/service/meta/ingest/ingest_service_meta.py,sha256=QS3uNxWBl5dIcmIpJKNe8_TLcTUuN2vcKyHeAwa-eSo,1589
96
96
  nv_ingest/framework/util/telemetry/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
97
97
  nv_ingest/framework/util/telemetry/global_stats.py,sha256=nq65pEEdiwjAfGiqsxG1CeQMC96O3CfQxsZuGFCY-ds,4554
98
- nv_ingest-25.6.4rc4.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
99
- nv_ingest-25.6.4rc4.dist-info/METADATA,sha256=FL8Q5cnYKQKGxGuURlNuGhOOUYjGlBkRz7BzAebV4e8,15167
100
- nv_ingest-25.6.4rc4.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
101
- nv_ingest-25.6.4rc4.dist-info/top_level.txt,sha256=sjb0ajIsgn3YgftSjZHlYO0HjYAIIhNuXG_AmywCvaU,10
102
- nv_ingest-25.6.4rc4.dist-info/RECORD,,
98
+ nv_ingest-25.6.4rc6.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
99
+ nv_ingest-25.6.4rc6.dist-info/METADATA,sha256=ZbUiqF3zSJpLlk9P_uSQ3D_JcUUMHSVGSttvzyuZLlo,15167
100
+ nv_ingest-25.6.4rc6.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
101
+ nv_ingest-25.6.4rc6.dist-info/top_level.txt,sha256=sjb0ajIsgn3YgftSjZHlYO0HjYAIIhNuXG_AmywCvaU,10
102
+ nv_ingest-25.6.4rc6.dist-info/RECORD,,