nv-ingest 25.6.4rc4__py3-none-any.whl → 25.6.4rc6__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of nv-ingest might be problematic. Click here for more details.
- nv_ingest/framework/orchestration/ray/util/pipeline/stage_builders.py +26 -34
- {nv_ingest-25.6.4rc4.dist-info → nv_ingest-25.6.4rc6.dist-info}/METADATA +1 -1
- {nv_ingest-25.6.4rc4.dist-info → nv_ingest-25.6.4rc6.dist-info}/RECORD +6 -6
- {nv_ingest-25.6.4rc4.dist-info → nv_ingest-25.6.4rc6.dist-info}/WHEEL +0 -0
- {nv_ingest-25.6.4rc4.dist-info → nv_ingest-25.6.4rc6.dist-info}/licenses/LICENSE +0 -0
- {nv_ingest-25.6.4rc4.dist-info → nv_ingest-25.6.4rc6.dist-info}/top_level.txt +0 -0
|
@@ -230,11 +230,7 @@ def add_table_extractor_stage(pipeline, default_cpu_count, stage_name="table_ext
|
|
|
230
230
|
)
|
|
231
231
|
|
|
232
232
|
pipeline.add_stage(
|
|
233
|
-
name=stage_name,
|
|
234
|
-
stage_actor=TableExtractorStage,
|
|
235
|
-
config=table_extractor_config,
|
|
236
|
-
min_replicas=0,
|
|
237
|
-
max_replicas=int(max(1, (default_cpu_count // 7))), # 14% of available CPU cores
|
|
233
|
+
name=stage_name, stage_actor=TableExtractorStage, config=table_extractor_config, min_replicas=1, max_replicas=1
|
|
238
234
|
)
|
|
239
235
|
|
|
240
236
|
return stage_name
|
|
@@ -262,8 +258,8 @@ def add_chart_extractor_stage(pipeline, default_cpu_count, stage_name="chart_ext
|
|
|
262
258
|
name=stage_name,
|
|
263
259
|
stage_actor=ChartExtractorStage,
|
|
264
260
|
config=chart_extractor_config,
|
|
265
|
-
min_replicas=
|
|
266
|
-
max_replicas=
|
|
261
|
+
min_replicas=1,
|
|
262
|
+
max_replicas=1,
|
|
267
263
|
)
|
|
268
264
|
|
|
269
265
|
return stage_name
|
|
@@ -286,8 +282,8 @@ def add_infographic_extractor_stage(pipeline, default_cpu_count, stage_name="inf
|
|
|
286
282
|
name=stage_name,
|
|
287
283
|
stage_actor=InfographicExtractorStage,
|
|
288
284
|
config=infographic_content_extractor_config,
|
|
289
|
-
min_replicas=
|
|
290
|
-
max_replicas=
|
|
285
|
+
min_replicas=1,
|
|
286
|
+
max_replicas=1,
|
|
291
287
|
)
|
|
292
288
|
|
|
293
289
|
return stage_name
|
|
@@ -308,8 +304,8 @@ def add_image_extractor_stage(pipeline, default_cpu_count, stage_name="image_ext
|
|
|
308
304
|
name=stage_name,
|
|
309
305
|
stage_actor=ImageExtractorStage,
|
|
310
306
|
config=image_extractor_config,
|
|
311
|
-
min_replicas=
|
|
312
|
-
max_replicas=
|
|
307
|
+
min_replicas=1,
|
|
308
|
+
max_replicas=1,
|
|
313
309
|
)
|
|
314
310
|
|
|
315
311
|
return stage_name
|
|
@@ -330,8 +326,8 @@ def add_docx_extractor_stage(pipeline, default_cpu_count, stage_name="docx_extra
|
|
|
330
326
|
name=stage_name,
|
|
331
327
|
stage_actor=DocxExtractorStage,
|
|
332
328
|
config=DocxExtractorSchema(**docx_extractor_config),
|
|
333
|
-
min_replicas=
|
|
334
|
-
max_replicas=
|
|
329
|
+
min_replicas=1,
|
|
330
|
+
max_replicas=1,
|
|
335
331
|
)
|
|
336
332
|
|
|
337
333
|
return stage_name
|
|
@@ -352,8 +348,8 @@ def add_pptx_extractor_stage(pipeline, default_cpu_count, stage_name="pptx_extra
|
|
|
352
348
|
name=stage_name,
|
|
353
349
|
stage_actor=PPTXExtractorStage,
|
|
354
350
|
config=PPTXExtractorSchema(**pptx_extractor_config),
|
|
355
|
-
min_replicas=
|
|
356
|
-
max_replicas=
|
|
351
|
+
min_replicas=1,
|
|
352
|
+
max_replicas=1,
|
|
357
353
|
)
|
|
358
354
|
|
|
359
355
|
return stage_name
|
|
@@ -378,7 +374,7 @@ def add_audio_extractor_stage(pipeline, default_cpu_count, stage_name="audio_ext
|
|
|
378
374
|
name=stage_name,
|
|
379
375
|
stage_actor=AudioExtractorStage,
|
|
380
376
|
config=audio_extractor_config,
|
|
381
|
-
min_replicas=
|
|
377
|
+
min_replicas=1,
|
|
382
378
|
max_replicas=1, # Audio extraction is a heavy IO bound operation with minimal CPU usage
|
|
383
379
|
)
|
|
384
380
|
|
|
@@ -391,8 +387,8 @@ def add_html_extractor_stage(pipeline, default_cpu_count, stage_name="html_extra
|
|
|
391
387
|
name=stage_name,
|
|
392
388
|
stage_actor=HtmlExtractorStage,
|
|
393
389
|
config=HtmlExtractorSchema(),
|
|
394
|
-
min_replicas=
|
|
395
|
-
max_replicas=
|
|
390
|
+
min_replicas=1,
|
|
391
|
+
max_replicas=1,
|
|
396
392
|
)
|
|
397
393
|
|
|
398
394
|
return stage_name
|
|
@@ -412,8 +408,8 @@ def add_otel_tracer_stage(pipeline, default_cpu_count, stage_name="otel_tracer")
|
|
|
412
408
|
name=stage_name,
|
|
413
409
|
stage_actor=OpenTelemetryTracerStage,
|
|
414
410
|
config=otel_tracer_config,
|
|
415
|
-
min_replicas=
|
|
416
|
-
max_replicas=
|
|
411
|
+
min_replicas=1,
|
|
412
|
+
max_replicas=1,
|
|
417
413
|
)
|
|
418
414
|
|
|
419
415
|
return stage_name
|
|
@@ -426,7 +422,7 @@ def add_image_dedup_stage(pipeline, default_cpu_count, stage_name="image_dedup")
|
|
|
426
422
|
name=stage_name,
|
|
427
423
|
stage_actor=ImageDedupStage,
|
|
428
424
|
config=config,
|
|
429
|
-
min_replicas=
|
|
425
|
+
min_replicas=1,
|
|
430
426
|
max_replicas=1,
|
|
431
427
|
)
|
|
432
428
|
|
|
@@ -440,7 +436,7 @@ def add_image_filter_stage(pipeline, default_cpu_count, stage_name="image_filter
|
|
|
440
436
|
name=stage_name,
|
|
441
437
|
stage_actor=ImageFilterStage,
|
|
442
438
|
config=config,
|
|
443
|
-
min_replicas=
|
|
439
|
+
min_replicas=1,
|
|
444
440
|
max_replicas=1,
|
|
445
441
|
)
|
|
446
442
|
|
|
@@ -456,8 +452,8 @@ def add_text_splitter_stage(pipeline, default_cpu_count, stage_name="text_splitt
|
|
|
456
452
|
name=stage_name,
|
|
457
453
|
stage_actor=TextSplitterStage,
|
|
458
454
|
config=config,
|
|
459
|
-
min_replicas=
|
|
460
|
-
max_replicas=
|
|
455
|
+
min_replicas=1,
|
|
456
|
+
max_replicas=1,
|
|
461
457
|
)
|
|
462
458
|
|
|
463
459
|
return stage_name
|
|
@@ -488,7 +484,7 @@ def add_image_caption_stage(pipeline, default_cpu_count, stage_name="image_capti
|
|
|
488
484
|
name=stage_name,
|
|
489
485
|
stage_actor=ImageCaptionTransformStage,
|
|
490
486
|
config=config,
|
|
491
|
-
min_replicas=
|
|
487
|
+
min_replicas=1,
|
|
492
488
|
max_replicas=1,
|
|
493
489
|
)
|
|
494
490
|
|
|
@@ -515,11 +511,7 @@ def add_text_embedding_stage(pipeline, default_cpu_count, stage_name="text_embed
|
|
|
515
511
|
)
|
|
516
512
|
|
|
517
513
|
pipeline.add_stage(
|
|
518
|
-
name=stage_name,
|
|
519
|
-
stage_actor=TextEmbeddingTransformStage,
|
|
520
|
-
config=config,
|
|
521
|
-
min_replicas=0,
|
|
522
|
-
max_replicas=int(max(1, (default_cpu_count // 14))), # 7% of available CPU cores
|
|
514
|
+
name=stage_name, stage_actor=TextEmbeddingTransformStage, config=config, min_replicas=1, max_replicas=1
|
|
523
515
|
)
|
|
524
516
|
|
|
525
517
|
return stage_name
|
|
@@ -532,7 +524,7 @@ def add_embedding_storage_stage(pipeline, default_cpu_count, stage_name="embeddi
|
|
|
532
524
|
name=stage_name,
|
|
533
525
|
stage_actor=EmbeddingStorageStage,
|
|
534
526
|
config=config,
|
|
535
|
-
min_replicas=
|
|
527
|
+
min_replicas=1,
|
|
536
528
|
max_replicas=1,
|
|
537
529
|
)
|
|
538
530
|
|
|
@@ -545,7 +537,7 @@ def add_image_storage_stage(pipeline, default_cpu_count, stage_name="image_stora
|
|
|
545
537
|
name=stage_name,
|
|
546
538
|
stage_actor=ImageStorageStage,
|
|
547
539
|
config=config,
|
|
548
|
-
min_replicas=
|
|
540
|
+
min_replicas=1,
|
|
549
541
|
max_replicas=1,
|
|
550
542
|
)
|
|
551
543
|
|
|
@@ -583,8 +575,8 @@ def add_message_broker_response_stage(pipeline, default_cpu_count, stage_name="b
|
|
|
583
575
|
name=stage_name,
|
|
584
576
|
stage_actor=MessageBrokerTaskSinkStage,
|
|
585
577
|
config=sink_config,
|
|
586
|
-
min_replicas=
|
|
587
|
-
max_replicas=
|
|
578
|
+
min_replicas=1,
|
|
579
|
+
max_replicas=1,
|
|
588
580
|
)
|
|
589
581
|
|
|
590
582
|
return stage_name
|
|
@@ -67,7 +67,7 @@ nv_ingest/framework/orchestration/ray/util/pipeline/__init__.py,sha256=wQSlVx3T1
|
|
|
67
67
|
nv_ingest/framework/orchestration/ray/util/pipeline/pid_controller.py,sha256=AWyCFPP41vp1NOkO2urqm7vh-sTGKypJxwhdq8HxK6Q,50681
|
|
68
68
|
nv_ingest/framework/orchestration/ray/util/pipeline/pipeline_builders.py,sha256=jMYnVe_0rb1OIO9mlB4LH3uXtgaXBbUG-rDPx6fe6J8,10456
|
|
69
69
|
nv_ingest/framework/orchestration/ray/util/pipeline/pipeline_runners.py,sha256=IKQHlEwe0xsjr4MgQJVL0UtnKha1qaoPFc08DF5QzMM,14351
|
|
70
|
-
nv_ingest/framework/orchestration/ray/util/pipeline/stage_builders.py,sha256=
|
|
70
|
+
nv_ingest/framework/orchestration/ray/util/pipeline/stage_builders.py,sha256=rE1azhkVh5Gk_j4GdmUArSM76SByR44YRNFar4-BSkw,20803
|
|
71
71
|
nv_ingest/framework/orchestration/ray/util/system_tools/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
72
72
|
nv_ingest/framework/orchestration/ray/util/system_tools/memory.py,sha256=ICqY0LLB3hFTZk03iX5yffMSKFH2q_aQomtDVzS_mKw,2228
|
|
73
73
|
nv_ingest/framework/orchestration/ray/util/system_tools/visualizers.py,sha256=2oHZdO_3L1LGuzpyNmZBDh19n0E-APAaHk4MEwBwSHs,12895
|
|
@@ -95,8 +95,8 @@ nv_ingest/framework/util/service/meta/ingest/__init__.py,sha256=wQSlVx3T14ZgQAt-
|
|
|
95
95
|
nv_ingest/framework/util/service/meta/ingest/ingest_service_meta.py,sha256=QS3uNxWBl5dIcmIpJKNe8_TLcTUuN2vcKyHeAwa-eSo,1589
|
|
96
96
|
nv_ingest/framework/util/telemetry/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
97
97
|
nv_ingest/framework/util/telemetry/global_stats.py,sha256=nq65pEEdiwjAfGiqsxG1CeQMC96O3CfQxsZuGFCY-ds,4554
|
|
98
|
-
nv_ingest-25.6.
|
|
99
|
-
nv_ingest-25.6.
|
|
100
|
-
nv_ingest-25.6.
|
|
101
|
-
nv_ingest-25.6.
|
|
102
|
-
nv_ingest-25.6.
|
|
98
|
+
nv_ingest-25.6.4rc6.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
|
99
|
+
nv_ingest-25.6.4rc6.dist-info/METADATA,sha256=ZbUiqF3zSJpLlk9P_uSQ3D_JcUUMHSVGSttvzyuZLlo,15167
|
|
100
|
+
nv_ingest-25.6.4rc6.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
101
|
+
nv_ingest-25.6.4rc6.dist-info/top_level.txt,sha256=sjb0ajIsgn3YgftSjZHlYO0HjYAIIhNuXG_AmywCvaU,10
|
|
102
|
+
nv_ingest-25.6.4rc6.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|