nv-ingest 2025.9.15.dev20250915__py3-none-any.whl → 2025.12.13.dev20251213__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (25) hide show
  1. nv_ingest/api/__init__.py +6 -0
  2. nv_ingest/api/main.py +2 -0
  3. nv_ingest/api/tracing.py +82 -0
  4. nv_ingest/api/v2/README.md +203 -0
  5. nv_ingest/api/v2/__init__.py +3 -0
  6. nv_ingest/api/v2/ingest.py +1300 -0
  7. nv_ingest/framework/orchestration/process/dependent_services.py +17 -10
  8. nv_ingest/framework/orchestration/process/execution.py +6 -0
  9. nv_ingest/framework/orchestration/process/strategies.py +6 -2
  10. nv_ingest/framework/orchestration/process/termination.py +49 -9
  11. nv_ingest/framework/orchestration/ray/examples/pipeline_test_harness.py +11 -11
  12. nv_ingest/framework/orchestration/ray/stages/extractors/audio_extractor.py +0 -2
  13. nv_ingest/framework/orchestration/ray/stages/extractors/ocr_extractor.py +71 -0
  14. nv_ingest/framework/orchestration/ray/stages/sources/message_broker_task_source.py +41 -8
  15. nv_ingest/framework/orchestration/ray/stages/storage/image_storage.py +72 -6
  16. nv_ingest/framework/orchestration/ray/util/pipeline/pipeline_runners.py +40 -0
  17. nv_ingest/framework/util/service/impl/ingest/redis_ingest_service.py +215 -11
  18. nv_ingest/pipeline/config/replica_resolver.py +12 -2
  19. nv_ingest/pipeline/default_libmode_pipeline_impl.py +40 -25
  20. nv_ingest/pipeline/default_pipeline_impl.py +83 -40
  21. {nv_ingest-2025.9.15.dev20250915.dist-info → nv_ingest-2025.12.13.dev20251213.dist-info}/METADATA +5 -2
  22. {nv_ingest-2025.9.15.dev20250915.dist-info → nv_ingest-2025.12.13.dev20251213.dist-info}/RECORD +25 -20
  23. {nv_ingest-2025.9.15.dev20250915.dist-info → nv_ingest-2025.12.13.dev20251213.dist-info}/WHEEL +0 -0
  24. {nv_ingest-2025.9.15.dev20250915.dist-info → nv_ingest-2025.12.13.dev20251213.dist-info}/licenses/LICENSE +0 -0
  25. {nv_ingest-2025.9.15.dev20250915.dist-info → nv_ingest-2025.12.13.dev20251213.dist-info}/top_level.txt +0 -0
@@ -64,20 +64,20 @@ stages:
64
64
  actor: "nv_ingest.framework.orchestration.ray.stages.extractors.pdf_extractor:PDFExtractorStage"
65
65
  config:
66
66
  pdfium_config:
67
- auth_token: $NGC_API_KEY|""
67
+ auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
68
68
  yolox_endpoints: [
69
69
  $YOLOX_GRPC_ENDPOINT|"page-elements:8001",
70
70
  $YOLOX_HTTP_ENDPOINT|"http://page-elements:8000/v1/infer",
71
71
  ]
72
72
  yolox_infer_protocol: $YOLOX_INFER_PROTOCOL|grpc
73
- nemoretriever_parse_config:
74
- auth_token: $NGC_API_KEY|""
75
- nemoretriever_parse_endpoints: [
76
- $NEMORETRIEVER_PARSE_GRPC_ENDPOINT|"",
77
- $NEMORETRIEVER_PARSE_HTTP_ENDPOINT|"http://nemoretriever-parse:8000/v1/chat/completions",
73
+ nemotron_parse_config:
74
+ auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
75
+ nemotron_parse_endpoints: [
76
+ $NEMOTRON_PARSE_GRPC_ENDPOINT|"",
77
+ $NEMOTRON_PARSE_HTTP_ENDPOINT|"http://nemotron-parse:8000/v1/chat/completions",
78
78
  ]
79
- nemoretriever_parse_infer_protocol: $NEMORETRIEVER_PARSE_INFER_PROTOCOL|http
80
- nemoretriever_parse_model_name: $NEMORETRIEVER_PARSE_MODEL_NAME|"nvidia/nemoretriever-parse"
79
+ nemotron_parse_infer_protocol: $NEMOTRON_PARSE_INFER_PROTOCOL|http
80
+ nemotron_parse_model_name: $NEMOTRON_PARSE_MODEL_NAME|"nvidia/nemotron-parse"
81
81
  yolox_endpoints: [
82
82
  $YOLOX_GRPC_ENDPOINT|"page-elements:8001",
83
83
  $YOLOX_HTTP_ENDPOINT|"http://page-elements:8000/v1/infer",
@@ -105,7 +105,7 @@ stages:
105
105
  ]
106
106
  function_id: $AUDIO_FUNCTION_ID|""
107
107
  audio_infer_protocol: $AUDIO_INFER_PROTOCOL|grpc
108
- auth_token: $NGC_API_KEY|""
108
+ auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
109
109
  replicas:
110
110
  min_replicas: 0
111
111
  max_replicas:
@@ -123,10 +123,17 @@ stages:
123
123
  docx_extraction_config:
124
124
  yolox_endpoints: [
125
125
  $YOLOX_GRPC_ENDPOINT|"page-elements:8001",
126
- $YOLOX_HTTP_ENDPOINT|"",
126
+ $YOLOX_HTTP_ENDPOINT|"http://page-elements:8000/v1/infer",
127
+ ]
128
+ yolox_infer_protocol: $YOLOX_INFER_PROTOCOL|grpc
129
+ auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
130
+ pdfium_config:
131
+ yolox_endpoints: [
132
+ $YOLOX_GRPC_ENDPOINT|"page-elements:8001",
133
+ $YOLOX_HTTP_ENDPOINT|"http://page-elements:8000/v1/infer",
127
134
  ]
128
135
  yolox_infer_protocol: $YOLOX_INFER_PROTOCOL|grpc
129
- auth_token: $NGC_API_KEY|""
136
+ auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
130
137
  replicas:
131
138
  min_replicas: 0
132
139
  max_replicas:
@@ -147,7 +154,14 @@ stages:
147
154
  $YOLOX_HTTP_ENDPOINT|"http://page-elements:8000/v1/infer",
148
155
  ]
149
156
  yolox_infer_protocol: $YOLOX_INFER_PROTOCOL|grpc
150
- auth_token: $NGC_API_KEY|""
157
+ auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
158
+ pdfium_config:
159
+ yolox_endpoints: [
160
+ $YOLOX_GRPC_ENDPOINT|"page-elements:8001",
161
+ $YOLOX_HTTP_ENDPOINT|"http://page-elements:8000/v1/infer",
162
+ ]
163
+ yolox_infer_protocol: $YOLOX_INFER_PROTOCOL|grpc
164
+ auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
151
165
  replicas:
152
166
  min_replicas: 0
153
167
  max_replicas:
@@ -168,7 +182,7 @@ stages:
168
182
  $YOLOX_HTTP_ENDPOINT|"http://page-elements:8000/v1/infer",
169
183
  ]
170
184
  yolox_infer_protocol: $YOLOX_INFER_PROTOCOL|grpc
171
- auth_token: $NGC_API_KEY|""
185
+ auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
172
186
  replicas:
173
187
  min_replicas: 0
174
188
  max_replicas:
@@ -192,6 +206,27 @@ stages:
192
206
  strategy: "static"
193
207
  value: 1
194
208
 
209
+ - name: "ocr_extractor"
210
+ type: "stage"
211
+ phase: 1 # EXTRACTION
212
+ actor: "nv_ingest.framework.orchestration.ray.stages.extractors.ocr_extractor:OCRExtractorStage"
213
+ config:
214
+ endpoint_config:
215
+ ocr_endpoints: [
216
+ $OCR_GRPC_ENDPOINT|"ocr:8001",
217
+ $OCR_HTTP_ENDPOINT|"http://ocr:8000/v1/infer",
218
+ ]
219
+ ocr_infer_protocol: $OCR_INFER_PROTOCOL|grpc
220
+ auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
221
+ replicas:
222
+ min_replicas: 0
223
+ max_replicas:
224
+ strategy: "static"
225
+ value: 4
226
+ static_replicas:
227
+ strategy: "static"
228
+ value: 3
229
+
195
230
  - name: "infographic_extractor"
196
231
  type: "stage"
197
232
  phase: 1 # EXTRACTION
@@ -203,7 +238,7 @@ stages:
203
238
  $OCR_HTTP_ENDPOINT|"http://ocr:8000/v1/infer",
204
239
  ]
205
240
  ocr_infer_protocol: $OCR_INFER_PROTOCOL|grpc
206
- auth_token: $NGC_API_KEY|""
241
+ auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
207
242
  replicas:
208
243
  min_replicas: 0
209
244
  max_replicas:
@@ -229,7 +264,7 @@ stages:
229
264
  $OCR_HTTP_ENDPOINT|"http://ocr:8000/v1/infer",
230
265
  ]
231
266
  ocr_infer_protocol: $OCR_INFER_PROTOCOL|grpc
232
- auth_token: $NGC_API_KEY|""
267
+ auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
233
268
  replicas:
234
269
  min_replicas: 0
235
270
  max_replicas:
@@ -256,7 +291,7 @@ stages:
256
291
  $OCR_HTTP_ENDPOINT|""
257
292
  ]
258
293
  ocr_infer_protocol: $OCR_INFER_PROTOCOL|grpc
259
- auth_token: $NGC_API_KEY|""
294
+ auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
260
295
  replicas:
261
296
  min_replicas: 0
262
297
  max_replicas:
@@ -316,9 +351,11 @@ stages:
316
351
  phase: 4 # TRANSFORM
317
352
  actor: "nv_ingest.framework.orchestration.ray.stages.transforms.image_caption:ImageCaptionTransformStage"
318
353
  config:
319
- api_key: $NGC_API_KEY|""
320
- model_name: $VLM_CAPTION_MODEL_NAME|"nvidia/llama-3.1-nemotron-nano-vl-8b-v1"
321
- prompt: "Caption the content of this image:"
354
+ api_key: $NGC_API_KEY|$NVIDIA_API_KEY
355
+ model_name: $VLM_CAPTION_MODEL_NAME|"nvidia/nemotron-nano-12b-v2-vl"
356
+ endpoint_url: $VLM_CAPTION_ENDPOINT|"http://vlm:8000/v1/chat/completions"
357
+ prompt: $VLM_CAPTION_PROMPT|"Caption the content of this image:"
358
+ system_prompt: $VLM_CAPTION_SYSTEM_PROMPT|"/no_think"
322
359
  replicas:
323
360
  min_replicas: 0
324
361
  max_replicas:
@@ -333,7 +370,7 @@ stages:
333
370
  phase: 4 # TRANSFORM
334
371
  actor: "nv_ingest.framework.orchestration.ray.stages.transforms.text_embed:TextEmbeddingTransformStage"
335
372
  config:
336
- api_key: $NGC_API_KEY|""
373
+ api_key: $NGC_API_KEY|$NVIDIA_API_KEY
337
374
  embedding_model: $EMBEDDING_NIM_MODEL_NAME|"nvidia/llama-3.2-nv-embedqa-1b-v2"
338
375
  embedding_nim_endpoint: $EMBEDDING_NIM_ENDPOINT|"http://embedding:8000/v1"
339
376
  replicas:
@@ -350,6 +387,9 @@ stages:
350
387
  type: "stage"
351
388
  phase: 5 # RESPONSE
352
389
  actor: "nv_ingest.framework.orchestration.ray.stages.storage.image_storage:ImageStorageStage"
390
+ config:
391
+ storage_uri: $IMAGE_STORAGE_URI|"s3://nv-ingest/artifacts/store/images"
392
+ public_base_url: $IMAGE_STORAGE_PUBLIC_BASE_URL|""
353
393
  replicas:
354
394
  min_replicas: 0
355
395
  max_replicas:
@@ -427,76 +467,79 @@ edges:
427
467
  # Intake
428
468
  - from: "source_stage"
429
469
  to: "metadata_injector"
430
- queue_size: 32
470
+ queue_size: 4
431
471
 
432
472
  # Document Extractors
433
473
  - from: "metadata_injector"
434
474
  to: "pdf_extractor"
435
- queue_size: 32
475
+ queue_size: 8
436
476
  - from: "pdf_extractor"
437
477
  to: "audio_extractor"
438
- queue_size: 32
478
+ queue_size: 4
439
479
  - from: "audio_extractor"
440
480
  to: "docx_extractor"
441
- queue_size: 32
481
+ queue_size: 4
442
482
  - from: "docx_extractor"
443
483
  to: "pptx_extractor"
444
- queue_size: 32
484
+ queue_size: 4
445
485
  - from: "pptx_extractor"
446
486
  to: "image_extractor"
447
- queue_size: 32
487
+ queue_size: 4
448
488
  - from: "image_extractor"
449
489
  to: "html_extractor"
450
- queue_size: 32
490
+ queue_size: 4
451
491
  - from: "html_extractor"
452
492
  to: "infographic_extractor"
453
- queue_size: 32
493
+ queue_size: 4
454
494
 
455
495
  # Primitive Extractors
456
496
  - from: "infographic_extractor"
457
497
  to: "table_extractor"
458
- queue_size: 32
498
+ queue_size: 4
459
499
  - from: "table_extractor"
460
500
  to: "chart_extractor"
461
- queue_size: 32
501
+ queue_size: 4
462
502
  - from: "chart_extractor"
503
+ to: "ocr_extractor"
504
+ queue_size: 8
505
+ - from: "ocr_extractor"
463
506
  to: "image_filter"
464
- queue_size: 32
507
+ queue_size: 4
465
508
 
466
509
  # Primitive Mutators
467
510
  - from: "image_filter"
468
511
  to: "image_dedup"
469
- queue_size: 32
512
+ queue_size: 4
470
513
  - from: "image_dedup"
471
514
  to: "text_splitter"
472
- queue_size: 32
515
+ queue_size: 4
473
516
 
474
517
  # Primitive Transforms
475
518
  - from: "text_splitter"
476
519
  to: "image_caption"
477
- queue_size: 32
520
+ queue_size: 4
478
521
  - from: "image_caption"
479
522
  to: "text_embedder"
480
- queue_size: 32
523
+ queue_size: 4
481
524
  - from: "text_embedder"
482
525
  to: "image_storage"
483
- queue_size: 32
526
+ queue_size: 4
484
527
 
485
528
  # Primitive Storage
486
529
  - from: "image_storage"
487
530
  to: "embedding_storage"
488
- queue_size: 32
531
+ queue_size: 4
489
532
  - from: "embedding_storage"
490
533
  to: "broker_response"
491
- queue_size: 32
534
+ queue_size: 4
492
535
 
493
536
  # Response and Telemetry
494
537
  - from: "broker_response"
495
538
  to: "otel_tracer"
496
- queue_size: 32
539
+ queue_size: 4
497
540
  - from: "otel_tracer"
498
541
  to: "default_drain"
499
- queue_size: 32
542
+ queue_size: 4
500
543
 
501
544
  # Pipeline Runtime Configuration
502
545
  pipeline:
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: nv-ingest
3
- Version: 2025.9.15.dev20250915
3
+ Version: 2025.12.13.dev20251213
4
4
  Summary: Python module for multimodal document ingestion
5
5
  Author-email: Jeremy Dyer <jdyer@nvidia.com>
6
6
  License: Apache License
@@ -219,16 +219,19 @@ Requires-Dist: diskcache>=5.6.3
219
219
  Requires-Dist: fastapi>=0.115.6
220
220
  Requires-Dist: fastparquet>=2024.11.0
221
221
  Requires-Dist: fsspec>=2024.10.0
222
+ Requires-Dist: universal_pathlib>=0.2.6
223
+ Requires-Dist: s3fs>=2024.10.0
222
224
  Requires-Dist: gunicorn
223
225
  Requires-Dist: h11>=0.16.0
224
226
  Requires-Dist: httpx>=0.28.1
225
227
  Requires-Dist: isodate>=0.7.2
226
228
  Requires-Dist: langdetect>=1.0.9
227
229
  Requires-Dist: minio>=7.2.12
228
- Requires-Dist: openai>=1.82.0
230
+ Requires-Dist: librosa>=0.10.2
229
231
  Requires-Dist: opentelemetry-api>=1.27.0
230
232
  Requires-Dist: opentelemetry-exporter-otlp>=1.27.0
231
233
  Requires-Dist: opentelemetry-sdk>=1.27.0
234
+ Requires-Dist: psutil>=7.1.0
232
235
  Requires-Dist: pydantic>2.0.0
233
236
  Requires-Dist: pydantic-settings>2.0.0
234
237
  Requires-Dist: pypdfium2==4.30.0
@@ -1,29 +1,33 @@
1
1
  nv_ingest/__init__.py,sha256=vJLPeuxiIHqbxXPJSu9qe3MS-GPavbOUExyRq83DxxM,895
2
2
  nv_ingest/version.py,sha256=MG7DxlzpnoJI56vqxwzs9WeMAEI3uPhfDiNLs6GN6wI,986
3
- nv_ingest/api/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
4
- nv_ingest/api/main.py,sha256=XE-p4lJp1E7CCDOB8ENtYFrf63Dtq2bzQiGxpRfL2LA,1603
3
+ nv_ingest/api/__init__.py,sha256=ED07QUqwVyJalH0ahhnnjvc2W_in6TpZZ5nJ6NWU9-Y,271
4
+ nv_ingest/api/main.py,sha256=uCCkUNLS1xE9TDYKDOdxEfo_9jQWumpQAPWrxj5m9Go,1706
5
+ nv_ingest/api/tracing.py,sha256=NkqMuUiB6ixGU5MYp3TrODsZDQepJ1kbH8JFHsYjuE0,2940
5
6
  nv_ingest/api/v1/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
6
7
  nv_ingest/api/v1/health.py,sha256=pV-RoVq5y0iBPp0qZoLzd1xKpd0JiHAi0UMyMj99LqU,4740
7
8
  nv_ingest/api/v1/ingest.py,sha256=LWk3LN4lBd3uO8h30EN42g3LHCVcO00avVd5ohVK7NI,19392
8
9
  nv_ingest/api/v1/metrics.py,sha256=ZGVRApYLnzc2f2C7wRgGd7deqiXan-jxfA-33a16clY,981
10
+ nv_ingest/api/v2/README.md,sha256=VhpdjEmCyr3qIOhwqISFx9C5WezJFcxYc-NB9S98HMg,7562
11
+ nv_ingest/api/v2/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
12
+ nv_ingest/api/v2/ingest.py,sha256=vjjb2xOOtlTVoTMc4rNdUI6yKYdEeR-umA_pwP_Rt64,53103
9
13
  nv_ingest/framework/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
10
14
  nv_ingest/framework/orchestration/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
11
15
  nv_ingest/framework/orchestration/execution/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
12
16
  nv_ingest/framework/orchestration/execution/helpers.py,sha256=-F8SZh7ISWtzJz6X1O2LQ133t-17Jxi8lL-NHz4rwj0,2818
13
17
  nv_ingest/framework/orchestration/execution/options.py,sha256=Ms1t4591EIv4ZrMRdhsCYPgLnMVXJosG3MURCbPXUoA,3983
14
18
  nv_ingest/framework/orchestration/process/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
15
- nv_ingest/framework/orchestration/process/dependent_services.py,sha256=ERf2M4O6pvbLDFrvayBHHL7M-FIwECeDEDTY3bi7MBg,2940
16
- nv_ingest/framework/orchestration/process/execution.py,sha256=P1kzpYV23e4QYrKw9Td1TCZK3CK1ENVqqnI_axRCqBk,19814
19
+ nv_ingest/framework/orchestration/process/dependent_services.py,sha256=s0j_rsFtCKHFIuvOkBe9NEAkPNPhSYse_ApeHka8gyg,3032
20
+ nv_ingest/framework/orchestration/process/execution.py,sha256=dkGldoudRsFl5wWAbvWnhGBv4ZYOpFOK5fXWncbPFIY,20149
17
21
  nv_ingest/framework/orchestration/process/lifecycle.py,sha256=L5NDwnzSMQPGjqJDC8jC75L1YqWey-dtK8N_HgBzb0E,8001
18
- nv_ingest/framework/orchestration/process/strategies.py,sha256=D7fdTPA7uuteoj6McA6hm1J5ArqoDdSZ7W6_ONDX7N0,7845
19
- nv_ingest/framework/orchestration/process/termination.py,sha256=_aI2ZzCasGfqwu0fcvufOlr1BGAay_Noxq5pAu67gv4,3593
22
+ nv_ingest/framework/orchestration/process/strategies.py,sha256=Q1Q04PPseF775omeS0FoXfK187NiS_bbqTaaJRwzKn8,7972
23
+ nv_ingest/framework/orchestration/process/termination.py,sha256=PAogFeW0FATFS6Mcp_UkZgq_SbWV18RtdZN-0NbComw,5042
20
24
  nv_ingest/framework/orchestration/ray/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
21
25
  nv_ingest/framework/orchestration/ray/edges/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
22
26
  nv_ingest/framework/orchestration/ray/edges/async_queue_edge.py,sha256=PQliU_kyGbO9o42njpb8FrDMLrbLqwZzmBNXifxyG5Y,2312
23
27
  nv_ingest/framework/orchestration/ray/edges/ray_queue_edge.py,sha256=VFii2yxJuikimOxie3edKq5JN06g78AF8bdHSHVX8p8,2677
24
28
  nv_ingest/framework/orchestration/ray/edges/threaded_queue_edge.py,sha256=N6NH4KgZJ60e_JkGRcSmfQtX37qtX4TMcavOR-n3heE,2549
25
29
  nv_ingest/framework/orchestration/ray/examples/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
26
- nv_ingest/framework/orchestration/ray/examples/pipeline_test_harness.py,sha256=hnRLybIpVTj3mXkLW0ErWVn4vRsInjNZmA80JqDiQuw,16473
30
+ nv_ingest/framework/orchestration/ray/examples/pipeline_test_harness.py,sha256=UMvrDMZmOu2FKa4W8oD_kpKDXgxYWSifdMbBGveyFh4,16373
27
31
  nv_ingest/framework/orchestration/ray/examples/task_source_harness.py,sha256=Yt7uxThg7s8WuMiaHLKC8r1XAG7QixegfkT-juE5oNw,1953
28
32
  nv_ingest/framework/orchestration/ray/examples/task_source_sink_harness.py,sha256=XkvsoIzH5ftXvAZ4ox7mxbx7ESVx6D8Xupcwbqgd52w,3277
29
33
  nv_ingest/framework/orchestration/ray/primitives/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
@@ -34,12 +38,13 @@ nv_ingest/framework/orchestration/ray/primitives/ray_pipeline.py,sha256=t9lf6zTj
34
38
  nv_ingest/framework/orchestration/ray/primitives/ray_stat_collector.py,sha256=GGY6_i6_g5xTFzdo9Qmsu9i4knMTq6pJfgm-aaPEt_o,17226
35
39
  nv_ingest/framework/orchestration/ray/stages/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
36
40
  nv_ingest/framework/orchestration/ray/stages/extractors/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
37
- nv_ingest/framework/orchestration/ray/stages/extractors/audio_extractor.py,sha256=4SdgvzI9oJ_OK5oWGir9wXVIPV4Pont2EKv9mwcWMC0,3631
41
+ nv_ingest/framework/orchestration/ray/stages/extractors/audio_extractor.py,sha256=UVp_kDmkaBlfO0Mbl_IxKq6imzLvs4-DKHgUHJIh3mo,3629
38
42
  nv_ingest/framework/orchestration/ray/stages/extractors/chart_extractor.py,sha256=rfaDx6PqRCguhSYkJI6iVmMMtAlJNxzKfUrLmw_fKqs,4381
39
43
  nv_ingest/framework/orchestration/ray/stages/extractors/docx_extractor.py,sha256=R4vshPcAUN2U6BIv8BCZQ862wLx8RJhCGXfpQ3K09Bs,3627
40
44
  nv_ingest/framework/orchestration/ray/stages/extractors/html_extractor.py,sha256=7JrZSVIrK4_wr2s7TOTss7pgTY2F9GPQ7Ze3F_WFlKU,3642
41
45
  nv_ingest/framework/orchestration/ray/stages/extractors/image_extractor.py,sha256=iY9fEfucfgCmO2ixX6qwn418J97nJz_FQGh7B6yziVo,3980
42
46
  nv_ingest/framework/orchestration/ray/stages/extractors/infographic_extractor.py,sha256=v5J7dnJBEaDfjoTz_N_yC3RAt6lwMLgLT28V-ahquLE,3261
47
+ nv_ingest/framework/orchestration/ray/stages/extractors/ocr_extractor.py,sha256=pwVoA5-CF9GVWusoFZOMGBvSyW5udD9bdxVJXA_SghE,3188
43
48
  nv_ingest/framework/orchestration/ray/stages/extractors/pdf_extractor.py,sha256=QagIA99AsHLihjRbXm-2BphdoQGHwzOHlqLyz7oDOSk,4992
44
49
  nv_ingest/framework/orchestration/ray/stages/extractors/pptx_extractor.py,sha256=RMbbl7Cuj4BT-TcgUx_0k8R-DLdw-o3fHxcIBIgrWt4,3776
45
50
  nv_ingest/framework/orchestration/ray/stages/extractors/table_extractor.py,sha256=p71ktv6v5T-9npYpCbgbwW6-fS-65UWS7rCm8OWr2Bc,4170
@@ -57,9 +62,9 @@ nv_ingest/framework/orchestration/ray/stages/sinks/__init__.py,sha256=wQSlVx3T14
57
62
  nv_ingest/framework/orchestration/ray/stages/sinks/default_drain.py,sha256=_USW1Vq8G2Wn-QFdPfFQCrtKG46hHeJvkEGbBxdpbVM,1488
58
63
  nv_ingest/framework/orchestration/ray/stages/sinks/message_broker_task_sink.py,sha256=QcvMQXIJ7EWIxty76Mo5Xv38Oj6X2KuS8qXQlf7E1uA,11676
59
64
  nv_ingest/framework/orchestration/ray/stages/sources/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
60
- nv_ingest/framework/orchestration/ray/stages/sources/message_broker_task_source.py,sha256=Qm9XtTNX2CcUAlZRw33BS3Ql0djcsMGp52FPA2zHu3Q,22340
65
+ nv_ingest/framework/orchestration/ray/stages/sources/message_broker_task_source.py,sha256=LrqaWpWyuiAHlpXWKYSyHZJBFegGXfNlpCXrucbK5NM,24067
61
66
  nv_ingest/framework/orchestration/ray/stages/storage/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
62
- nv_ingest/framework/orchestration/ray/stages/storage/image_storage.py,sha256=WZN_-3Li-izDaPtk8IMrtn2os1ckT3U8Rb2PsfOWrcI,4009
67
+ nv_ingest/framework/orchestration/ray/stages/storage/image_storage.py,sha256=f1iA7rjYFA1G1EXqFM6URUi_QRql1Y1OrnMPKONsSqo,6907
63
68
  nv_ingest/framework/orchestration/ray/stages/storage/store_embeddings.py,sha256=EUtwhSDf-qGLVEhWEInr1VaLsvpcHUSyzCmHQVai-Ps,3547
64
69
  nv_ingest/framework/orchestration/ray/stages/telemetry/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
65
70
  nv_ingest/framework/orchestration/ray/stages/telemetry/job_counter.py,sha256=jEtEUibqs6IS6QakrzWY9zmxSUzuBpg_hzXy2R-I10Y,2870
@@ -75,7 +80,7 @@ nv_ingest/framework/orchestration/ray/util/__init__.py,sha256=wQSlVx3T14ZgQAt-EP
75
80
  nv_ingest/framework/orchestration/ray/util/env_config.py,sha256=GN9msJ_3jdOBIAPnXNxX0ds_BKtHRnRhnYxwzcAU2KY,2386
76
81
  nv_ingest/framework/orchestration/ray/util/pipeline/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
77
82
  nv_ingest/framework/orchestration/ray/util/pipeline/pid_controller.py,sha256=0dSDVTv3FXjMZ79sQh4i4YEwnqND5iPw8GAeZI0oJO4,47338
78
- nv_ingest/framework/orchestration/ray/util/pipeline/pipeline_runners.py,sha256=zWi-6-7dfb_3R00uVi3wdYMH1HgeevkBkg47UY8QqUQ,4386
83
+ nv_ingest/framework/orchestration/ray/util/pipeline/pipeline_runners.py,sha256=yisg0iRC5ss__Sg2HfJBQvqq2qJ_bj288go8FSMc2Zs,6020
79
84
  nv_ingest/framework/orchestration/ray/util/pipeline/tools.py,sha256=MzxLjElEVb6C5ghfJ7GCp8uqNZeVuzz8xJnxzdQmOsI,8425
80
85
  nv_ingest/framework/orchestration/ray/util/system_tools/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
81
86
  nv_ingest/framework/orchestration/ray/util/system_tools/memory.py,sha256=ICqY0LLB3hFTZk03iX5yffMSKFH2q_aQomtDVzS_mKw,2228
@@ -99,22 +104,22 @@ nv_ingest/framework/util/flow_control/udf_intercept.py,sha256=zQ9uuCcHLEd0P52Eiw
99
104
  nv_ingest/framework/util/service/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
100
105
  nv_ingest/framework/util/service/impl/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
101
106
  nv_ingest/framework/util/service/impl/ingest/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
102
- nv_ingest/framework/util/service/impl/ingest/redis_ingest_service.py,sha256=KbzQFo7qVbCITiKYVPcGN0x4NI8piJy70Dz-8jf59Xs,15415
107
+ nv_ingest/framework/util/service/impl/ingest/redis_ingest_service.py,sha256=59P-BMWnFY37GJm5w23-TMxgLhiZGZpJogC0gjDBaTA,23835
103
108
  nv_ingest/framework/util/service/meta/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
104
109
  nv_ingest/framework/util/service/meta/ingest/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
105
110
  nv_ingest/framework/util/service/meta/ingest/ingest_service_meta.py,sha256=QS3uNxWBl5dIcmIpJKNe8_TLcTUuN2vcKyHeAwa-eSo,1589
106
111
  nv_ingest/framework/util/telemetry/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
107
112
  nv_ingest/framework/util/telemetry/global_stats.py,sha256=nq65pEEdiwjAfGiqsxG1CeQMC96O3CfQxsZuGFCY-ds,4554
108
113
  nv_ingest/pipeline/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
109
- nv_ingest/pipeline/default_libmode_pipeline_impl.py,sha256=jcpTTC3yPt77EvNSyXxdnRryHLKQ2cMTMAo_0ZuLSNg,15450
110
- nv_ingest/pipeline/default_pipeline_impl.py,sha256=Vlui2jk27DFD9lPX_FYLPzPGIfk1AqRvbcf5lGZeQPE,15145
114
+ nv_ingest/pipeline/default_libmode_pipeline_impl.py,sha256=YYASfM68qNhGL5PcK0Fv72qmRZfE2TtY3cq2Oz-L478,16267
115
+ nv_ingest/pipeline/default_pipeline_impl.py,sha256=6SykgH_LJ8uuE2jrWGIT7OkJP6EjPyB8Ju6LMDu5IK0,16800
111
116
  nv_ingest/pipeline/ingest_pipeline.py,sha256=wHAJhqAM2s8nbY-8itVogmSU-yVN4PZONGWcKnhzgfg,17794
112
117
  nv_ingest/pipeline/pipeline_schema.py,sha256=rLZZz2It2o2hVNWrZUJU8CarrqRei1fho3ZEMkkoBcg,17940
113
118
  nv_ingest/pipeline/config/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
114
119
  nv_ingest/pipeline/config/loaders.py,sha256=75Yr9WYO7j7ghvKTnYLfZXQZEH3J3VEZo5J4TunC_Us,7590
115
- nv_ingest/pipeline/config/replica_resolver.py,sha256=3zjh8gmepEYORFZRM4inq7GoBW0YL3gzUDiixUugjzQ,8899
116
- nv_ingest-2025.9.15.dev20250915.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
117
- nv_ingest-2025.9.15.dev20250915.dist-info/METADATA,sha256=d2iY-cbHAvrbxBaVbYIjn9PUPP06Ky6HBDeFw6WN11I,15061
118
- nv_ingest-2025.9.15.dev20250915.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
119
- nv_ingest-2025.9.15.dev20250915.dist-info/top_level.txt,sha256=sjb0ajIsgn3YgftSjZHlYO0HjYAIIhNuXG_AmywCvaU,10
120
- nv_ingest-2025.9.15.dev20250915.dist-info/RECORD,,
120
+ nv_ingest/pipeline/config/replica_resolver.py,sha256=dEwqMXNttfw0QeisTGGkp24785jqzVCDAEFyQIffeGc,9369
121
+ nv_ingest-2025.12.13.dev20251213.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
122
+ nv_ingest-2025.12.13.dev20251213.dist-info/METADATA,sha256=lnUtBJCrO_1d6sSsKrQBxp6BYlDPn2offXNBVHayW7o,15163
123
+ nv_ingest-2025.12.13.dev20251213.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
124
+ nv_ingest-2025.12.13.dev20251213.dist-info/top_level.txt,sha256=sjb0ajIsgn3YgftSjZHlYO0HjYAIIhNuXG_AmywCvaU,10
125
+ nv_ingest-2025.12.13.dev20251213.dist-info/RECORD,,