nv-ingest 2025.8.16.dev20250816__py3-none-any.whl → 2025.11.21.dev20251121__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- nv_ingest/api/__init__.py +6 -0
- nv_ingest/api/main.py +2 -0
- nv_ingest/api/tracing.py +82 -0
- nv_ingest/api/v2/README.md +203 -0
- nv_ingest/api/v2/__init__.py +3 -0
- nv_ingest/api/v2/ingest.py +1300 -0
- nv_ingest/framework/orchestration/process/dependent_services.py +43 -14
- nv_ingest/framework/orchestration/process/execution.py +92 -94
- nv_ingest/framework/orchestration/process/lifecycle.py +98 -6
- nv_ingest/framework/orchestration/process/strategies.py +41 -5
- nv_ingest/framework/orchestration/process/termination.py +147 -0
- nv_ingest/framework/orchestration/ray/examples/pipeline_test_harness.py +2 -2
- nv_ingest/framework/orchestration/ray/primitives/ray_pipeline.py +9 -15
- nv_ingest/framework/orchestration/ray/stages/extractors/audio_extractor.py +2 -3
- nv_ingest/framework/orchestration/ray/stages/extractors/chart_extractor.py +5 -2
- nv_ingest/framework/orchestration/ray/stages/extractors/docx_extractor.py +2 -1
- nv_ingest/framework/orchestration/ray/stages/extractors/html_extractor.py +2 -1
- nv_ingest/framework/orchestration/ray/stages/extractors/image_extractor.py +2 -1
- nv_ingest/framework/orchestration/ray/stages/extractors/ocr_extractor.py +71 -0
- nv_ingest/framework/orchestration/ray/stages/extractors/pdf_extractor.py +5 -2
- nv_ingest/framework/orchestration/ray/stages/extractors/table_extractor.py +2 -1
- nv_ingest/framework/orchestration/ray/stages/injectors/metadata_injector.py +2 -1
- nv_ingest/framework/orchestration/ray/stages/mutate/image_dedup.py +2 -1
- nv_ingest/framework/orchestration/ray/stages/mutate/image_filter.py +2 -1
- nv_ingest/framework/orchestration/ray/stages/sources/message_broker_task_source.py +46 -9
- nv_ingest/framework/orchestration/ray/stages/storage/store_embeddings.py +2 -1
- nv_ingest/framework/orchestration/ray/stages/transforms/image_caption.py +5 -1
- nv_ingest/framework/orchestration/ray/stages/transforms/text_embed.py +5 -1
- nv_ingest/framework/orchestration/ray/stages/transforms/text_splitter.py +4 -3
- nv_ingest/framework/util/service/impl/ingest/redis_ingest_service.py +215 -11
- nv_ingest/pipeline/config/loaders.py +33 -2
- nv_ingest/pipeline/default_libmode_pipeline_impl.py +514 -0
- nv_ingest/pipeline/default_pipeline_impl.py +111 -88
- {nv_ingest-2025.8.16.dev20250816.dist-info → nv_ingest-2025.11.21.dev20251121.dist-info}/METADATA +4 -3
- {nv_ingest-2025.8.16.dev20250816.dist-info → nv_ingest-2025.11.21.dev20251121.dist-info}/RECORD +38 -31
- {nv_ingest-2025.8.16.dev20250816.dist-info → nv_ingest-2025.11.21.dev20251121.dist-info}/WHEEL +0 -0
- {nv_ingest-2025.8.16.dev20250816.dist-info → nv_ingest-2025.11.21.dev20251121.dist-info}/licenses/LICENSE +0 -0
- {nv_ingest-2025.8.16.dev20250816.dist-info → nv_ingest-2025.11.21.dev20251121.dist-info}/top_level.txt +0 -0
|
@@ -7,17 +7,17 @@
|
|
|
7
7
|
# pylint: disable=line-too-long
|
|
8
8
|
|
|
9
9
|
"""
|
|
10
|
-
Default pipeline implementation
|
|
10
|
+
Default pipeline implementation (runtime default).
|
|
11
11
|
|
|
12
|
-
This module
|
|
13
|
-
|
|
12
|
+
This module embeds the exact contents of config/default_pipeline.yaml so code can
|
|
13
|
+
load the default pipeline without reading the YAML file at runtime.
|
|
14
14
|
"""
|
|
15
15
|
|
|
16
|
-
|
|
16
|
+
DEFAULT_PIPELINE_YAML = """# Default Ingestion Pipeline Configuration
|
|
17
17
|
# This file replicates the static pipeline defined in pipeline_builders.py
|
|
18
18
|
|
|
19
|
-
name: "NVIngest default
|
|
20
|
-
description: "This is the default ingestion pipeline for NVIngest
|
|
19
|
+
name: "NVIngest default pipeline"
|
|
20
|
+
description: "This is the default ingestion pipeline for NVIngest"
|
|
21
21
|
stages:
|
|
22
22
|
# Source
|
|
23
23
|
- name: "source_stage"
|
|
@@ -26,20 +26,19 @@ stages:
|
|
|
26
26
|
actor: "nv_ingest.framework.orchestration.ray.stages.sources.message_broker_task_source:MessageBrokerTaskSourceStage"
|
|
27
27
|
config:
|
|
28
28
|
broker_client:
|
|
29
|
-
client_type: "
|
|
30
|
-
host: $MESSAGE_CLIENT_HOST|"
|
|
31
|
-
port: $MESSAGE_CLIENT_PORT|
|
|
29
|
+
client_type: $MESSAGE_CLIENT_TYPE|"redis"
|
|
30
|
+
host: $MESSAGE_CLIENT_HOST|"redis"
|
|
31
|
+
port: $MESSAGE_CLIENT_PORT|6379
|
|
32
32
|
task_queue: "ingest_task_queue"
|
|
33
33
|
poll_interval: 0.1
|
|
34
34
|
replicas:
|
|
35
|
-
min_replicas:
|
|
35
|
+
min_replicas: 1
|
|
36
36
|
max_replicas:
|
|
37
37
|
strategy: "static"
|
|
38
38
|
value: 1
|
|
39
39
|
static_replicas:
|
|
40
40
|
strategy: "static"
|
|
41
41
|
value: 1
|
|
42
|
-
runs_after: []
|
|
43
42
|
|
|
44
43
|
# Pre-processing
|
|
45
44
|
- name: "metadata_injector"
|
|
@@ -65,25 +64,25 @@ stages:
|
|
|
65
64
|
actor: "nv_ingest.framework.orchestration.ray.stages.extractors.pdf_extractor:PDFExtractorStage"
|
|
66
65
|
config:
|
|
67
66
|
pdfium_config:
|
|
68
|
-
auth_token: $NGC_API_KEY
|
|
67
|
+
auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
|
|
69
68
|
yolox_endpoints: [
|
|
70
|
-
$YOLOX_GRPC_ENDPOINT|"",
|
|
71
|
-
$YOLOX_HTTP_ENDPOINT|"
|
|
69
|
+
$YOLOX_GRPC_ENDPOINT|"page-elements:8001",
|
|
70
|
+
$YOLOX_HTTP_ENDPOINT|"http://page-elements:8000/v1/infer",
|
|
72
71
|
]
|
|
73
|
-
yolox_infer_protocol: $YOLOX_INFER_PROTOCOL|
|
|
72
|
+
yolox_infer_protocol: $YOLOX_INFER_PROTOCOL|grpc
|
|
74
73
|
nemoretriever_parse_config:
|
|
75
|
-
auth_token: $NGC_API_KEY
|
|
74
|
+
auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
|
|
76
75
|
nemoretriever_parse_endpoints: [
|
|
77
76
|
$NEMORETRIEVER_PARSE_GRPC_ENDPOINT|"",
|
|
78
|
-
$NEMORETRIEVER_PARSE_HTTP_ENDPOINT|"
|
|
77
|
+
$NEMORETRIEVER_PARSE_HTTP_ENDPOINT|"http://nemoretriever-parse:8000/v1/chat/completions",
|
|
79
78
|
]
|
|
80
79
|
nemoretriever_parse_infer_protocol: $NEMORETRIEVER_PARSE_INFER_PROTOCOL|http
|
|
81
80
|
nemoretriever_parse_model_name: $NEMORETRIEVER_PARSE_MODEL_NAME|"nvidia/nemoretriever-parse"
|
|
82
81
|
yolox_endpoints: [
|
|
83
|
-
$YOLOX_GRPC_ENDPOINT|"",
|
|
84
|
-
$YOLOX_HTTP_ENDPOINT|"
|
|
82
|
+
$YOLOX_GRPC_ENDPOINT|"page-elements:8001",
|
|
83
|
+
$YOLOX_HTTP_ENDPOINT|"http://page-elements:8000/v1/infer",
|
|
85
84
|
]
|
|
86
|
-
yolox_infer_protocol: $YOLOX_INFER_PROTOCOL|
|
|
85
|
+
yolox_infer_protocol: $YOLOX_INFER_PROTOCOL|grpc
|
|
87
86
|
replicas:
|
|
88
87
|
min_replicas: 0
|
|
89
88
|
max_replicas:
|
|
@@ -101,12 +100,12 @@ stages:
|
|
|
101
100
|
config:
|
|
102
101
|
audio_extraction_config:
|
|
103
102
|
audio_endpoints: [
|
|
104
|
-
$AUDIO_GRPC_ENDPOINT|"
|
|
105
|
-
$AUDIO_HTTP_ENDPOINT|""
|
|
103
|
+
$AUDIO_GRPC_ENDPOINT|"audio:50051",
|
|
104
|
+
$AUDIO_HTTP_ENDPOINT|"",
|
|
106
105
|
]
|
|
107
|
-
function_id: $AUDIO_FUNCTION_ID|"
|
|
106
|
+
function_id: $AUDIO_FUNCTION_ID|""
|
|
108
107
|
audio_infer_protocol: $AUDIO_INFER_PROTOCOL|grpc
|
|
109
|
-
auth_token: $NGC_API_KEY
|
|
108
|
+
auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
|
|
110
109
|
replicas:
|
|
111
110
|
min_replicas: 0
|
|
112
111
|
max_replicas:
|
|
@@ -123,11 +122,11 @@ stages:
|
|
|
123
122
|
config:
|
|
124
123
|
docx_extraction_config:
|
|
125
124
|
yolox_endpoints: [
|
|
126
|
-
$YOLOX_GRPC_ENDPOINT|"",
|
|
127
|
-
$YOLOX_HTTP_ENDPOINT|"
|
|
125
|
+
$YOLOX_GRPC_ENDPOINT|"page-elements:8001",
|
|
126
|
+
$YOLOX_HTTP_ENDPOINT|"",
|
|
128
127
|
]
|
|
129
|
-
yolox_infer_protocol: $YOLOX_INFER_PROTOCOL|
|
|
130
|
-
auth_token: $NGC_API_KEY
|
|
128
|
+
yolox_infer_protocol: $YOLOX_INFER_PROTOCOL|grpc
|
|
129
|
+
auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
|
|
131
130
|
replicas:
|
|
132
131
|
min_replicas: 0
|
|
133
132
|
max_replicas:
|
|
@@ -144,11 +143,11 @@ stages:
|
|
|
144
143
|
config:
|
|
145
144
|
pptx_extraction_config:
|
|
146
145
|
yolox_endpoints: [
|
|
147
|
-
$YOLOX_GRPC_ENDPOINT|"",
|
|
148
|
-
$YOLOX_HTTP_ENDPOINT|"
|
|
146
|
+
$YOLOX_GRPC_ENDPOINT|"page-elements:8001",
|
|
147
|
+
$YOLOX_HTTP_ENDPOINT|"http://page-elements:8000/v1/infer",
|
|
149
148
|
]
|
|
150
|
-
yolox_infer_protocol: $YOLOX_INFER_PROTOCOL|
|
|
151
|
-
auth_token: $NGC_API_KEY
|
|
149
|
+
yolox_infer_protocol: $YOLOX_INFER_PROTOCOL|grpc
|
|
150
|
+
auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
|
|
152
151
|
replicas:
|
|
153
152
|
min_replicas: 0
|
|
154
153
|
max_replicas:
|
|
@@ -165,11 +164,11 @@ stages:
|
|
|
165
164
|
config:
|
|
166
165
|
image_extraction_config:
|
|
167
166
|
yolox_endpoints: [
|
|
168
|
-
$YOLOX_GRPC_ENDPOINT|"",
|
|
169
|
-
$YOLOX_HTTP_ENDPOINT|"
|
|
167
|
+
$YOLOX_GRPC_ENDPOINT|"page-elements:8001",
|
|
168
|
+
$YOLOX_HTTP_ENDPOINT|"http://page-elements:8000/v1/infer",
|
|
170
169
|
]
|
|
171
|
-
yolox_infer_protocol: $YOLOX_INFER_PROTOCOL|
|
|
172
|
-
auth_token: $NGC_API_KEY
|
|
170
|
+
yolox_infer_protocol: $YOLOX_INFER_PROTOCOL|grpc
|
|
171
|
+
auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
|
|
173
172
|
replicas:
|
|
174
173
|
min_replicas: 0
|
|
175
174
|
max_replicas:
|
|
@@ -193,6 +192,27 @@ stages:
|
|
|
193
192
|
strategy: "static"
|
|
194
193
|
value: 1
|
|
195
194
|
|
|
195
|
+
- name: "ocr_extractor"
|
|
196
|
+
type: "stage"
|
|
197
|
+
phase: 1 # EXTRACTION
|
|
198
|
+
actor: "nv_ingest.framework.orchestration.ray.stages.extractors.ocr_extractor:OCRExtractorStage"
|
|
199
|
+
config:
|
|
200
|
+
endpoint_config:
|
|
201
|
+
ocr_endpoints: [
|
|
202
|
+
$OCR_GRPC_ENDPOINT|"ocr:8001",
|
|
203
|
+
$OCR_HTTP_ENDPOINT|"http://ocr:8000/v1/infer",
|
|
204
|
+
]
|
|
205
|
+
ocr_infer_protocol: $OCR_INFER_PROTOCOL|grpc
|
|
206
|
+
auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
|
|
207
|
+
replicas:
|
|
208
|
+
min_replicas: 0
|
|
209
|
+
max_replicas:
|
|
210
|
+
strategy: "static"
|
|
211
|
+
value: 4
|
|
212
|
+
static_replicas:
|
|
213
|
+
strategy: "static"
|
|
214
|
+
value: 3
|
|
215
|
+
|
|
196
216
|
- name: "infographic_extractor"
|
|
197
217
|
type: "stage"
|
|
198
218
|
phase: 1 # EXTRACTION
|
|
@@ -200,11 +220,11 @@ stages:
|
|
|
200
220
|
config:
|
|
201
221
|
endpoint_config:
|
|
202
222
|
ocr_endpoints: [
|
|
203
|
-
$OCR_GRPC_ENDPOINT|"
|
|
204
|
-
$OCR_HTTP_ENDPOINT|""
|
|
223
|
+
$OCR_GRPC_ENDPOINT|"ocr:8001",
|
|
224
|
+
$OCR_HTTP_ENDPOINT|"http://ocr:8000/v1/infer",
|
|
205
225
|
]
|
|
206
226
|
ocr_infer_protocol: $OCR_INFER_PROTOCOL|grpc
|
|
207
|
-
auth_token: $NGC_API_KEY
|
|
227
|
+
auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
|
|
208
228
|
replicas:
|
|
209
229
|
min_replicas: 0
|
|
210
230
|
max_replicas:
|
|
@@ -221,16 +241,16 @@ stages:
|
|
|
221
241
|
config:
|
|
222
242
|
endpoint_config:
|
|
223
243
|
yolox_endpoints: [
|
|
224
|
-
$YOLOX_TABLE_STRUCTURE_GRPC_ENDPOINT|"",
|
|
225
|
-
$YOLOX_TABLE_STRUCTURE_HTTP_ENDPOINT|"
|
|
244
|
+
$YOLOX_TABLE_STRUCTURE_GRPC_ENDPOINT|"table-structure:8001",
|
|
245
|
+
$YOLOX_TABLE_STRUCTURE_HTTP_ENDPOINT|"http://table-structure:8000/v1/infer",
|
|
226
246
|
]
|
|
227
|
-
yolox_infer_protocol: $YOLOX_TABLE_STRUCTURE_INFER_PROTOCOL|
|
|
247
|
+
yolox_infer_protocol: $YOLOX_TABLE_STRUCTURE_INFER_PROTOCOL|grpc
|
|
228
248
|
ocr_endpoints: [
|
|
229
|
-
$OCR_GRPC_ENDPOINT|"",
|
|
230
|
-
$OCR_HTTP_ENDPOINT|"
|
|
249
|
+
$OCR_GRPC_ENDPOINT|"ocr:8001",
|
|
250
|
+
$OCR_HTTP_ENDPOINT|"http://ocr:8000/v1/infer",
|
|
231
251
|
]
|
|
232
|
-
ocr_infer_protocol: $
|
|
233
|
-
auth_token: $NGC_API_KEY
|
|
252
|
+
ocr_infer_protocol: $OCR_INFER_PROTOCOL|grpc
|
|
253
|
+
auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
|
|
234
254
|
replicas:
|
|
235
255
|
min_replicas: 0
|
|
236
256
|
max_replicas:
|
|
@@ -248,16 +268,16 @@ stages:
|
|
|
248
268
|
config:
|
|
249
269
|
endpoint_config:
|
|
250
270
|
yolox_endpoints: [
|
|
251
|
-
$YOLOX_GRAPHIC_ELEMENTS_GRPC_ENDPOINT|"",
|
|
252
|
-
$YOLOX_GRAPHIC_ELEMENTS_HTTP_ENDPOINT|"
|
|
271
|
+
$YOLOX_GRAPHIC_ELEMENTS_GRPC_ENDPOINT|"graphic-elements:8001",
|
|
272
|
+
$YOLOX_GRAPHIC_ELEMENTS_HTTP_ENDPOINT|""
|
|
253
273
|
]
|
|
254
|
-
yolox_infer_protocol: $YOLOX_GRAPHIC_ELEMENTS_INFER_PROTOCOL|
|
|
274
|
+
yolox_infer_protocol: $YOLOX_GRAPHIC_ELEMENTS_INFER_PROTOCOL|grpc
|
|
255
275
|
ocr_endpoints: [
|
|
256
|
-
$OCR_GRPC_ENDPOINT|"",
|
|
257
|
-
$OCR_HTTP_ENDPOINT|"
|
|
276
|
+
$OCR_GRPC_ENDPOINT|"ocr:8001",
|
|
277
|
+
$OCR_HTTP_ENDPOINT|""
|
|
258
278
|
]
|
|
259
|
-
ocr_infer_protocol: $OCR_INFER_PROTOCOL|
|
|
260
|
-
auth_token: $NGC_API_KEY
|
|
279
|
+
ocr_infer_protocol: $OCR_INFER_PROTOCOL|grpc
|
|
280
|
+
auth_token: $NGC_API_KEY|$NVIDIA_API_KEY
|
|
261
281
|
replicas:
|
|
262
282
|
min_replicas: 0
|
|
263
283
|
max_replicas:
|
|
@@ -317,9 +337,9 @@ stages:
|
|
|
317
337
|
phase: 4 # TRANSFORM
|
|
318
338
|
actor: "nv_ingest.framework.orchestration.ray.stages.transforms.image_caption:ImageCaptionTransformStage"
|
|
319
339
|
config:
|
|
320
|
-
api_key: $NGC_API_KEY
|
|
321
|
-
|
|
322
|
-
|
|
340
|
+
api_key: $NGC_API_KEY|$NVIDIA_API_KEY
|
|
341
|
+
model_name: $VLM_CAPTION_MODEL_NAME|"nvidia/nemotron-nano-12b-v2-vl"
|
|
342
|
+
endpoint_url: $VLM_CAPTION_ENDPOINT|"http://vlm:8000/v1/chat/completions"
|
|
323
343
|
prompt: "Caption the content of this image:"
|
|
324
344
|
replicas:
|
|
325
345
|
min_replicas: 0
|
|
@@ -335,17 +355,17 @@ stages:
|
|
|
335
355
|
phase: 4 # TRANSFORM
|
|
336
356
|
actor: "nv_ingest.framework.orchestration.ray.stages.transforms.text_embed:TextEmbeddingTransformStage"
|
|
337
357
|
config:
|
|
338
|
-
api_key: $NGC_API_KEY
|
|
358
|
+
api_key: $NGC_API_KEY|$NVIDIA_API_KEY
|
|
339
359
|
embedding_model: $EMBEDDING_NIM_MODEL_NAME|"nvidia/llama-3.2-nv-embedqa-1b-v2"
|
|
340
|
-
embedding_nim_endpoint: $EMBEDDING_NIM_ENDPOINT|"
|
|
360
|
+
embedding_nim_endpoint: $EMBEDDING_NIM_ENDPOINT|"http://embedding:8000/v1"
|
|
341
361
|
replicas:
|
|
342
362
|
min_replicas: 0
|
|
343
363
|
max_replicas:
|
|
344
364
|
strategy: "static"
|
|
345
|
-
value:
|
|
365
|
+
value: 4
|
|
346
366
|
static_replicas:
|
|
347
367
|
strategy: "static"
|
|
348
|
-
value:
|
|
368
|
+
value: 3
|
|
349
369
|
|
|
350
370
|
# Storage and Output
|
|
351
371
|
- name: "image_storage"
|
|
@@ -380,9 +400,10 @@ stages:
|
|
|
380
400
|
actor: "nv_ingest.framework.orchestration.ray.stages.sinks.message_broker_task_sink:MessageBrokerTaskSinkStage"
|
|
381
401
|
config:
|
|
382
402
|
broker_client:
|
|
383
|
-
client_type: "
|
|
384
|
-
host:
|
|
385
|
-
port:
|
|
403
|
+
client_type: $MESSAGE_CLIENT_TYPE|"redis"
|
|
404
|
+
host: $MESSAGE_CLIENT_HOST|localhost
|
|
405
|
+
port: $MESSAGE_CLIENT_PORT|6379
|
|
406
|
+
poll_interval: 0.1
|
|
386
407
|
replicas:
|
|
387
408
|
min_replicas: 1
|
|
388
409
|
max_replicas:
|
|
@@ -416,7 +437,7 @@ stages:
|
|
|
416
437
|
actor: "nv_ingest.framework.orchestration.ray.stages.sinks.default_drain:DefaultDrainSink"
|
|
417
438
|
config: {}
|
|
418
439
|
replicas:
|
|
419
|
-
min_replicas:
|
|
440
|
+
min_replicas: 1
|
|
420
441
|
max_replicas:
|
|
421
442
|
strategy: "static"
|
|
422
443
|
value: 1
|
|
@@ -428,83 +449,85 @@ edges:
|
|
|
428
449
|
# Intake
|
|
429
450
|
- from: "source_stage"
|
|
430
451
|
to: "metadata_injector"
|
|
431
|
-
queue_size:
|
|
452
|
+
queue_size: 4
|
|
432
453
|
|
|
433
454
|
# Document Extractors
|
|
434
455
|
- from: "metadata_injector"
|
|
435
456
|
to: "pdf_extractor"
|
|
436
|
-
queue_size:
|
|
457
|
+
queue_size: 8
|
|
437
458
|
- from: "pdf_extractor"
|
|
438
459
|
to: "audio_extractor"
|
|
439
|
-
queue_size:
|
|
460
|
+
queue_size: 4
|
|
440
461
|
- from: "audio_extractor"
|
|
441
462
|
to: "docx_extractor"
|
|
442
|
-
queue_size:
|
|
463
|
+
queue_size: 4
|
|
443
464
|
- from: "docx_extractor"
|
|
444
465
|
to: "pptx_extractor"
|
|
445
|
-
queue_size:
|
|
466
|
+
queue_size: 4
|
|
446
467
|
- from: "pptx_extractor"
|
|
447
468
|
to: "image_extractor"
|
|
448
|
-
queue_size:
|
|
469
|
+
queue_size: 4
|
|
449
470
|
- from: "image_extractor"
|
|
450
471
|
to: "html_extractor"
|
|
451
|
-
queue_size:
|
|
472
|
+
queue_size: 4
|
|
452
473
|
- from: "html_extractor"
|
|
453
474
|
to: "infographic_extractor"
|
|
454
|
-
queue_size:
|
|
475
|
+
queue_size: 4
|
|
455
476
|
|
|
456
477
|
# Primitive Extractors
|
|
457
478
|
- from: "infographic_extractor"
|
|
458
479
|
to: "table_extractor"
|
|
459
|
-
queue_size:
|
|
480
|
+
queue_size: 4
|
|
460
481
|
- from: "table_extractor"
|
|
461
482
|
to: "chart_extractor"
|
|
462
|
-
queue_size:
|
|
483
|
+
queue_size: 4
|
|
463
484
|
- from: "chart_extractor"
|
|
485
|
+
to: "ocr_extractor"
|
|
486
|
+
queue_size: 8
|
|
487
|
+
- from: "ocr_extractor"
|
|
464
488
|
to: "image_filter"
|
|
465
|
-
queue_size:
|
|
489
|
+
queue_size: 4
|
|
466
490
|
|
|
467
491
|
# Primitive Mutators
|
|
468
492
|
- from: "image_filter"
|
|
469
493
|
to: "image_dedup"
|
|
470
|
-
queue_size:
|
|
494
|
+
queue_size: 4
|
|
471
495
|
- from: "image_dedup"
|
|
472
496
|
to: "text_splitter"
|
|
473
|
-
queue_size:
|
|
497
|
+
queue_size: 4
|
|
474
498
|
|
|
475
499
|
# Primitive Transforms
|
|
476
500
|
- from: "text_splitter"
|
|
477
501
|
to: "image_caption"
|
|
478
|
-
queue_size:
|
|
502
|
+
queue_size: 4
|
|
479
503
|
- from: "image_caption"
|
|
480
504
|
to: "text_embedder"
|
|
481
|
-
queue_size:
|
|
505
|
+
queue_size: 4
|
|
482
506
|
- from: "text_embedder"
|
|
483
507
|
to: "image_storage"
|
|
484
|
-
queue_size:
|
|
508
|
+
queue_size: 4
|
|
485
509
|
|
|
486
510
|
# Primitive Storage
|
|
487
511
|
- from: "image_storage"
|
|
488
512
|
to: "embedding_storage"
|
|
489
|
-
queue_size:
|
|
513
|
+
queue_size: 4
|
|
490
514
|
- from: "embedding_storage"
|
|
491
515
|
to: "broker_response"
|
|
492
|
-
queue_size:
|
|
516
|
+
queue_size: 4
|
|
493
517
|
|
|
494
518
|
# Response and Telemetry
|
|
495
519
|
- from: "broker_response"
|
|
496
520
|
to: "otel_tracer"
|
|
497
|
-
queue_size:
|
|
521
|
+
queue_size: 4
|
|
498
522
|
- from: "otel_tracer"
|
|
499
523
|
to: "default_drain"
|
|
500
|
-
queue_size:
|
|
524
|
+
queue_size: 4
|
|
501
525
|
|
|
502
526
|
# Pipeline Runtime Configuration
|
|
503
|
-
# These parameters control dynamic scaling and PID controller behavior
|
|
504
|
-
# All values can be overridden by environment variables from env_config.py
|
|
505
527
|
pipeline:
|
|
506
|
-
disable_dynamic_scaling: $INGEST_DISABLE_DYNAMIC_SCALING|
|
|
528
|
+
disable_dynamic_scaling: $INGEST_DISABLE_DYNAMIC_SCALING|false
|
|
507
529
|
dynamic_memory_threshold: $INGEST_DYNAMIC_MEMORY_THRESHOLD|0.75
|
|
530
|
+
static_memory_threshold: $INGEST_STATIC_MEMORY_THRESHOLD|0.75
|
|
508
531
|
pid_controller:
|
|
509
532
|
kp: $INGEST_DYNAMIC_MEMORY_KP|0.2
|
|
510
533
|
ki: $INGEST_DYNAMIC_MEMORY_KI|0.01
|
|
@@ -513,5 +536,5 @@ pipeline:
|
|
|
513
536
|
penalty_factor: $INGEST_DYNAMIC_MEMORY_PENALTY_FACTOR|0.1
|
|
514
537
|
error_boost_factor: $INGEST_DYNAMIC_MEMORY_ERROR_BOOST_FACTOR|1.5
|
|
515
538
|
rcm_memory_safety_buffer_fraction: $INGEST_DYNAMIC_MEMORY_RCM_MEMORY_SAFETY_BUFFER_FRACTION|0.15
|
|
516
|
-
launch_simple_broker:
|
|
539
|
+
launch_simple_broker: $INGEST_LAUNCH_SIMPLE_BROKER|false
|
|
517
540
|
"""
|
{nv_ingest-2025.8.16.dev20250816.dist-info → nv_ingest-2025.11.21.dev20251121.dist-info}/METADATA
RENAMED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: nv-ingest
|
|
3
|
-
Version: 2025.
|
|
3
|
+
Version: 2025.11.21.dev20251121
|
|
4
4
|
Summary: Python module for multimodal document ingestion
|
|
5
5
|
Author-email: Jeremy Dyer <jdyer@nvidia.com>
|
|
6
6
|
License: Apache License
|
|
@@ -225,10 +225,11 @@ Requires-Dist: httpx>=0.28.1
|
|
|
225
225
|
Requires-Dist: isodate>=0.7.2
|
|
226
226
|
Requires-Dist: langdetect>=1.0.9
|
|
227
227
|
Requires-Dist: minio>=7.2.12
|
|
228
|
-
Requires-Dist:
|
|
228
|
+
Requires-Dist: librosa>=0.10.2
|
|
229
229
|
Requires-Dist: opentelemetry-api>=1.27.0
|
|
230
230
|
Requires-Dist: opentelemetry-exporter-otlp>=1.27.0
|
|
231
231
|
Requires-Dist: opentelemetry-sdk>=1.27.0
|
|
232
|
+
Requires-Dist: psutil>=7.1.0
|
|
232
233
|
Requires-Dist: pydantic>2.0.0
|
|
233
234
|
Requires-Dist: pydantic-settings>2.0.0
|
|
234
235
|
Requires-Dist: pypdfium2==4.30.0
|
|
@@ -240,7 +241,7 @@ Requires-Dist: python-docx>=1.1.2
|
|
|
240
241
|
Requires-Dist: python-dotenv>=1.0.1
|
|
241
242
|
Requires-Dist: python-pptx>=1.0.2
|
|
242
243
|
Requires-Dist: prometheus-client
|
|
243
|
-
Requires-Dist: ray[all]>=2.
|
|
244
|
+
Requires-Dist: ray[all]>=2.49.0
|
|
244
245
|
Requires-Dist: redis>=5.2.1
|
|
245
246
|
Requires-Dist: requests>=2.28.2
|
|
246
247
|
Requires-Dist: scikit-learn>=1.6.0
|
{nv_ingest-2025.8.16.dev20250816.dist-info → nv_ingest-2025.11.21.dev20251121.dist-info}/RECORD
RENAMED
|
@@ -1,73 +1,79 @@
|
|
|
1
1
|
nv_ingest/__init__.py,sha256=vJLPeuxiIHqbxXPJSu9qe3MS-GPavbOUExyRq83DxxM,895
|
|
2
2
|
nv_ingest/version.py,sha256=MG7DxlzpnoJI56vqxwzs9WeMAEI3uPhfDiNLs6GN6wI,986
|
|
3
|
-
nv_ingest/api/__init__.py,sha256=
|
|
4
|
-
nv_ingest/api/main.py,sha256=
|
|
3
|
+
nv_ingest/api/__init__.py,sha256=ED07QUqwVyJalH0ahhnnjvc2W_in6TpZZ5nJ6NWU9-Y,271
|
|
4
|
+
nv_ingest/api/main.py,sha256=uCCkUNLS1xE9TDYKDOdxEfo_9jQWumpQAPWrxj5m9Go,1706
|
|
5
|
+
nv_ingest/api/tracing.py,sha256=NkqMuUiB6ixGU5MYp3TrODsZDQepJ1kbH8JFHsYjuE0,2940
|
|
5
6
|
nv_ingest/api/v1/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
6
7
|
nv_ingest/api/v1/health.py,sha256=pV-RoVq5y0iBPp0qZoLzd1xKpd0JiHAi0UMyMj99LqU,4740
|
|
7
8
|
nv_ingest/api/v1/ingest.py,sha256=LWk3LN4lBd3uO8h30EN42g3LHCVcO00avVd5ohVK7NI,19392
|
|
8
9
|
nv_ingest/api/v1/metrics.py,sha256=ZGVRApYLnzc2f2C7wRgGd7deqiXan-jxfA-33a16clY,981
|
|
10
|
+
nv_ingest/api/v2/README.md,sha256=VhpdjEmCyr3qIOhwqISFx9C5WezJFcxYc-NB9S98HMg,7562
|
|
11
|
+
nv_ingest/api/v2/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
12
|
+
nv_ingest/api/v2/ingest.py,sha256=ikbZE2eAjSnFmt5CcpTduY1t9DsUQBhnBQlsd3HaBww,53103
|
|
9
13
|
nv_ingest/framework/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
10
14
|
nv_ingest/framework/orchestration/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
11
15
|
nv_ingest/framework/orchestration/execution/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
12
16
|
nv_ingest/framework/orchestration/execution/helpers.py,sha256=-F8SZh7ISWtzJz6X1O2LQ133t-17Jxi8lL-NHz4rwj0,2818
|
|
13
17
|
nv_ingest/framework/orchestration/execution/options.py,sha256=Ms1t4591EIv4ZrMRdhsCYPgLnMVXJosG3MURCbPXUoA,3983
|
|
14
18
|
nv_ingest/framework/orchestration/process/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
15
|
-
nv_ingest/framework/orchestration/process/dependent_services.py,sha256=
|
|
16
|
-
nv_ingest/framework/orchestration/process/execution.py,sha256=
|
|
17
|
-
nv_ingest/framework/orchestration/process/lifecycle.py,sha256=
|
|
18
|
-
nv_ingest/framework/orchestration/process/strategies.py,sha256=
|
|
19
|
+
nv_ingest/framework/orchestration/process/dependent_services.py,sha256=s0j_rsFtCKHFIuvOkBe9NEAkPNPhSYse_ApeHka8gyg,3032
|
|
20
|
+
nv_ingest/framework/orchestration/process/execution.py,sha256=P1kzpYV23e4QYrKw9Td1TCZK3CK1ENVqqnI_axRCqBk,19814
|
|
21
|
+
nv_ingest/framework/orchestration/process/lifecycle.py,sha256=L5NDwnzSMQPGjqJDC8jC75L1YqWey-dtK8N_HgBzb0E,8001
|
|
22
|
+
nv_ingest/framework/orchestration/process/strategies.py,sha256=Q1Q04PPseF775omeS0FoXfK187NiS_bbqTaaJRwzKn8,7972
|
|
23
|
+
nv_ingest/framework/orchestration/process/termination.py,sha256=PAogFeW0FATFS6Mcp_UkZgq_SbWV18RtdZN-0NbComw,5042
|
|
19
24
|
nv_ingest/framework/orchestration/ray/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
20
25
|
nv_ingest/framework/orchestration/ray/edges/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
21
26
|
nv_ingest/framework/orchestration/ray/edges/async_queue_edge.py,sha256=PQliU_kyGbO9o42njpb8FrDMLrbLqwZzmBNXifxyG5Y,2312
|
|
22
27
|
nv_ingest/framework/orchestration/ray/edges/ray_queue_edge.py,sha256=VFii2yxJuikimOxie3edKq5JN06g78AF8bdHSHVX8p8,2677
|
|
23
28
|
nv_ingest/framework/orchestration/ray/edges/threaded_queue_edge.py,sha256=N6NH4KgZJ60e_JkGRcSmfQtX37qtX4TMcavOR-n3heE,2549
|
|
24
29
|
nv_ingest/framework/orchestration/ray/examples/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
25
|
-
nv_ingest/framework/orchestration/ray/examples/pipeline_test_harness.py,sha256=
|
|
30
|
+
nv_ingest/framework/orchestration/ray/examples/pipeline_test_harness.py,sha256=Bn4rjkO14BwvvUNG_HBCSVXetYk7DKqRRsYHJADWqjc,16455
|
|
26
31
|
nv_ingest/framework/orchestration/ray/examples/task_source_harness.py,sha256=Yt7uxThg7s8WuMiaHLKC8r1XAG7QixegfkT-juE5oNw,1953
|
|
27
32
|
nv_ingest/framework/orchestration/ray/examples/task_source_sink_harness.py,sha256=XkvsoIzH5ftXvAZ4ox7mxbx7ESVx6D8Xupcwbqgd52w,3277
|
|
28
33
|
nv_ingest/framework/orchestration/ray/primitives/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
29
34
|
nv_ingest/framework/orchestration/ray/primitives/dataclasses.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
30
35
|
nv_ingest/framework/orchestration/ray/primitives/pipeline_monitor.py,sha256=L8ENPiF-lxqhIXVEQwQD5CCqQMb710ynj5D_Y4ixGhs,11077
|
|
31
36
|
nv_ingest/framework/orchestration/ray/primitives/pipeline_topology.py,sha256=yd2sb_q_FbBLDWiYgdKRhpPVAIl26Wg8w3yelZ7c5zQ,15741
|
|
32
|
-
nv_ingest/framework/orchestration/ray/primitives/ray_pipeline.py,sha256=
|
|
37
|
+
nv_ingest/framework/orchestration/ray/primitives/ray_pipeline.py,sha256=t9lf6zTjl_P5pe8mW-5F5pbZoC5mlcvEn2RCaLn_3Tk,66521
|
|
33
38
|
nv_ingest/framework/orchestration/ray/primitives/ray_stat_collector.py,sha256=GGY6_i6_g5xTFzdo9Qmsu9i4knMTq6pJfgm-aaPEt_o,17226
|
|
34
39
|
nv_ingest/framework/orchestration/ray/stages/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
35
40
|
nv_ingest/framework/orchestration/ray/stages/extractors/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
36
|
-
nv_ingest/framework/orchestration/ray/stages/extractors/audio_extractor.py,sha256=
|
|
37
|
-
nv_ingest/framework/orchestration/ray/stages/extractors/chart_extractor.py,sha256=
|
|
38
|
-
nv_ingest/framework/orchestration/ray/stages/extractors/docx_extractor.py,sha256=
|
|
39
|
-
nv_ingest/framework/orchestration/ray/stages/extractors/html_extractor.py,sha256=
|
|
40
|
-
nv_ingest/framework/orchestration/ray/stages/extractors/image_extractor.py,sha256=
|
|
41
|
+
nv_ingest/framework/orchestration/ray/stages/extractors/audio_extractor.py,sha256=UVp_kDmkaBlfO0Mbl_IxKq6imzLvs4-DKHgUHJIh3mo,3629
|
|
42
|
+
nv_ingest/framework/orchestration/ray/stages/extractors/chart_extractor.py,sha256=rfaDx6PqRCguhSYkJI6iVmMMtAlJNxzKfUrLmw_fKqs,4381
|
|
43
|
+
nv_ingest/framework/orchestration/ray/stages/extractors/docx_extractor.py,sha256=R4vshPcAUN2U6BIv8BCZQ862wLx8RJhCGXfpQ3K09Bs,3627
|
|
44
|
+
nv_ingest/framework/orchestration/ray/stages/extractors/html_extractor.py,sha256=7JrZSVIrK4_wr2s7TOTss7pgTY2F9GPQ7Ze3F_WFlKU,3642
|
|
45
|
+
nv_ingest/framework/orchestration/ray/stages/extractors/image_extractor.py,sha256=iY9fEfucfgCmO2ixX6qwn418J97nJz_FQGh7B6yziVo,3980
|
|
41
46
|
nv_ingest/framework/orchestration/ray/stages/extractors/infographic_extractor.py,sha256=v5J7dnJBEaDfjoTz_N_yC3RAt6lwMLgLT28V-ahquLE,3261
|
|
42
|
-
nv_ingest/framework/orchestration/ray/stages/extractors/
|
|
47
|
+
nv_ingest/framework/orchestration/ray/stages/extractors/ocr_extractor.py,sha256=pwVoA5-CF9GVWusoFZOMGBvSyW5udD9bdxVJXA_SghE,3188
|
|
48
|
+
nv_ingest/framework/orchestration/ray/stages/extractors/pdf_extractor.py,sha256=QagIA99AsHLihjRbXm-2BphdoQGHwzOHlqLyz7oDOSk,4992
|
|
43
49
|
nv_ingest/framework/orchestration/ray/stages/extractors/pptx_extractor.py,sha256=RMbbl7Cuj4BT-TcgUx_0k8R-DLdw-o3fHxcIBIgrWt4,3776
|
|
44
|
-
nv_ingest/framework/orchestration/ray/stages/extractors/table_extractor.py,sha256=
|
|
50
|
+
nv_ingest/framework/orchestration/ray/stages/extractors/table_extractor.py,sha256=p71ktv6v5T-9npYpCbgbwW6-fS-65UWS7rCm8OWr2Bc,4170
|
|
45
51
|
nv_ingest/framework/orchestration/ray/stages/injectors/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
46
|
-
nv_ingest/framework/orchestration/ray/stages/injectors/metadata_injector.py,sha256=
|
|
52
|
+
nv_ingest/framework/orchestration/ray/stages/injectors/metadata_injector.py,sha256=gTPRFOoUGcwNrmPeqv4n5VmU-LBkha9QTYHO0ntiaIk,7116
|
|
47
53
|
nv_ingest/framework/orchestration/ray/stages/meta/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
48
54
|
nv_ingest/framework/orchestration/ray/stages/meta/ray_actor_edge_base.py,sha256=LnVqBJmpfCmcI-eJLbkwK-7SS-hpEp98P4iCRv_Zhb0,1726
|
|
49
55
|
nv_ingest/framework/orchestration/ray/stages/meta/ray_actor_sink_stage_base.py,sha256=HQJXIuU7VjiQ6fQjHjbNNmIJX5f30cXFB0CJGixgwVo,3633
|
|
50
56
|
nv_ingest/framework/orchestration/ray/stages/meta/ray_actor_source_stage_base.py,sha256=hP25MLTP2bOEEncrYdxPPqeRyRVbij8aEurR1F1ZmhE,1811
|
|
51
57
|
nv_ingest/framework/orchestration/ray/stages/meta/ray_actor_stage_base.py,sha256=qiB_ZU5_3bXgvE9C2rvnXIS0Alm6M5PWLCeQm8ZxOy4,29812
|
|
52
58
|
nv_ingest/framework/orchestration/ray/stages/mutate/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
53
|
-
nv_ingest/framework/orchestration/ray/stages/mutate/image_dedup.py,sha256=
|
|
54
|
-
nv_ingest/framework/orchestration/ray/stages/mutate/image_filter.py,sha256
|
|
59
|
+
nv_ingest/framework/orchestration/ray/stages/mutate/image_dedup.py,sha256=cPLG3ZEqhZkRiSsbL7cbF1zsvOAimd8K5O-qadUR9Mg,3709
|
|
60
|
+
nv_ingest/framework/orchestration/ray/stages/mutate/image_filter.py,sha256=f1CS8x9uifY1FJ_1lUF0fNNMExvM4zBIF012gxnSpqU,3523
|
|
55
61
|
nv_ingest/framework/orchestration/ray/stages/sinks/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
56
62
|
nv_ingest/framework/orchestration/ray/stages/sinks/default_drain.py,sha256=_USW1Vq8G2Wn-QFdPfFQCrtKG46hHeJvkEGbBxdpbVM,1488
|
|
57
63
|
nv_ingest/framework/orchestration/ray/stages/sinks/message_broker_task_sink.py,sha256=QcvMQXIJ7EWIxty76Mo5Xv38Oj6X2KuS8qXQlf7E1uA,11676
|
|
58
64
|
nv_ingest/framework/orchestration/ray/stages/sources/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
59
|
-
nv_ingest/framework/orchestration/ray/stages/sources/message_broker_task_source.py,sha256=
|
|
65
|
+
nv_ingest/framework/orchestration/ray/stages/sources/message_broker_task_source.py,sha256=LrqaWpWyuiAHlpXWKYSyHZJBFegGXfNlpCXrucbK5NM,24067
|
|
60
66
|
nv_ingest/framework/orchestration/ray/stages/storage/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
61
67
|
nv_ingest/framework/orchestration/ray/stages/storage/image_storage.py,sha256=WZN_-3Li-izDaPtk8IMrtn2os1ckT3U8Rb2PsfOWrcI,4009
|
|
62
|
-
nv_ingest/framework/orchestration/ray/stages/storage/store_embeddings.py,sha256=
|
|
68
|
+
nv_ingest/framework/orchestration/ray/stages/storage/store_embeddings.py,sha256=EUtwhSDf-qGLVEhWEInr1VaLsvpcHUSyzCmHQVai-Ps,3547
|
|
63
69
|
nv_ingest/framework/orchestration/ray/stages/telemetry/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
64
70
|
nv_ingest/framework/orchestration/ray/stages/telemetry/job_counter.py,sha256=jEtEUibqs6IS6QakrzWY9zmxSUzuBpg_hzXy2R-I10Y,2870
|
|
65
71
|
nv_ingest/framework/orchestration/ray/stages/telemetry/otel_meter.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
66
72
|
nv_ingest/framework/orchestration/ray/stages/telemetry/otel_tracer.py,sha256=GqFwRpTlIu2qgb08B3OqVIKUG8QQAwSOHhjvnyL_9UE,8553
|
|
67
73
|
nv_ingest/framework/orchestration/ray/stages/transforms/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
68
|
-
nv_ingest/framework/orchestration/ray/stages/transforms/image_caption.py,sha256=
|
|
69
|
-
nv_ingest/framework/orchestration/ray/stages/transforms/text_embed.py,sha256=
|
|
70
|
-
nv_ingest/framework/orchestration/ray/stages/transforms/text_splitter.py,sha256=
|
|
74
|
+
nv_ingest/framework/orchestration/ray/stages/transforms/image_caption.py,sha256=GYF41y_teXMIzB24JQXuesVmvksmgNvTGYU3uU4TzbM,3742
|
|
75
|
+
nv_ingest/framework/orchestration/ray/stages/transforms/text_embed.py,sha256=o6QPd3GCPxbAvQFeb1oByOP5LII-FVkKbmAkBjCioB0,3435
|
|
76
|
+
nv_ingest/framework/orchestration/ray/stages/transforms/text_splitter.py,sha256=FAScWaZijrJHc5F5jgulHP_cdX2telS4pq3spwliFXw,4963
|
|
71
77
|
nv_ingest/framework/orchestration/ray/stages/utility/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
72
78
|
nv_ingest/framework/orchestration/ray/stages/utility/throughput_monitor.py,sha256=J7Qs745rt7cQlR3L2K9U6Mb_BDKUNpl_xoqCZMEPlks,2674
|
|
73
79
|
nv_ingest/framework/orchestration/ray/util/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
@@ -98,21 +104,22 @@ nv_ingest/framework/util/flow_control/udf_intercept.py,sha256=zQ9uuCcHLEd0P52Eiw
|
|
|
98
104
|
nv_ingest/framework/util/service/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
99
105
|
nv_ingest/framework/util/service/impl/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
100
106
|
nv_ingest/framework/util/service/impl/ingest/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
101
|
-
nv_ingest/framework/util/service/impl/ingest/redis_ingest_service.py,sha256=
|
|
107
|
+
nv_ingest/framework/util/service/impl/ingest/redis_ingest_service.py,sha256=59P-BMWnFY37GJm5w23-TMxgLhiZGZpJogC0gjDBaTA,23835
|
|
102
108
|
nv_ingest/framework/util/service/meta/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
103
109
|
nv_ingest/framework/util/service/meta/ingest/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
104
110
|
nv_ingest/framework/util/service/meta/ingest/ingest_service_meta.py,sha256=QS3uNxWBl5dIcmIpJKNe8_TLcTUuN2vcKyHeAwa-eSo,1589
|
|
105
111
|
nv_ingest/framework/util/telemetry/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
106
112
|
nv_ingest/framework/util/telemetry/global_stats.py,sha256=nq65pEEdiwjAfGiqsxG1CeQMC96O3CfQxsZuGFCY-ds,4554
|
|
107
113
|
nv_ingest/pipeline/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
108
|
-
nv_ingest/pipeline/
|
|
114
|
+
nv_ingest/pipeline/default_libmode_pipeline_impl.py,sha256=yNJtjfHQyxtasGa1hQrvgX7UrPa7BAd0oog8EIN8Y_w,15592
|
|
115
|
+
nv_ingest/pipeline/default_pipeline_impl.py,sha256=DhClC17lWUvtBIi2mCC4WkLWT0lxY-CFY0n6nriAxas,16017
|
|
109
116
|
nv_ingest/pipeline/ingest_pipeline.py,sha256=wHAJhqAM2s8nbY-8itVogmSU-yVN4PZONGWcKnhzgfg,17794
|
|
110
117
|
nv_ingest/pipeline/pipeline_schema.py,sha256=rLZZz2It2o2hVNWrZUJU8CarrqRei1fho3ZEMkkoBcg,17940
|
|
111
118
|
nv_ingest/pipeline/config/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
|
|
112
|
-
nv_ingest/pipeline/config/loaders.py,sha256=
|
|
119
|
+
nv_ingest/pipeline/config/loaders.py,sha256=75Yr9WYO7j7ghvKTnYLfZXQZEH3J3VEZo5J4TunC_Us,7590
|
|
113
120
|
nv_ingest/pipeline/config/replica_resolver.py,sha256=3zjh8gmepEYORFZRM4inq7GoBW0YL3gzUDiixUugjzQ,8899
|
|
114
|
-
nv_ingest-2025.
|
|
115
|
-
nv_ingest-2025.
|
|
116
|
-
nv_ingest-2025.
|
|
117
|
-
nv_ingest-2025.
|
|
118
|
-
nv_ingest-2025.
|
|
121
|
+
nv_ingest-2025.11.21.dev20251121.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
|
122
|
+
nv_ingest-2025.11.21.dev20251121.dist-info/METADATA,sha256=tY61Ze6cR62q-06kGMCBpCaRpqeY5IdmxfAKPie_Qjc,15092
|
|
123
|
+
nv_ingest-2025.11.21.dev20251121.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
124
|
+
nv_ingest-2025.11.21.dev20251121.dist-info/top_level.txt,sha256=sjb0ajIsgn3YgftSjZHlYO0HjYAIIhNuXG_AmywCvaU,10
|
|
125
|
+
nv_ingest-2025.11.21.dev20251121.dist-info/RECORD,,
|
{nv_ingest-2025.8.16.dev20250816.dist-info → nv_ingest-2025.11.21.dev20251121.dist-info}/WHEEL
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|