nv-ingest 2025.8.20.dev20250820__py3-none-any.whl → 2025.8.22.dev20250822__py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of nv-ingest might be problematic. Click here for more details.

Files changed (20)
  1. nv_ingest/framework/orchestration/ray/stages/extractors/audio_extractor.py +2 -1
  2. nv_ingest/framework/orchestration/ray/stages/extractors/chart_extractor.py +5 -2
  3. nv_ingest/framework/orchestration/ray/stages/extractors/docx_extractor.py +2 -1
  4. nv_ingest/framework/orchestration/ray/stages/extractors/html_extractor.py +2 -1
  5. nv_ingest/framework/orchestration/ray/stages/extractors/image_extractor.py +2 -1
  6. nv_ingest/framework/orchestration/ray/stages/extractors/pdf_extractor.py +5 -2
  7. nv_ingest/framework/orchestration/ray/stages/extractors/table_extractor.py +2 -1
  8. nv_ingest/framework/orchestration/ray/stages/injectors/metadata_injector.py +2 -1
  9. nv_ingest/framework/orchestration/ray/stages/mutate/image_dedup.py +2 -1
  10. nv_ingest/framework/orchestration/ray/stages/mutate/image_filter.py +2 -1
  11. nv_ingest/framework/orchestration/ray/stages/sources/message_broker_task_source.py +5 -1
  12. nv_ingest/framework/orchestration/ray/stages/storage/store_embeddings.py +2 -1
  13. nv_ingest/framework/orchestration/ray/stages/transforms/image_caption.py +5 -1
  14. nv_ingest/framework/orchestration/ray/stages/transforms/text_embed.py +5 -1
  15. nv_ingest/framework/orchestration/ray/stages/transforms/text_splitter.py +4 -3
  16. {nv_ingest-2025.8.20.dev20250820.dist-info → nv_ingest-2025.8.22.dev20250822.dist-info}/METADATA +1 -1
  17. {nv_ingest-2025.8.20.dev20250820.dist-info → nv_ingest-2025.8.22.dev20250822.dist-info}/RECORD +20 -20
  18. {nv_ingest-2025.8.20.dev20250820.dist-info → nv_ingest-2025.8.22.dev20250822.dist-info}/WHEEL +0 -0
  19. {nv_ingest-2025.8.20.dev20250820.dist-info → nv_ingest-2025.8.22.dev20250822.dist-info}/licenses/LICENSE +0 -0
  20. {nv_ingest-2025.8.20.dev20250820.dist-info → nv_ingest-2025.8.22.dev20250822.dist-info}/top_level.txt +0 -0
@@ -17,6 +17,7 @@ from nv_ingest_api.internal.schemas.extract.extract_audio_schema import AudioExt
17
17
  from nv_ingest_api.util.exception_handlers.decorators import (
18
18
  nv_ingest_node_failure_try_except,
19
19
  )
20
+ from nv_ingest_api.util.logging.sanitize import sanitize_for_logging
20
21
 
21
22
  from nv_ingest.framework.util.flow_control.udf_intercept import udf_intercept_hook
22
23
 
@@ -69,7 +70,7 @@ class AudioExtractorStage(RayActorStage):
69
70
 
70
71
  # Remove the "audio_data_extract" task from the message to obtain task-specific configuration.
71
72
  task_config = remove_task_by_type(control_message, "extract")
72
- self._logger.debug("Extracted task config: %s", task_config)
73
+ self._logger.debug("Extracted task config: %s", sanitize_for_logging(task_config))
73
74
 
74
75
  # Perform audio text extraction.
75
76
  new_df, extraction_info = extract_text_from_audio_internal(
@@ -13,8 +13,11 @@ from nv_ingest.framework.util.flow_control import filter_by_task
13
13
  from nv_ingest.framework.util.flow_control.udf_intercept import udf_intercept_hook
14
14
  from nv_ingest_api.internal.primitives.tracing.tagging import traceable
15
15
  from nv_ingest_api.internal.schemas.extract.extract_chart_schema import ChartExtractorSchema
16
- from nv_ingest_api.util.exception_handlers.decorators import nv_ingest_node_failure_try_except
17
16
  from nv_ingest.framework.orchestration.ray.stages.meta.ray_actor_stage_base import RayActorStage
17
+ from nv_ingest_api.util.exception_handlers.decorators import (
18
+ nv_ingest_node_failure_try_except,
19
+ )
20
+ from nv_ingest_api.util.logging.sanitize import sanitize_for_logging
18
21
 
19
22
  logger = logging.getLogger(__name__)
20
23
 
@@ -66,7 +69,7 @@ class ChartExtractorStage(RayActorStage):
66
69
 
67
70
  # Remove the "chart_data_extract" task to obtain task-specific configuration.
68
71
  task_config = remove_task_by_type(control_message, "chart_data_extract")
69
- logger.debug("ChartExtractorStage: Task config extracted: %s", task_config)
72
+ logger.debug("ChartExtractorStage: Task config extracted: %s", sanitize_for_logging(task_config))
70
73
 
71
74
  # Perform chart data extraction.
72
75
  execution_trace_log = {}
@@ -16,6 +16,7 @@ from nv_ingest_api.internal.schemas.extract.extract_docx_schema import DocxExtra
16
16
  from nv_ingest_api.util.exception_handlers.decorators import (
17
17
  nv_ingest_node_failure_try_except,
18
18
  )
19
+ from nv_ingest_api.util.logging.sanitize import sanitize_for_logging
19
20
 
20
21
  from nv_ingest.framework.util.flow_control.udf_intercept import udf_intercept_hook
21
22
 
@@ -68,7 +69,7 @@ class DocxExtractorStage(RayActorStage):
68
69
 
69
70
  # Remove the "docx-extract" task from the message to obtain task-specific configuration.
70
71
  task_config = remove_task_by_type(control_message, "extract")
71
- self._logger.debug("Extracted task config: %s", task_config)
72
+ self._logger.debug("Extracted task config: %s", sanitize_for_logging(task_config))
72
73
 
73
74
  # Perform DOCX content extraction.
74
75
  new_df, extraction_info = extract_primitives_from_docx_internal(
@@ -17,6 +17,7 @@ from nv_ingest_api.internal.schemas.extract.extract_html_schema import HtmlExtra
17
17
  from nv_ingest_api.util.exception_handlers.decorators import (
18
18
  nv_ingest_node_failure_try_except,
19
19
  )
20
+ from nv_ingest_api.util.logging.sanitize import sanitize_for_logging
20
21
 
21
22
  from nv_ingest.framework.util.flow_control.udf_intercept import udf_intercept_hook
22
23
 
@@ -69,7 +70,7 @@ class HtmlExtractorStage(RayActorStage):
69
70
 
70
71
  # Remove the "html_content_extract" task from the message to obtain task-specific configuration.
71
72
  task_config = remove_task_by_type(control_message, "extract")
72
- self._logger.debug("Extracted task config: %s", task_config)
73
+ self._logger.debug("Extracted task config: %s", sanitize_for_logging(task_config))
73
74
 
74
75
  # Perform html content extraction.
75
76
  new_df, extraction_info = extract_markdown_from_html_internal(
@@ -16,6 +16,7 @@ from nv_ingest_api.internal.schemas.extract.extract_image_schema import ImageExt
16
16
  from nv_ingest_api.util.exception_handlers.decorators import (
17
17
  nv_ingest_node_failure_try_except,
18
18
  )
19
+ from nv_ingest_api.util.logging.sanitize import sanitize_for_logging
19
20
 
20
21
  from nv_ingest.framework.util.flow_control.udf_intercept import udf_intercept_hook
21
22
 
@@ -68,7 +69,7 @@ class ImageExtractorStage(RayActorStage):
68
69
 
69
70
  # Remove the "extract" task from the message to obtain task-specific configuration.
70
71
  task_config = remove_task_by_type(control_message, "extract")
71
- logger.debug("Extracted task config: %s", task_config)
72
+ logger.debug("Extracted task config: %s", sanitize_for_logging(task_config))
72
73
 
73
74
  # Perform image primitives extraction.
74
75
  new_df, extraction_info = extract_primitives_from_image_internal(
@@ -15,7 +15,10 @@ from nv_ingest_api.internal.primitives.tracing.tagging import set_trace_timestam
15
15
  from nv_ingest.framework.orchestration.ray.stages.meta.ray_actor_stage_base import RayActorStage
16
16
  from nv_ingest.framework.util.flow_control import filter_by_task
17
17
  from nv_ingest.framework.util.flow_control.udf_intercept import udf_intercept_hook
18
- from nv_ingest_api.util.exception_handlers.decorators import nv_ingest_node_failure_try_except
18
+ from nv_ingest_api.util.exception_handlers.decorators import (
19
+ nv_ingest_node_failure_try_except,
20
+ )
21
+ from nv_ingest_api.util.logging.sanitize import sanitize_for_logging
19
22
 
20
23
  logger = logging.getLogger(__name__)
21
24
 
@@ -87,7 +90,7 @@ class PDFExtractorStage(RayActorStage):
87
90
 
88
91
  # Remove the "extract" task from the message to obtain task-specific configuration.
89
92
  task_config = remove_task_by_type(control_message, "extract")
90
- logger.debug("Extracted task config: %s", task_config)
93
+ logger.debug("Extracted task config: %s", sanitize_for_logging(task_config))
91
94
 
92
95
  # Perform PDF extraction.
93
96
  execution_trace_log = {}
@@ -16,6 +16,7 @@ from nv_ingest_api.internal.schemas.extract.extract_table_schema import TableExt
16
16
  from nv_ingest_api.util.exception_handlers.decorators import (
17
17
  nv_ingest_node_failure_try_except,
18
18
  )
19
+ from nv_ingest_api.util.logging.sanitize import sanitize_for_logging
19
20
 
20
21
  logger = logging.getLogger(__name__)
21
22
 
@@ -65,7 +66,7 @@ class TableExtractorStage(RayActorStage):
65
66
 
66
67
  # Remove the "table_data_extract" task to obtain task-specific configuration.
67
68
  task_config = remove_task_by_type(control_message, "table_data_extract")
68
- logger.debug("Extracted task configuration: %s", task_config)
69
+ logger.debug("Extracted task configuration: %s", sanitize_for_logging(task_config))
69
70
 
70
71
  # Perform table data extraction.
71
72
  execution_trace_log = {}
@@ -25,6 +25,7 @@ from nv_ingest_api.util.exception_handlers.decorators import (
25
25
  nv_ingest_node_failure_try_except,
26
26
  )
27
27
  from nv_ingest.framework.util.flow_control.udf_intercept import udf_intercept_hook
28
+ from nv_ingest_api.util.logging.sanitize import sanitize_for_logging
28
29
 
29
30
  logger = logging.getLogger(__name__)
30
31
 
@@ -42,7 +43,7 @@ class MetadataInjectionStage(RayActorStage):
42
43
  # Call the base initializer to set attributes like self._running.
43
44
  super().__init__(config, stage_name=stage_name)
44
45
  # Additional initialization can be added here if necessary.
45
- self._logger.debug("MetadataInjectionStage initialized with config: %s", config)
46
+ self._logger.debug("MetadataInjectionStage initialized with config: %s", sanitize_for_logging(config))
46
47
 
47
48
  @nv_ingest_node_failure_try_except()
48
49
  @traceable()
@@ -18,6 +18,7 @@ from nv_ingest_api.internal.schemas.mutate.mutate_image_dedup_schema import Imag
18
18
  from nv_ingest_api.util.exception_handlers.decorators import (
19
19
  nv_ingest_node_failure_try_except,
20
20
  )
21
+ from nv_ingest_api.util.logging.sanitize import sanitize_for_logging
21
22
 
22
23
  logger = logging.getLogger(__name__)
23
24
 
@@ -68,7 +69,7 @@ class ImageDedupStage(RayActorStage):
68
69
 
69
70
  # Remove the "dedup" task from the message to obtain task-specific configuration.
70
71
  task_config = remove_task_by_type(control_message, "dedup")
71
- logger.debug("Extracted task config: %s", task_config)
72
+ logger.debug("Extracted task config: %s", sanitize_for_logging(task_config))
72
73
 
73
74
  # Perform image deduplication.
74
75
  new_df = deduplicate_images_internal(
@@ -17,6 +17,7 @@ from nv_ingest_api.internal.schemas.transform.transform_image_filter_schema impo
17
17
  from nv_ingest_api.util.exception_handlers.decorators import (
18
18
  nv_ingest_node_failure_try_except,
19
19
  )
20
+ from nv_ingest_api.util.logging.sanitize import sanitize_for_logging
20
21
 
21
22
  logger = logging.getLogger(__name__)
22
23
 
@@ -67,7 +68,7 @@ class ImageFilterStage(RayActorStage):
67
68
 
68
69
  # Remove the "filter" task from the message to obtain task-specific configuration.
69
70
  task_config = remove_task_by_type(control_message, "filter")
70
- logger.debug("Extracted task config: %s", task_config)
71
+ logger.debug("Extracted task config: %s", sanitize_for_logging(task_config))
71
72
 
72
73
  task_params: Dict[str, Any] = task_config.get("params", {})
73
74
 
@@ -29,6 +29,7 @@ from nv_ingest_api.internal.schemas.meta.ingest_job_schema import validate_inges
29
29
  # Import clients
30
30
  from nv_ingest_api.util.message_brokers.simple_message_broker.simple_client import SimpleClient
31
31
  from nv_ingest_api.util.service_clients.redis.redis_client import RedisClient
32
+ from nv_ingest_api.util.logging.sanitize import sanitize_for_logging
32
33
 
33
34
  logger = logging.getLogger(__name__)
34
35
 
@@ -104,8 +105,11 @@ class MessageBrokerTaskSourceStage(RayActorSourceStage):
104
105
  def __init__(self, config: MessageBrokerTaskSourceConfig, stage_name: Optional[str] = None) -> None:
105
106
  super().__init__(config, log_to_stdout=False, stage_name=stage_name)
106
107
  self.config: MessageBrokerTaskSourceConfig # Add a type hint for self.config
108
+
109
+ # Sanitize config before logging to avoid leaking secrets
110
+ _sanitized = sanitize_for_logging(config)
107
111
  self._logger.debug(
108
- "Initializing MessageBrokerTaskSourceStage with config: %s", config.model_dump()
112
+ "Initializing MessageBrokerTaskSourceStage with config: %s", _sanitized
109
113
  ) # Log validated config
110
114
 
111
115
  # Access validated configuration directly via self.config
@@ -16,6 +16,7 @@ from nv_ingest_api.internal.store.embed_text_upload import store_text_embeddings
16
16
  from nv_ingest_api.util.exception_handlers.decorators import (
17
17
  nv_ingest_node_failure_try_except,
18
18
  )
19
+ from nv_ingest_api.util.logging.sanitize import sanitize_for_logging
19
20
 
20
21
  from nv_ingest.framework.util.flow_control.udf_intercept import udf_intercept_hook
21
22
 
@@ -68,7 +69,7 @@ class EmbeddingStorageStage(RayActorStage):
68
69
 
69
70
  # Remove the "store_embedding" task from the message to obtain task-specific configuration.
70
71
  task_config = remove_task_by_type(control_message, "store_embedding")
71
- logger.debug("Extracted task config: %s", task_config)
72
+ logger.debug("Extracted task config: %s", sanitize_for_logging(task_config))
72
73
 
73
74
  # Perform embedding storage.
74
75
  new_df = store_text_embeddings_internal(
@@ -18,6 +18,7 @@ from nv_ingest_api.internal.transform.caption_image import transform_image_creat
18
18
  from nv_ingest_api.util.exception_handlers.decorators import (
19
19
  nv_ingest_node_failure_try_except,
20
20
  )
21
+ from nv_ingest_api.util.logging.sanitize import sanitize_for_logging
21
22
 
22
23
  logger = logging.getLogger(__name__)
23
24
 
@@ -67,7 +68,10 @@ class ImageCaptionTransformStage(RayActorStage):
67
68
 
68
69
  # Remove the "caption" task to obtain task-specific configuration.
69
70
  task_config = remove_task_by_type(control_message, "caption")
70
- logger.debug("ImageCaptionTransformStage: Task configuration extracted: %s", pprint.pformat(task_config))
71
+ logger.debug(
72
+ "ImageCaptionTransformStage: Task configuration extracted: %s",
73
+ pprint.pformat(sanitize_for_logging(task_config)),
74
+ )
71
75
 
72
76
  # Call the caption extraction function.
73
77
  new_df = transform_image_create_vlm_caption_internal(
@@ -15,6 +15,7 @@ from nv_ingest_api.internal.transform.embed_text import transform_create_text_em
15
15
  from nv_ingest_api.util.exception_handlers.decorators import (
16
16
  nv_ingest_node_failure_try_except,
17
17
  )
18
+ from nv_ingest_api.util.logging.sanitize import sanitize_for_logging
18
19
 
19
20
  from nv_ingest.framework.util.flow_control.udf_intercept import udf_intercept_hook
20
21
 
@@ -62,7 +63,10 @@ class TextEmbeddingTransformStage(RayActorStage):
62
63
 
63
64
  # Remove the "embed" task to obtain task-specific configuration.
64
65
  task_config = remove_task_by_type(control_message, "embed")
65
- self._logger.debug("TextEmbeddingTransformStage: Task configuration extracted: %s", pprint.pformat(task_config))
66
+ self._logger.debug(
67
+ "TextEmbeddingTransformStage: Task configuration extracted: %s",
68
+ pprint.pformat(sanitize_for_logging(task_config)),
69
+ )
66
70
 
67
71
  # Call the text embedding extraction function.
68
72
  new_df, execution_trace_log = transform_create_text_embeddings_internal(
@@ -16,6 +16,7 @@ from nv_ingest_api.internal.transform.split_text import transform_text_split_and
16
16
  from nv_ingest_api.util.exception_handlers.decorators import (
17
17
  nv_ingest_node_failure_try_except,
18
18
  )
19
+ from nv_ingest_api.util.logging.sanitize import sanitize_for_logging
19
20
 
20
21
  from nv_ingest.framework.util.flow_control.udf_intercept import udf_intercept_hook
21
22
 
@@ -36,7 +37,7 @@ class TextSplitterStage(RayActorStage):
36
37
  super().__init__(config, stage_name=stage_name)
37
38
  # Store the validated configuration (assumed to be an instance of TextSplitterSchema)
38
39
  self.validated_config: TextSplitterSchema = config
39
- logger.debug("TextSplitterStage initialized with config: %s", config)
40
+ logger.info("TextSplitterStage initialized with config: %s", sanitize_for_logging(config))
40
41
 
41
42
  @nv_ingest_node_failure_try_except()
42
43
  @traceable()
@@ -63,7 +64,7 @@ class TextSplitterStage(RayActorStage):
63
64
 
64
65
  # Remove the "split" task to obtain task-specific configuration.
65
66
  task_config = remove_task_by_type(message, "split")
66
- logger.debug("Extracted task config: %s", task_config)
67
+ logger.debug("Extracted task config: %s", sanitize_for_logging(task_config))
67
68
 
68
69
  # Transform the DataFrame (split text and tokenize).
69
70
  df_updated = transform_text_split_and_tokenize_internal(
@@ -107,7 +108,7 @@ def text_splitter_fn(control_message: IngestControlMessage, stage_config: TextSp
107
108
 
108
109
  # Remove the "split" task to obtain task-specific configuration.
109
110
  task_config = remove_task_by_type(control_message, "split")
110
- logger.debug("Extracted task config: %s", task_config)
111
+ logger.debug("Extracted task config: %s", sanitize_for_logging(task_config))
111
112
 
112
113
  # Transform the DataFrame (split text and tokenize).
113
114
  df_updated = transform_text_split_and_tokenize_internal(
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: nv-ingest
3
- Version: 2025.8.20.dev20250820
3
+ Version: 2025.8.22.dev20250822
4
4
  Summary: Python module for multimodal document ingestion
5
5
  Author-email: Jeremy Dyer <jdyer@nvidia.com>
6
6
  License: Apache License
@@ -34,41 +34,41 @@ nv_ingest/framework/orchestration/ray/primitives/ray_pipeline.py,sha256=t9lf6zTj
34
34
  nv_ingest/framework/orchestration/ray/primitives/ray_stat_collector.py,sha256=GGY6_i6_g5xTFzdo9Qmsu9i4knMTq6pJfgm-aaPEt_o,17226
35
35
  nv_ingest/framework/orchestration/ray/stages/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
36
36
  nv_ingest/framework/orchestration/ray/stages/extractors/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
37
- nv_ingest/framework/orchestration/ray/stages/extractors/audio_extractor.py,sha256=MdJA79_XECTmvksmxRZiIj5cZ46HzvIYOFNi5-S9o1k,3540
38
- nv_ingest/framework/orchestration/ray/stages/extractors/chart_extractor.py,sha256=D_clXtJe63CkeOcqor6C-X3Gbny7rNlp8PRMp9sRuPw,4281
39
- nv_ingest/framework/orchestration/ray/stages/extractors/docx_extractor.py,sha256=8DQOivEfvptUY7x7I6NsdJMTkiLdq2e_xPpPl3_bLJY,3536
40
- nv_ingest/framework/orchestration/ray/stages/extractors/html_extractor.py,sha256=fp0nzRQ21PmIInxtXjTYhOiYytmgBypDlY0e-WHCmGA,3551
41
- nv_ingest/framework/orchestration/ray/stages/extractors/image_extractor.py,sha256=CMIfHLCE4DUIedTxedZWWJKWlrLbWZzsuEE3j_ix_nY,3889
37
+ nv_ingest/framework/orchestration/ray/stages/extractors/audio_extractor.py,sha256=4SdgvzI9oJ_OK5oWGir9wXVIPV4Pont2EKv9mwcWMC0,3631
38
+ nv_ingest/framework/orchestration/ray/stages/extractors/chart_extractor.py,sha256=rfaDx6PqRCguhSYkJI6iVmMMtAlJNxzKfUrLmw_fKqs,4381
39
+ nv_ingest/framework/orchestration/ray/stages/extractors/docx_extractor.py,sha256=R4vshPcAUN2U6BIv8BCZQ862wLx8RJhCGXfpQ3K09Bs,3627
40
+ nv_ingest/framework/orchestration/ray/stages/extractors/html_extractor.py,sha256=7JrZSVIrK4_wr2s7TOTss7pgTY2F9GPQ7Ze3F_WFlKU,3642
41
+ nv_ingest/framework/orchestration/ray/stages/extractors/image_extractor.py,sha256=iY9fEfucfgCmO2ixX6qwn418J97nJz_FQGh7B6yziVo,3980
42
42
  nv_ingest/framework/orchestration/ray/stages/extractors/infographic_extractor.py,sha256=v5J7dnJBEaDfjoTz_N_yC3RAt6lwMLgLT28V-ahquLE,3261
43
- nv_ingest/framework/orchestration/ray/stages/extractors/pdf_extractor.py,sha256=5gpbf2gJiUmL0-XR6nxWih3E0_FqkMRDaLdgP_MQs-c,4892
43
+ nv_ingest/framework/orchestration/ray/stages/extractors/pdf_extractor.py,sha256=QagIA99AsHLihjRbXm-2BphdoQGHwzOHlqLyz7oDOSk,4992
44
44
  nv_ingest/framework/orchestration/ray/stages/extractors/pptx_extractor.py,sha256=RMbbl7Cuj4BT-TcgUx_0k8R-DLdw-o3fHxcIBIgrWt4,3776
45
- nv_ingest/framework/orchestration/ray/stages/extractors/table_extractor.py,sha256=YvCsBD4hxzgY-vGQmDwXVhleClMj2PHzsX71I5_VM_o,4079
45
+ nv_ingest/framework/orchestration/ray/stages/extractors/table_extractor.py,sha256=p71ktv6v5T-9npYpCbgbwW6-fS-65UWS7rCm8OWr2Bc,4170
46
46
  nv_ingest/framework/orchestration/ray/stages/injectors/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
47
- nv_ingest/framework/orchestration/ray/stages/injectors/metadata_injector.py,sha256=b4yve-J7ZMURSSuOPzSvfdIcyZ9fX8d-q7cYnXuxgsM,7025
47
+ nv_ingest/framework/orchestration/ray/stages/injectors/metadata_injector.py,sha256=gTPRFOoUGcwNrmPeqv4n5VmU-LBkha9QTYHO0ntiaIk,7116
48
48
  nv_ingest/framework/orchestration/ray/stages/meta/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
49
49
  nv_ingest/framework/orchestration/ray/stages/meta/ray_actor_edge_base.py,sha256=LnVqBJmpfCmcI-eJLbkwK-7SS-hpEp98P4iCRv_Zhb0,1726
50
50
  nv_ingest/framework/orchestration/ray/stages/meta/ray_actor_sink_stage_base.py,sha256=HQJXIuU7VjiQ6fQjHjbNNmIJX5f30cXFB0CJGixgwVo,3633
51
51
  nv_ingest/framework/orchestration/ray/stages/meta/ray_actor_source_stage_base.py,sha256=hP25MLTP2bOEEncrYdxPPqeRyRVbij8aEurR1F1ZmhE,1811
52
52
  nv_ingest/framework/orchestration/ray/stages/meta/ray_actor_stage_base.py,sha256=qiB_ZU5_3bXgvE9C2rvnXIS0Alm6M5PWLCeQm8ZxOy4,29812
53
53
  nv_ingest/framework/orchestration/ray/stages/mutate/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
54
- nv_ingest/framework/orchestration/ray/stages/mutate/image_dedup.py,sha256=ipH-3dctKaXRbjfkcXfpKRPXJBHXEosqPpm_Gb-5PZ0,3618
55
- nv_ingest/framework/orchestration/ray/stages/mutate/image_filter.py,sha256=-UkLArpgP1cr433dQDzO0g5Wn8cpvjqK6RGamufO5gQ,3432
54
+ nv_ingest/framework/orchestration/ray/stages/mutate/image_dedup.py,sha256=cPLG3ZEqhZkRiSsbL7cbF1zsvOAimd8K5O-qadUR9Mg,3709
55
+ nv_ingest/framework/orchestration/ray/stages/mutate/image_filter.py,sha256=f1CS8x9uifY1FJ_1lUF0fNNMExvM4zBIF012gxnSpqU,3523
56
56
  nv_ingest/framework/orchestration/ray/stages/sinks/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
57
57
  nv_ingest/framework/orchestration/ray/stages/sinks/default_drain.py,sha256=_USW1Vq8G2Wn-QFdPfFQCrtKG46hHeJvkEGbBxdpbVM,1488
58
58
  nv_ingest/framework/orchestration/ray/stages/sinks/message_broker_task_sink.py,sha256=QcvMQXIJ7EWIxty76Mo5Xv38Oj6X2KuS8qXQlf7E1uA,11676
59
59
  nv_ingest/framework/orchestration/ray/stages/sources/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
60
- nv_ingest/framework/orchestration/ray/stages/sources/message_broker_task_source.py,sha256=A_D17mOqTh1a-4_FbcEUzPOhCxK7gqrXdEHXHpnHTcU,22163
60
+ nv_ingest/framework/orchestration/ray/stages/sources/message_broker_task_source.py,sha256=Qm9XtTNX2CcUAlZRw33BS3Ql0djcsMGp52FPA2zHu3Q,22340
61
61
  nv_ingest/framework/orchestration/ray/stages/storage/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
62
62
  nv_ingest/framework/orchestration/ray/stages/storage/image_storage.py,sha256=WZN_-3Li-izDaPtk8IMrtn2os1ckT3U8Rb2PsfOWrcI,4009
63
- nv_ingest/framework/orchestration/ray/stages/storage/store_embeddings.py,sha256=4-bV4lIAdeylBeBHMO-6bVa2xilhPdZqkwfM8OwI2rM,3456
63
+ nv_ingest/framework/orchestration/ray/stages/storage/store_embeddings.py,sha256=EUtwhSDf-qGLVEhWEInr1VaLsvpcHUSyzCmHQVai-Ps,3547
64
64
  nv_ingest/framework/orchestration/ray/stages/telemetry/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
65
65
  nv_ingest/framework/orchestration/ray/stages/telemetry/job_counter.py,sha256=jEtEUibqs6IS6QakrzWY9zmxSUzuBpg_hzXy2R-I10Y,2870
66
66
  nv_ingest/framework/orchestration/ray/stages/telemetry/otel_meter.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
67
67
  nv_ingest/framework/orchestration/ray/stages/telemetry/otel_tracer.py,sha256=GqFwRpTlIu2qgb08B3OqVIKUG8QQAwSOHhjvnyL_9UE,8553
68
68
  nv_ingest/framework/orchestration/ray/stages/transforms/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
69
- nv_ingest/framework/orchestration/ray/stages/transforms/image_caption.py,sha256=Ghg09z5fSH0uyGplJPybE1e6sCD9IFpkGjzU3x8zd9o,3616
70
- nv_ingest/framework/orchestration/ray/stages/transforms/text_embed.py,sha256=RT4SkyjHPSJS7TuQhIcNW3B5a2tahEEtlxwB7M2UBYk,3309
71
- nv_ingest/framework/orchestration/ray/stages/transforms/text_splitter.py,sha256=D8HGPwOCqgCA6PMoeBAHaxKfLUgPhTlSP84uiujskYM,4829
69
+ nv_ingest/framework/orchestration/ray/stages/transforms/image_caption.py,sha256=GYF41y_teXMIzB24JQXuesVmvksmgNvTGYU3uU4TzbM,3742
70
+ nv_ingest/framework/orchestration/ray/stages/transforms/text_embed.py,sha256=o6QPd3GCPxbAvQFeb1oByOP5LII-FVkKbmAkBjCioB0,3435
71
+ nv_ingest/framework/orchestration/ray/stages/transforms/text_splitter.py,sha256=FAScWaZijrJHc5F5jgulHP_cdX2telS4pq3spwliFXw,4963
72
72
  nv_ingest/framework/orchestration/ray/stages/utility/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
73
73
  nv_ingest/framework/orchestration/ray/stages/utility/throughput_monitor.py,sha256=J7Qs745rt7cQlR3L2K9U6Mb_BDKUNpl_xoqCZMEPlks,2674
74
74
  nv_ingest/framework/orchestration/ray/util/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
@@ -113,8 +113,8 @@ nv_ingest/pipeline/pipeline_schema.py,sha256=rLZZz2It2o2hVNWrZUJU8CarrqRei1fho3Z
113
113
  nv_ingest/pipeline/config/__init__.py,sha256=wQSlVx3T14ZgQAt-EPzEczQusXVW0W8yynnUaFFGE3s,143
114
114
  nv_ingest/pipeline/config/loaders.py,sha256=75Yr9WYO7j7ghvKTnYLfZXQZEH3J3VEZo5J4TunC_Us,7590
115
115
  nv_ingest/pipeline/config/replica_resolver.py,sha256=3zjh8gmepEYORFZRM4inq7GoBW0YL3gzUDiixUugjzQ,8899
116
- nv_ingest-2025.8.20.dev20250820.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
117
- nv_ingest-2025.8.20.dev20250820.dist-info/METADATA,sha256=1ebyXL2wfHlv6B2_21Jvawg4mMmicYmf_GCKLMk5aNo,15061
118
- nv_ingest-2025.8.20.dev20250820.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
119
- nv_ingest-2025.8.20.dev20250820.dist-info/top_level.txt,sha256=sjb0ajIsgn3YgftSjZHlYO0HjYAIIhNuXG_AmywCvaU,10
120
- nv_ingest-2025.8.20.dev20250820.dist-info/RECORD,,
116
+ nv_ingest-2025.8.22.dev20250822.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
117
+ nv_ingest-2025.8.22.dev20250822.dist-info/METADATA,sha256=8YzCR5EKProTRxaNYN9EiuR0Y5F9hJfFs1_Z6euw40s,15061
118
+ nv_ingest-2025.8.22.dev20250822.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
119
+ nv_ingest-2025.8.22.dev20250822.dist-info/top_level.txt,sha256=sjb0ajIsgn3YgftSjZHlYO0HjYAIIhNuXG_AmywCvaU,10
120
+ nv_ingest-2025.8.22.dev20250822.dist-info/RECORD,,