data-designer 0.3.1__py3-none-any.whl → 0.3.3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data_designer/__init__.py +1 -1
- data_designer/_version.py +2 -2
- data_designer/cli/__init__.py +1 -1
- data_designer/cli/commands/__init__.py +1 -1
- data_designer/cli/commands/download.py +1 -1
- data_designer/cli/commands/list.py +1 -1
- data_designer/cli/commands/models.py +1 -1
- data_designer/cli/commands/providers.py +1 -1
- data_designer/cli/commands/reset.py +1 -1
- data_designer/cli/controllers/__init__.py +1 -1
- data_designer/cli/controllers/download_controller.py +1 -1
- data_designer/cli/controllers/model_controller.py +1 -1
- data_designer/cli/controllers/provider_controller.py +1 -1
- data_designer/cli/forms/__init__.py +1 -1
- data_designer/cli/forms/builder.py +1 -1
- data_designer/cli/forms/field.py +1 -1
- data_designer/cli/forms/form.py +1 -1
- data_designer/cli/forms/model_builder.py +1 -1
- data_designer/cli/forms/provider_builder.py +1 -1
- data_designer/cli/main.py +1 -1
- data_designer/cli/repositories/__init__.py +1 -1
- data_designer/cli/repositories/base.py +1 -1
- data_designer/cli/repositories/model_repository.py +1 -1
- data_designer/cli/repositories/persona_repository.py +1 -1
- data_designer/cli/repositories/provider_repository.py +1 -1
- data_designer/cli/services/__init__.py +1 -1
- data_designer/cli/services/download_service.py +1 -1
- data_designer/cli/services/model_service.py +1 -1
- data_designer/cli/services/provider_service.py +1 -1
- data_designer/cli/ui.py +1 -1
- data_designer/cli/utils.py +1 -1
- data_designer/config/__init__.py +1 -1
- data_designer/config/analysis/__init__.py +1 -1
- data_designer/config/analysis/column_profilers.py +1 -1
- data_designer/config/analysis/column_statistics.py +1 -1
- data_designer/config/analysis/dataset_profiler.py +1 -1
- data_designer/config/analysis/utils/errors.py +1 -1
- data_designer/config/analysis/utils/reporting.py +1 -1
- data_designer/config/base.py +1 -1
- data_designer/config/column_configs.py +1 -1
- data_designer/config/column_types.py +1 -36
- data_designer/config/config_builder.py +4 -21
- data_designer/config/data_designer_config.py +1 -1
- data_designer/config/dataset_builders.py +1 -1
- data_designer/config/default_model_settings.py +1 -1
- data_designer/config/errors.py +1 -1
- data_designer/config/exports.py +1 -1
- data_designer/config/interface.py +1 -1
- data_designer/config/models.py +1 -1
- data_designer/config/preview_results.py +1 -1
- data_designer/config/processors.py +1 -1
- data_designer/config/run_config.py +1 -1
- data_designer/config/sampler_constraints.py +1 -1
- data_designer/config/sampler_params.py +1 -1
- data_designer/config/seed.py +2 -2
- data_designer/config/seed_source.py +2 -8
- data_designer/config/seed_source_types.py +17 -0
- data_designer/config/utils/code_lang.py +1 -1
- data_designer/config/utils/constants.py +1 -1
- data_designer/config/utils/errors.py +1 -1
- data_designer/config/utils/info.py +1 -1
- data_designer/config/utils/io_helpers.py +1 -1
- data_designer/config/utils/misc.py +1 -1
- data_designer/config/utils/numerical_helpers.py +1 -1
- data_designer/config/utils/type_helpers.py +1 -1
- data_designer/config/utils/visualization.py +1 -1
- data_designer/config/validator_params.py +1 -1
- data_designer/engine/__init__.py +1 -1
- data_designer/engine/analysis/column_profilers/base.py +1 -1
- data_designer/engine/analysis/column_profilers/judge_score_profiler.py +1 -3
- data_designer/engine/analysis/column_profilers/registry.py +1 -1
- data_designer/engine/analysis/column_statistics.py +1 -1
- data_designer/engine/analysis/dataset_profiler.py +1 -1
- data_designer/engine/analysis/errors.py +1 -1
- data_designer/engine/analysis/utils/column_statistics_calculations.py +1 -1
- data_designer/engine/analysis/utils/judge_score_processing.py +1 -1
- data_designer/engine/column_generators/__init__.py +1 -1
- data_designer/engine/column_generators/generators/__init__.py +1 -1
- data_designer/engine/column_generators/generators/base.py +26 -14
- data_designer/engine/column_generators/generators/embedding.py +3 -6
- data_designer/engine/column_generators/generators/expression.py +3 -2
- data_designer/engine/column_generators/generators/llm_completion.py +8 -13
- data_designer/engine/column_generators/generators/samplers.py +3 -3
- data_designer/engine/column_generators/generators/seed_dataset.py +4 -3
- data_designer/engine/column_generators/generators/validation.py +3 -2
- data_designer/engine/column_generators/registry.py +1 -1
- data_designer/engine/column_generators/utils/errors.py +1 -1
- data_designer/engine/column_generators/utils/generator_classification.py +41 -0
- data_designer/engine/column_generators/utils/judge_score_factory.py +1 -1
- data_designer/engine/column_generators/utils/prompt_renderer.py +1 -1
- data_designer/engine/compiler.py +1 -1
- data_designer/engine/configurable_task.py +3 -13
- data_designer/engine/dataset_builders/artifact_storage.py +1 -1
- data_designer/engine/dataset_builders/column_wise_builder.py +8 -5
- data_designer/engine/dataset_builders/errors.py +1 -1
- data_designer/engine/dataset_builders/multi_column_configs.py +1 -1
- data_designer/engine/dataset_builders/utils/__init__.py +1 -1
- data_designer/engine/dataset_builders/utils/concurrency.py +25 -3
- data_designer/engine/dataset_builders/utils/config_compiler.py +1 -1
- data_designer/engine/dataset_builders/utils/dag.py +3 -2
- data_designer/engine/dataset_builders/utils/dataset_batch_manager.py +1 -1
- data_designer/engine/dataset_builders/utils/errors.py +1 -1
- data_designer/engine/errors.py +1 -1
- data_designer/engine/model_provider.py +1 -1
- data_designer/engine/models/__init__.py +1 -1
- data_designer/engine/models/errors.py +1 -1
- data_designer/engine/models/facade.py +1 -1
- data_designer/engine/models/litellm_overrides.py +1 -1
- data_designer/engine/models/parsers/__init__.py +1 -1
- data_designer/engine/models/parsers/errors.py +1 -1
- data_designer/engine/models/parsers/parser.py +1 -1
- data_designer/engine/models/parsers/postprocessors.py +1 -1
- data_designer/engine/models/parsers/tag_parsers.py +1 -1
- data_designer/engine/models/parsers/types.py +1 -1
- data_designer/engine/models/recipes/base.py +1 -1
- data_designer/engine/models/recipes/response_recipes.py +1 -1
- data_designer/engine/models/registry.py +1 -1
- data_designer/engine/models/telemetry.py +1 -1
- data_designer/engine/models/usage.py +1 -1
- data_designer/engine/models/utils.py +1 -1
- data_designer/engine/processing/ginja/__init__.py +1 -1
- data_designer/engine/processing/ginja/ast.py +1 -1
- data_designer/engine/processing/ginja/environment.py +1 -1
- data_designer/engine/processing/ginja/exceptions.py +1 -1
- data_designer/engine/processing/ginja/record.py +1 -1
- data_designer/engine/processing/gsonschema/__init__.py +1 -1
- data_designer/engine/processing/gsonschema/exceptions.py +1 -1
- data_designer/engine/processing/gsonschema/schema_transformers.py +1 -1
- data_designer/engine/processing/gsonschema/types.py +1 -1
- data_designer/engine/processing/gsonschema/validators.py +1 -1
- data_designer/engine/processing/processors/base.py +3 -1
- data_designer/engine/processing/processors/drop_columns.py +1 -2
- data_designer/engine/processing/processors/registry.py +1 -1
- data_designer/engine/processing/processors/schema_transform.py +1 -2
- data_designer/engine/processing/utils.py +1 -1
- data_designer/engine/registry/base.py +1 -1
- data_designer/engine/registry/data_designer_registry.py +1 -1
- data_designer/engine/registry/errors.py +1 -1
- data_designer/engine/resources/managed_dataset_generator.py +1 -1
- data_designer/engine/resources/managed_dataset_repository.py +1 -1
- data_designer/engine/resources/managed_storage.py +1 -1
- data_designer/engine/resources/resource_provider.py +1 -1
- data_designer/engine/resources/seed_reader.py +1 -1
- data_designer/engine/sampling_gen/column.py +1 -1
- data_designer/engine/sampling_gen/constraints.py +1 -1
- data_designer/engine/sampling_gen/data_sources/base.py +1 -1
- data_designer/engine/sampling_gen/data_sources/errors.py +1 -1
- data_designer/engine/sampling_gen/data_sources/sources.py +1 -1
- data_designer/engine/sampling_gen/entities/__init__.py +1 -1
- data_designer/engine/sampling_gen/entities/dataset_based_person_fields.py +1 -1
- data_designer/engine/sampling_gen/entities/email_address_utils.py +1 -1
- data_designer/engine/sampling_gen/entities/errors.py +1 -1
- data_designer/engine/sampling_gen/entities/national_id_utils.py +1 -1
- data_designer/engine/sampling_gen/entities/person.py +1 -1
- data_designer/engine/sampling_gen/entities/phone_number.py +1 -1
- data_designer/engine/sampling_gen/errors.py +1 -1
- data_designer/engine/sampling_gen/generator.py +1 -1
- data_designer/engine/sampling_gen/jinja_utils.py +1 -1
- data_designer/engine/sampling_gen/people_gen.py +1 -1
- data_designer/engine/sampling_gen/person_constants.py +1 -1
- data_designer/engine/sampling_gen/schema.py +1 -1
- data_designer/engine/sampling_gen/schema_builder.py +1 -1
- data_designer/engine/sampling_gen/utils.py +1 -1
- data_designer/engine/secret_resolver.py +1 -1
- data_designer/engine/validation.py +3 -2
- data_designer/engine/validators/__init__.py +1 -1
- data_designer/engine/validators/base.py +1 -1
- data_designer/engine/validators/local_callable.py +1 -1
- data_designer/engine/validators/python.py +1 -1
- data_designer/engine/validators/remote.py +1 -1
- data_designer/engine/validators/sql.py +1 -1
- data_designer/errors.py +1 -1
- data_designer/essentials/__init__.py +1 -1
- data_designer/interface/__init__.py +1 -1
- data_designer/interface/data_designer.py +5 -1
- data_designer/interface/errors.py +1 -1
- data_designer/interface/results.py +1 -1
- data_designer/logging.py +1 -1
- data_designer/plugin_manager.py +14 -7
- data_designer/plugins/__init__.py +1 -1
- data_designer/plugins/errors.py +1 -1
- data_designer/plugins/plugin.py +4 -1
- data_designer/plugins/registry.py +1 -1
- data_designer/plugins/testing/__init__.py +1 -1
- data_designer/plugins/testing/stubs.py +1 -8
- data_designer/plugins/testing/utils.py +10 -3
- {data_designer-0.3.1.dist-info → data_designer-0.3.3.dist-info}/METADATA +3 -3
- data_designer-0.3.3.dist-info/RECORD +193 -0
- data_designer-0.3.1.dist-info/RECORD +0 -191
- {data_designer-0.3.1.dist-info → data_designer-0.3.3.dist-info}/WHEEL +0 -0
- {data_designer-0.3.1.dist-info → data_designer-0.3.3.dist-info}/entry_points.txt +0 -0
- {data_designer-0.3.1.dist-info → data_designer-0.3.3.dist-info}/licenses/LICENSE +0 -0
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from data_designer.engine.errors import DataDesignerError
|
data_designer/engine/errors.py
CHANGED
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from pydantic import BaseModel, Field
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from functools import cached_property
|
|
@@ -1,2 +1,2 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from __future__ import annotations
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from __future__ import annotations
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from __future__ import annotations
|
|
@@ -1,2 +1,2 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from functools import reduce
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from lxml.etree import _Element
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from typing import Any, Protocol, runtime_checkable
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from __future__ import annotations
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from __future__ import annotations
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from __future__ import annotations
|
|
@@ -1,2 +1,2 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from collections import deque
|
|
@@ -1,2 +1,2 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from jsonschema import ValidationError
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from copy import deepcopy
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from typing import Any, TypeVar
|
|
@@ -1,6 +1,8 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
|
+
from __future__ import annotations
|
|
5
|
+
|
|
4
6
|
from abc import ABC, abstractmethod
|
|
5
7
|
|
|
6
8
|
from data_designer.engine.configurable_task import ConfigurableTask, ConfigurableTaskMetadata, DataT, TaskConfigT
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
import logging
|
|
@@ -19,7 +19,6 @@ class DropColumnsProcessor(Processor[DropColumnsProcessorConfig]):
|
|
|
19
19
|
return ConfigurableTaskMetadata(
|
|
20
20
|
name="drop_columns_processor",
|
|
21
21
|
description="Drop columns from the input dataset.",
|
|
22
|
-
required_resources=None,
|
|
23
22
|
)
|
|
24
23
|
|
|
25
24
|
def process(self, data: pd.DataFrame, *, current_batch_number: int | None = None) -> pd.DataFrame:
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from data_designer.config.base import ConfigBase
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
import json
|
|
@@ -22,7 +22,6 @@ class SchemaTransformProcessor(WithJinja2UserTemplateRendering, Processor[Schema
|
|
|
22
22
|
return ConfigurableTaskMetadata(
|
|
23
23
|
name="schema_transform_processor",
|
|
24
24
|
description="Generate dataset with transformed schema using a Jinja2 template.",
|
|
25
|
-
required_resources=None,
|
|
26
25
|
)
|
|
27
26
|
|
|
28
27
|
@property
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from data_designer.engine.analysis.column_profilers.registry import (
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from data_designer.engine.errors import DataDesignerError
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from data_designer.config.base import ConfigBase
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c)
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from abc import ABC, abstractmethod
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from abc import ABC, abstractmethod
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from abc import ABC, abstractmethod
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from data_designer.engine.sampling_gen.errors import SamplingGenError
|
|
@@ -1,2 +1,2 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from data_designer.errors import DataDesignerError
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from data_designer.engine.errors import DataDesignerError
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from __future__ import annotations
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from __future__ import annotations
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from typing import NamedTuple
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from __future__ import annotations
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from copy import deepcopy
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from __future__ import annotations
|
|
@@ -14,7 +14,7 @@ from rich.console import Console, Group
|
|
|
14
14
|
from rich.padding import Padding
|
|
15
15
|
from rich.panel import Panel
|
|
16
16
|
|
|
17
|
-
from data_designer.config.column_types import ColumnConfigT, DataDesignerColumnType, column_type_is_model_generated
|
|
17
|
+
from data_designer.config.column_types import ColumnConfigT, DataDesignerColumnType
|
|
18
18
|
from data_designer.config.processors import ProcessorConfigT, ProcessorType
|
|
19
19
|
from data_designer.config.utils.constants import RICH_CONSOLE_THEME
|
|
20
20
|
from data_designer.config.utils.misc import (
|
|
@@ -22,6 +22,7 @@ from data_designer.config.utils.misc import (
|
|
|
22
22
|
get_prompt_template_keywords,
|
|
23
23
|
)
|
|
24
24
|
from data_designer.config.validator_params import ValidatorType
|
|
25
|
+
from data_designer.engine.column_generators.utils.generator_classification import column_type_is_model_generated
|
|
25
26
|
|
|
26
27
|
|
|
27
28
|
class ViolationType(str, Enum):
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from data_designer.engine.validators.base import BaseValidator, ValidationResult
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from abc import ABC, abstractmethod
|
data_designer/errors.py
CHANGED
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from data_designer.config.default_model_settings import resolve_seed_default_model_settings
|
|
@@ -1,2 +1,2 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
import logging
|
|
@@ -60,6 +60,8 @@ from data_designer.interface.errors import (
|
|
|
60
60
|
)
|
|
61
61
|
from data_designer.interface.results import DatasetCreationResults
|
|
62
62
|
from data_designer.logging import RandomEmoji
|
|
63
|
+
from data_designer.plugins.plugin import PluginType
|
|
64
|
+
from data_designer.plugins.registry import PluginRegistry
|
|
63
65
|
|
|
64
66
|
DEFAULT_BUFFER_SIZE = 1000
|
|
65
67
|
|
|
@@ -70,6 +72,8 @@ DEFAULT_SEED_READERS = [
|
|
|
70
72
|
LocalFileSeedReader(),
|
|
71
73
|
DataFrameSeedReader(),
|
|
72
74
|
]
|
|
75
|
+
for plugin in PluginRegistry().get_plugins(PluginType.SEED_READER):
|
|
76
|
+
DEFAULT_SEED_READERS.append(plugin.impl_cls())
|
|
73
77
|
|
|
74
78
|
logger = logging.getLogger(__name__)
|
|
75
79
|
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from data_designer.errors import DataDesignerError
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
2
|
# SPDX-License-Identifier: Apache-2.0
|
|
3
3
|
|
|
4
4
|
from __future__ import annotations
|
data_designer/logging.py
CHANGED