data-designer 0.3.0__tar.gz → 0.3.2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {data_designer-0.3.0 → data_designer-0.3.2}/.github/workflows/ci.yml +26 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/.gitignore +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/Makefile +10 -4
- {data_designer-0.3.0 → data_designer-0.3.2}/PKG-INFO +2 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/README.md +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/colab_notebooks/1-the-basics.ipynb +33 -33
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/colab_notebooks/2-structured-outputs-and-jinja-expressions.ipynb +30 -30
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/colab_notebooks/3-seeding-with-a-dataset.ipynb +27 -27
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/colab_notebooks/4-providing-images-as-context.ipynb +34 -34
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/notebook_source/1-the-basics.py +2 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/notebook_source/2-structured-outputs-and-jinja-expressions.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/plugins/example.md +0 -3
- data_designer-0.3.2/e2e_tests/pyproject.toml +38 -0
- data_designer-0.3.2/e2e_tests/src/data_designer_e2e_tests/plugins/__init__.py +2 -0
- data_designer-0.3.2/e2e_tests/src/data_designer_e2e_tests/plugins/column_generator/__init__.py +2 -0
- data_designer-0.3.2/e2e_tests/src/data_designer_e2e_tests/plugins/column_generator/config.py +12 -0
- data_designer-0.3.2/e2e_tests/src/data_designer_e2e_tests/plugins/column_generator/impl.py +26 -0
- data_designer-0.3.2/e2e_tests/src/data_designer_e2e_tests/plugins/column_generator/plugin.py +10 -0
- data_designer-0.3.2/e2e_tests/src/data_designer_e2e_tests/plugins/seed_reader/__init__.py +2 -0
- data_designer-0.3.2/e2e_tests/src/data_designer_e2e_tests/plugins/seed_reader/config.py +13 -0
- data_designer-0.3.2/e2e_tests/src/data_designer_e2e_tests/plugins/seed_reader/impl.py +15 -0
- data_designer-0.3.2/e2e_tests/src/data_designer_e2e_tests/plugins/seed_reader/plugin.py +10 -0
- data_designer-0.3.2/e2e_tests/tests/test_e2e.py +73 -0
- data_designer-0.3.2/e2e_tests/tests/test_seed.csv +4 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/pyproject.toml +1 -1
- data_designer-0.3.2/scripts/test_license_headers.py +899 -0
- data_designer-0.3.2/scripts/update_license_headers.py +373 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/__init__.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/_version.py +2 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/__init__.py +1 -1
- data_designer-0.3.2/src/data_designer/cli/commands/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/commands/download.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/commands/list.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/commands/models.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/commands/providers.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/commands/reset.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/controllers/__init__.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/controllers/download_controller.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/controllers/model_controller.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/controllers/provider_controller.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/forms/__init__.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/forms/builder.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/forms/field.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/forms/form.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/forms/model_builder.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/forms/provider_builder.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/main.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/repositories/__init__.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/repositories/base.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/repositories/model_repository.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/repositories/persona_repository.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/repositories/provider_repository.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/services/__init__.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/services/download_service.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/services/model_service.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/services/provider_service.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/ui.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/utils.py +1 -1
- data_designer-0.3.2/src/data_designer/config/__init__.py +2 -0
- data_designer-0.3.2/src/data_designer/config/analysis/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/analysis/column_profilers.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/analysis/column_statistics.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/analysis/dataset_profiler.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/analysis/utils/errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/analysis/utils/reporting.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/base.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/column_configs.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/column_types.py +1 -36
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/config_builder.py +4 -21
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/data_designer_config.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/dataset_builders.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/default_model_settings.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/exports.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/interface.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/models.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/preview_results.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/processors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/run_config.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/sampler_constraints.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/sampler_params.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/seed.py +2 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/seed_source.py +15 -10
- data_designer-0.3.2/src/data_designer/config/seed_source_types.py +17 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/utils/code_lang.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/utils/constants.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/utils/errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/utils/info.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/utils/io_helpers.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/utils/misc.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/utils/numerical_helpers.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/utils/type_helpers.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/utils/visualization.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/config/validator_params.py +1 -1
- data_designer-0.3.2/src/data_designer/engine/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/analysis/column_profilers/base.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/analysis/column_profilers/judge_score_profiler.py +1 -3
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/analysis/column_profilers/registry.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/analysis/column_statistics.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/analysis/dataset_profiler.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/analysis/errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/analysis/utils/column_statistics_calculations.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/analysis/utils/judge_score_processing.py +1 -1
- data_designer-0.3.2/src/data_designer/engine/column_generators/__init__.py +2 -0
- data_designer-0.3.2/src/data_designer/engine/column_generators/generators/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/column_generators/generators/base.py +26 -14
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/column_generators/generators/embedding.py +3 -6
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/column_generators/generators/expression.py +3 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/column_generators/generators/llm_completion.py +8 -13
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/column_generators/generators/samplers.py +3 -3
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/column_generators/generators/seed_dataset.py +4 -3
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/column_generators/generators/validation.py +3 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/column_generators/registry.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/column_generators/utils/errors.py +1 -1
- data_designer-0.3.2/src/data_designer/engine/column_generators/utils/generator_classification.py +41 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/column_generators/utils/judge_score_factory.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/column_generators/utils/prompt_renderer.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/compiler.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/configurable_task.py +3 -13
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/dataset_builders/artifact_storage.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/dataset_builders/column_wise_builder.py +8 -5
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/dataset_builders/errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/dataset_builders/multi_column_configs.py +1 -1
- data_designer-0.3.2/src/data_designer/engine/dataset_builders/utils/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/dataset_builders/utils/concurrency.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/dataset_builders/utils/config_compiler.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/dataset_builders/utils/dag.py +3 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/dataset_builders/utils/dataset_batch_manager.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/dataset_builders/utils/errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/model_provider.py +1 -1
- data_designer-0.3.2/src/data_designer/engine/models/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/models/errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/models/facade.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/models/litellm_overrides.py +1 -1
- data_designer-0.3.2/src/data_designer/engine/models/parsers/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/models/parsers/errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/models/parsers/parser.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/models/parsers/postprocessors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/models/parsers/tag_parsers.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/models/parsers/types.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/models/recipes/base.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/models/recipes/response_recipes.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/models/registry.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/models/telemetry.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/models/usage.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/models/utils.py +1 -1
- data_designer-0.3.2/src/data_designer/engine/processing/ginja/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/processing/ginja/ast.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/processing/ginja/environment.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/processing/ginja/exceptions.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/processing/ginja/record.py +1 -1
- data_designer-0.3.2/src/data_designer/engine/processing/gsonschema/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/processing/gsonschema/exceptions.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/processing/gsonschema/schema_transformers.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/processing/gsonschema/types.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/processing/gsonschema/validators.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/processing/processors/base.py +3 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/processing/processors/drop_columns.py +1 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/processing/processors/registry.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/processing/processors/schema_transform.py +1 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/processing/utils.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/registry/base.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/registry/data_designer_registry.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/registry/errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/resources/managed_dataset_generator.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/resources/managed_dataset_repository.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/resources/managed_storage.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/resources/resource_provider.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/resources/seed_reader.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/column.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/constraints.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/data_sources/base.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/data_sources/errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/data_sources/sources.py +1 -1
- data_designer-0.3.2/src/data_designer/engine/sampling_gen/entities/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/entities/dataset_based_person_fields.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/entities/email_address_utils.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/entities/errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/entities/national_id_utils.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/entities/person.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/entities/phone_number.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/generator.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/jinja_utils.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/people_gen.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/person_constants.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/schema.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/schema_builder.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/utils.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/secret_resolver.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/validation.py +3 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/validators/__init__.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/validators/base.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/validators/local_callable.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/validators/python.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/validators/remote.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/validators/sql.py +1 -1
- data_designer-0.3.2/src/data_designer/errors.py +5 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/essentials/__init__.py +1 -1
- data_designer-0.3.2/src/data_designer/interface/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/interface/data_designer.py +5 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/interface/errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/interface/results.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/logging.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/plugin_manager.py +14 -7
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/plugins/__init__.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/plugins/errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/plugins/plugin.py +4 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/plugins/registry.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/plugins/testing/__init__.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/plugins/testing/stubs.py +1 -8
- data_designer-0.3.2/src/data_designer/plugins/testing/utils.py +18 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/commands/test_download_command.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/commands/test_list_command.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/commands/test_models_command.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/commands/test_providers_command.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/commands/test_reset_command.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/conftest.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/controllers/test_download_controller.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/controllers/test_model_controller.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/controllers/test_provider_controller.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/forms/test_field.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/forms/test_form.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/forms/test_model_builder.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/forms/test_provider_builder.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/repositories/test_model_repository.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/repositories/test_persona_repository.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/repositories/test_provider_repository.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/services/test_download_service.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/services/test_model_service.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/services/test_provider_service.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/cli/test_cli_utils.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/analysis/conftest.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/analysis/test_column_statistics.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/analysis/test_dataset_profiler_results.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/analysis/utils/test_reporting.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/test_columns.py +1 -27
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/test_config_builder.py +1 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/test_data_designer_config.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/test_default_model_settings.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/test_models.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/test_processors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/test_sampler_constraints.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/test_sampler_params.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/test_seed.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/test_seed_source.py +13 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/test_validator_params.py +1 -1
- data_designer-0.3.2/tests/config/utils/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/utils/test_code_lang.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/utils/test_info.py +2 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/utils/test_io_helpers.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/utils/test_misc.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/utils/test_type_helpers.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/config/utils/test_visualization.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/conftest.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/analysis/column_profilers/test_base.py +1 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/analysis/column_profilers/test_judge_score_profiler.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/analysis/conftest.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/analysis/test_column_statistics_calculator.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/analysis/test_dataset_profiler.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/analysis/test_errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/analysis/utils/test_column_statistics_calculations.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/analysis/utils/test_judge_score_processing.py +1 -1
- data_designer-0.3.2/tests/engine/column_generators/generators/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/column_generators/generators/test_column_generator_base.py +1 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/column_generators/generators/test_embedding.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/column_generators/generators/test_expression.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/column_generators/generators/test_llm_completion_generators.py +21 -12
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/column_generators/generators/test_samplers.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/column_generators/generators/test_seed_dataset.py +2 -3
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/column_generators/generators/test_validation.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/column_generators/test_registry.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/column_generators/utils/test_column_generator_errors.py +1 -1
- data_designer-0.3.2/tests/engine/column_generators/utils/test_generator_classification.py +32 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/column_generators/utils/test_judge_score_factory.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/column_generators/utils/test_prompt_renderer.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/conftest.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/dataset_builders/test_artifact_storage.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/dataset_builders/test_column_wise_builder.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/dataset_builders/test_multi_column_configs.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/dataset_builders/utils/test_concurrency.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/dataset_builders/utils/test_config_compiler.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/dataset_builders/utils/test_dag.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/dataset_builders/utils/test_dataset_batch_manager.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/models/conftest.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/models/parsers/test_parser.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/models/parsers/test_parsers_types.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/models/parsers/test_postprocessors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/models/parsers/test_tag_parsers.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/models/recipes/test_recipe_base.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/models/recipes/test_response_recipes.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/models/test_facade.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/models/test_litellm_overrides.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/models/test_model_errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/models/test_model_registry.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/models/test_model_utils.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/models/test_usage.py +1 -1
- data_designer-0.3.2/tests/engine/processing/__init__.py +2 -0
- data_designer-0.3.2/tests/engine/processing/ginja/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/processing/ginja/test_ast.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/processing/ginja/test_environment.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/processing/ginja/test_exceptions.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/processing/ginja/test_record.py +1 -1
- data_designer-0.3.2/tests/engine/processing/gsonschema/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/processing/gsonschema/test_exceptions.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/processing/gsonschema/test_schema_transformers.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/processing/gsonschema/test_types.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/processing/gsonschema/test_validators.py +1 -1
- data_designer-0.3.2/tests/engine/processing/processors/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/processing/processors/test_drop_columns.py +1 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/processing/processors/test_registry.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/processing/processors/test_schema_transform.py +1 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/processing/test_utils.py +1 -1
- data_designer-0.3.2/tests/engine/registry/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/registry/conftest.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/registry/test_base.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/registry/test_data_designer_registry.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/registry/test_errors.py +1 -1
- data_designer-0.3.2/tests/engine/resources/__init__.py +2 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/resources/conftest.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/resources/test_managed_dataset_generator.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/resources/test_managed_dataset_repository.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/resources/test_managed_storage.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/resources/test_resource_provider.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/resources/test_seed_reader.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/sampling_gen/conftest.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/sampling_gen/data_sources/test_sampler_errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/sampling_gen/data_sources/test_sources.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/sampling_gen/entities/test_email_address_utils.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/sampling_gen/entities/test_national_id_utils.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/sampling_gen/entities/test_person.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/sampling_gen/entities/test_phone_number.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/sampling_gen/test_column.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/sampling_gen/test_constraints.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/sampling_gen/test_generator.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/sampling_gen/test_jinja_utils.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/sampling_gen/test_people_gen.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/sampling_gen/test_schema.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/sampling_gen/test_utils.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/test_compiler.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/test_configurable_task.py +8 -14
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/test_engine_errors.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/test_model_provider.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/test_secret_resolver.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/test_validation.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/validators/test_local_callable.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/validators/test_python.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/validators/test_remote.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/validators/test_sql.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/essentials/test_init.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/interface/test_data_designer.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/interface/test_results.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/plugins/test_plugin.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/plugins/test_plugin_registry.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/test_logging.py +1 -1
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/test_plugin_manager.py +1 -27
- data_designer-0.3.0/scripts/update_license_headers.py +0 -215
- data_designer-0.3.0/src/data_designer/cli/commands/__init__.py +0 -2
- data_designer-0.3.0/src/data_designer/config/__init__.py +0 -2
- data_designer-0.3.0/src/data_designer/config/analysis/__init__.py +0 -2
- data_designer-0.3.0/src/data_designer/engine/__init__.py +0 -2
- data_designer-0.3.0/src/data_designer/engine/column_generators/__init__.py +0 -2
- data_designer-0.3.0/src/data_designer/engine/column_generators/generators/__init__.py +0 -2
- data_designer-0.3.0/src/data_designer/engine/dataset_builders/utils/__init__.py +0 -2
- data_designer-0.3.0/src/data_designer/engine/models/__init__.py +0 -2
- data_designer-0.3.0/src/data_designer/engine/models/parsers/__init__.py +0 -2
- data_designer-0.3.0/src/data_designer/engine/processing/ginja/__init__.py +0 -2
- data_designer-0.3.0/src/data_designer/engine/processing/gsonschema/__init__.py +0 -2
- data_designer-0.3.0/src/data_designer/engine/sampling_gen/entities/__init__.py +0 -2
- data_designer-0.3.0/src/data_designer/errors.py +0 -5
- data_designer-0.3.0/src/data_designer/interface/__init__.py +0 -2
- data_designer-0.3.0/src/data_designer/plugins/testing/utils.py +0 -11
- data_designer-0.3.0/tests/config/utils/__init__.py +0 -2
- data_designer-0.3.0/tests/engine/column_generators/generators/__init__.py +0 -2
- data_designer-0.3.0/tests/engine/processing/__init__.py +0 -2
- data_designer-0.3.0/tests/engine/processing/ginja/__init__.py +0 -2
- data_designer-0.3.0/tests/engine/processing/gsonschema/__init__.py +0 -2
- data_designer-0.3.0/tests/engine/processing/processors/__init__.py +0 -2
- data_designer-0.3.0/tests/engine/registry/__init__.py +0 -2
- data_designer-0.3.0/tests/engine/resources/__init__.py +0 -2
- {data_designer-0.3.0 → data_designer-0.3.2}/.github/workflows/build-docs.yml +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/.github/workflows/build-notebooks.yml +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/.github/workflows/check-colab-notebooks.yml +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/.github/workflows/dco-assistant.yml +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/.github/workflows/pack-tutorials.yml +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/.github/workflows/semantic-pull-requests.yml +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/.pre-commit-config.yaml +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/AGENTS.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/CLAUDE.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/CODE_OF_CONDUCT.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/CONTRIBUTING.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/DCO +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/LICENSE +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/VERSIONING.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/CONTRIBUTING.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/assets/palette-favicon.png +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/assets/recipes/code_generation/text_to_python.py +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/assets/recipes/code_generation/text_to_sql.py +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/assets/recipes/qa_and_chat/multi_turn_chat.py +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/assets/recipes/qa_and_chat/product_info_qa.py +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/code_reference/analysis.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/code_reference/column_configs.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/code_reference/config_builder.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/code_reference/data_designer_config.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/code_reference/models.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/code_reference/processors.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/code_reference/sampler_params.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/code_reference/validator_params.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/concepts/columns.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/concepts/models/configure-model-settings-with-the-cli.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/concepts/models/custom-model-settings.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/concepts/models/default-model-settings.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/concepts/models/inference-parameters.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/concepts/models/model-configs.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/concepts/models/model-providers.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/concepts/person_sampling.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/concepts/processors.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/concepts/validators.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/css/mkdocstrings.css +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/css/style.css +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/index.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/installation.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/js/toc-toggle.js +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/notebook_source/3-seeding-with-a-dataset.py +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/notebook_source/4-providing-images-as-context.py +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/notebook_source/README.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/notebook_source/_README.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/notebook_source/_pyproject.toml +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/overrides/main.html +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/plugins/available.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/plugins/overview.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/quick-start.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/recipes/cards.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/recipes/code_generation/text_to_python.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/recipes/code_generation/text_to_sql.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/recipes/qa_and_chat/multi_turn_chat.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/recipes/qa_and_chat/product_info_qa.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/docs/scripts/generate_colab_notebooks.py +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/mkdocs.yml +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/cli/README.md +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/src/data_designer/engine/sampling_gen/entities/assets/zip_area_code_map.parquet +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/analysis/test_data/artifacts/dataset/column_configs.json +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/analysis/test_data/artifacts/dataset/dataset.json +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/analysis/test_data/artifacts/dataset/metadata.json +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/tests/engine/models/stub_secrets.json +0 -0
- {data_designer-0.3.0 → data_designer-0.3.2}/uv.lock +0 -0
|
@@ -36,6 +36,30 @@ jobs:
|
|
|
36
36
|
run: |
|
|
37
37
|
uv run pytest -v --cov=data_designer --cov-report=term-missing --cov-report=xml --cov-fail-under=90
|
|
38
38
|
|
|
39
|
+
test-e2e:
|
|
40
|
+
name: End to end test (Python ${{ matrix.python-version }} on ${{ matrix.os }})
|
|
41
|
+
runs-on: ${{ matrix.os }}
|
|
42
|
+
strategy:
|
|
43
|
+
fail-fast: false
|
|
44
|
+
matrix:
|
|
45
|
+
os: [ubuntu-latest, macos-latest]
|
|
46
|
+
python-version: ["3.10", "3.11", "3.12", "3.13"]
|
|
47
|
+
|
|
48
|
+
steps:
|
|
49
|
+
- name: Checkout code
|
|
50
|
+
uses: actions/checkout@v4
|
|
51
|
+
|
|
52
|
+
- name: Install uv
|
|
53
|
+
uses: astral-sh/setup-uv@v5
|
|
54
|
+
with:
|
|
55
|
+
version: "latest"
|
|
56
|
+
python-version: ${{ matrix.python-version }}
|
|
57
|
+
enable-cache: true
|
|
58
|
+
|
|
59
|
+
- name: Run e2e tests
|
|
60
|
+
run: |
|
|
61
|
+
make test-e2e
|
|
62
|
+
|
|
39
63
|
lint:
|
|
40
64
|
name: Lint and Format Check
|
|
41
65
|
runs-on: ubuntu-latest
|
|
@@ -70,6 +94,8 @@ jobs:
|
|
|
70
94
|
steps:
|
|
71
95
|
- name: Checkout code
|
|
72
96
|
uses: actions/checkout@v4
|
|
97
|
+
with:
|
|
98
|
+
fetch-depth: 0 # Full history needed for file creation dates
|
|
73
99
|
|
|
74
100
|
- name: Install uv
|
|
75
101
|
uses: astral-sh/setup-uv@v5
|
|
@@ -63,28 +63,34 @@ check-all-fix: format lint-fix
|
|
|
63
63
|
|
|
64
64
|
format:
|
|
65
65
|
@echo "📐 Formatting code with ruff..."
|
|
66
|
-
uv run ruff format src/ tests/ scripts/ --exclude '**/src/data_designer/_version.py'
|
|
66
|
+
uv run ruff format src/ tests/ scripts/ e2e_tests/ --exclude '**/src/data_designer/_version.py'
|
|
67
67
|
@echo "✅ Formatting complete!"
|
|
68
68
|
|
|
69
69
|
format-check:
|
|
70
70
|
@echo "📐 Checking code formatting with ruff..."
|
|
71
|
-
uv run ruff format --check src/ tests/ scripts/ --exclude '**/src/data_designer/_version.py'
|
|
71
|
+
uv run ruff format --check src/ tests/ scripts/ e2e_tests/ --exclude '**/src/data_designer/_version.py'
|
|
72
72
|
@echo "✅ Formatting check complete! Run 'make format' to auto-fix issues."
|
|
73
73
|
|
|
74
74
|
lint:
|
|
75
75
|
@echo "🔍 Linting code with ruff..."
|
|
76
|
-
uv run ruff check --output-format=full src/ tests/ scripts/ --exclude '**/src/data_designer/_version.py'
|
|
76
|
+
uv run ruff check --output-format=full src/ tests/ scripts/ e2e_tests/ --exclude '**/src/data_designer/_version.py'
|
|
77
77
|
@echo "✅ Linting complete! Run 'make lint-fix' to auto-fix issues."
|
|
78
78
|
|
|
79
79
|
lint-fix:
|
|
80
80
|
@echo "🔍 Fixing linting issues with ruff..."
|
|
81
|
-
uv run ruff check --fix src/ tests/ scripts/ --exclude '**/src/data_designer/_version.py'
|
|
81
|
+
uv run ruff check --fix src/ tests/ scripts/ e2e_tests/ --exclude '**/src/data_designer/_version.py'
|
|
82
82
|
@echo "✅ Linting with autofix complete!"
|
|
83
83
|
|
|
84
84
|
test:
|
|
85
85
|
@echo "🧪 Running unit tests..."
|
|
86
86
|
uv run --group dev pytest
|
|
87
87
|
|
|
88
|
+
test-e2e:
|
|
89
|
+
@echo "🧹 Cleaning e2e test environment..."
|
|
90
|
+
rm -rf e2e_tests/uv.lock e2e_tests/.pycache e2e_tests/.venv
|
|
91
|
+
@echo "🧪 Running e2e tests..."
|
|
92
|
+
uv run --no-cache --refresh --directory e2e_tests pytest -s
|
|
93
|
+
|
|
88
94
|
convert-execute-notebooks:
|
|
89
95
|
@echo "📓 Converting Python tutorials to notebooks and executing..."
|
|
90
96
|
@mkdir -p docs/notebooks
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: data-designer
|
|
3
|
-
Version: 0.3.
|
|
3
|
+
Version: 0.3.2
|
|
4
4
|
Summary: General framework for synthetic data generation
|
|
5
5
|
License-Expression: Apache-2.0
|
|
6
6
|
License-File: LICENSE
|
|
@@ -186,7 +186,7 @@ ModelConfig(
|
|
|
186
186
|
top_p=0.9,
|
|
187
187
|
max_tokens=4096,
|
|
188
188
|
),
|
|
189
|
-
|
|
189
|
+
)
|
|
190
190
|
```
|
|
191
191
|
|
|
192
192
|
The value `openai/gpt-oss-20b` would be collected.
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
"cells": [
|
|
3
3
|
{
|
|
4
4
|
"cell_type": "markdown",
|
|
5
|
-
"id": "
|
|
5
|
+
"id": "adb0c3cd",
|
|
6
6
|
"metadata": {},
|
|
7
7
|
"source": [
|
|
8
8
|
"# 🎨 Data Designer Tutorial: The Basics\n",
|
|
@@ -14,7 +14,7 @@
|
|
|
14
14
|
},
|
|
15
15
|
{
|
|
16
16
|
"cell_type": "markdown",
|
|
17
|
-
"id": "
|
|
17
|
+
"id": "73d42bda",
|
|
18
18
|
"metadata": {},
|
|
19
19
|
"source": [
|
|
20
20
|
"### ⚡ Colab Setup\n",
|
|
@@ -25,7 +25,7 @@
|
|
|
25
25
|
{
|
|
26
26
|
"cell_type": "code",
|
|
27
27
|
"execution_count": null,
|
|
28
|
-
"id": "
|
|
28
|
+
"id": "c6675487",
|
|
29
29
|
"metadata": {},
|
|
30
30
|
"outputs": [],
|
|
31
31
|
"source": [
|
|
@@ -36,7 +36,7 @@
|
|
|
36
36
|
{
|
|
37
37
|
"cell_type": "code",
|
|
38
38
|
"execution_count": null,
|
|
39
|
-
"id": "
|
|
39
|
+
"id": "b98ebeee",
|
|
40
40
|
"metadata": {},
|
|
41
41
|
"outputs": [],
|
|
42
42
|
"source": [
|
|
@@ -53,7 +53,7 @@
|
|
|
53
53
|
},
|
|
54
54
|
{
|
|
55
55
|
"cell_type": "markdown",
|
|
56
|
-
"id": "
|
|
56
|
+
"id": "6e2355bb",
|
|
57
57
|
"metadata": {},
|
|
58
58
|
"source": [
|
|
59
59
|
"### 📦 Import the essentials\n",
|
|
@@ -64,7 +64,7 @@
|
|
|
64
64
|
{
|
|
65
65
|
"cell_type": "code",
|
|
66
66
|
"execution_count": null,
|
|
67
|
-
"id": "
|
|
67
|
+
"id": "95bf5ae3",
|
|
68
68
|
"metadata": {},
|
|
69
69
|
"outputs": [],
|
|
70
70
|
"source": [
|
|
@@ -85,7 +85,7 @@
|
|
|
85
85
|
},
|
|
86
86
|
{
|
|
87
87
|
"cell_type": "markdown",
|
|
88
|
-
"id": "
|
|
88
|
+
"id": "ee906a92",
|
|
89
89
|
"metadata": {},
|
|
90
90
|
"source": [
|
|
91
91
|
"### ⚙️ Initialize the Data Designer interface\n",
|
|
@@ -98,7 +98,7 @@
|
|
|
98
98
|
{
|
|
99
99
|
"cell_type": "code",
|
|
100
100
|
"execution_count": null,
|
|
101
|
-
"id": "
|
|
101
|
+
"id": "15b35cb8",
|
|
102
102
|
"metadata": {},
|
|
103
103
|
"outputs": [],
|
|
104
104
|
"source": [
|
|
@@ -107,7 +107,7 @@
|
|
|
107
107
|
},
|
|
108
108
|
{
|
|
109
109
|
"cell_type": "markdown",
|
|
110
|
-
"id": "
|
|
110
|
+
"id": "999ce38a",
|
|
111
111
|
"metadata": {},
|
|
112
112
|
"source": [
|
|
113
113
|
"### 🎛️ Define model configurations\n",
|
|
@@ -124,7 +124,7 @@
|
|
|
124
124
|
{
|
|
125
125
|
"cell_type": "code",
|
|
126
126
|
"execution_count": null,
|
|
127
|
-
"id": "
|
|
127
|
+
"id": "f5ab65d5",
|
|
128
128
|
"metadata": {},
|
|
129
129
|
"outputs": [],
|
|
130
130
|
"source": [
|
|
@@ -154,7 +154,7 @@
|
|
|
154
154
|
},
|
|
155
155
|
{
|
|
156
156
|
"cell_type": "markdown",
|
|
157
|
-
"id": "
|
|
157
|
+
"id": "912d7954",
|
|
158
158
|
"metadata": {},
|
|
159
159
|
"source": [
|
|
160
160
|
"### 🏗️ Initialize the Data Designer Config Builder\n",
|
|
@@ -169,7 +169,7 @@
|
|
|
169
169
|
{
|
|
170
170
|
"cell_type": "code",
|
|
171
171
|
"execution_count": null,
|
|
172
|
-
"id": "
|
|
172
|
+
"id": "0ba83688",
|
|
173
173
|
"metadata": {},
|
|
174
174
|
"outputs": [],
|
|
175
175
|
"source": [
|
|
@@ -178,7 +178,7 @@
|
|
|
178
178
|
},
|
|
179
179
|
{
|
|
180
180
|
"cell_type": "markdown",
|
|
181
|
-
"id": "
|
|
181
|
+
"id": "ee2de21d",
|
|
182
182
|
"metadata": {},
|
|
183
183
|
"source": [
|
|
184
184
|
"## 🎲 Getting started with sampler columns\n",
|
|
@@ -195,7 +195,7 @@
|
|
|
195
195
|
{
|
|
196
196
|
"cell_type": "code",
|
|
197
197
|
"execution_count": null,
|
|
198
|
-
"id": "
|
|
198
|
+
"id": "3009cfa5",
|
|
199
199
|
"metadata": {},
|
|
200
200
|
"outputs": [],
|
|
201
201
|
"source": [
|
|
@@ -204,7 +204,7 @@
|
|
|
204
204
|
},
|
|
205
205
|
{
|
|
206
206
|
"cell_type": "markdown",
|
|
207
|
-
"id": "
|
|
207
|
+
"id": "c42c890f",
|
|
208
208
|
"metadata": {},
|
|
209
209
|
"source": [
|
|
210
210
|
"Let's start designing our product review dataset by adding product category and subcategory columns.\n"
|
|
@@ -213,7 +213,7 @@
|
|
|
213
213
|
{
|
|
214
214
|
"cell_type": "code",
|
|
215
215
|
"execution_count": null,
|
|
216
|
-
"id": "
|
|
216
|
+
"id": "16251687",
|
|
217
217
|
"metadata": {},
|
|
218
218
|
"outputs": [],
|
|
219
219
|
"source": [
|
|
@@ -294,7 +294,7 @@
|
|
|
294
294
|
},
|
|
295
295
|
{
|
|
296
296
|
"cell_type": "markdown",
|
|
297
|
-
"id": "
|
|
297
|
+
"id": "ff41c919",
|
|
298
298
|
"metadata": {},
|
|
299
299
|
"source": [
|
|
300
300
|
"Next, let's add samplers to generate data related to the customer and their review.\n"
|
|
@@ -303,7 +303,7 @@
|
|
|
303
303
|
{
|
|
304
304
|
"cell_type": "code",
|
|
305
305
|
"execution_count": null,
|
|
306
|
-
"id": "
|
|
306
|
+
"id": "78ec15fc",
|
|
307
307
|
"metadata": {},
|
|
308
308
|
"outputs": [],
|
|
309
309
|
"source": [
|
|
@@ -335,12 +335,12 @@
|
|
|
335
335
|
" )\n",
|
|
336
336
|
")\n",
|
|
337
337
|
"\n",
|
|
338
|
-
"
|
|
338
|
+
"data_designer.validate(config_builder)"
|
|
339
339
|
]
|
|
340
340
|
},
|
|
341
341
|
{
|
|
342
342
|
"cell_type": "markdown",
|
|
343
|
-
"id": "
|
|
343
|
+
"id": "8ac2131e",
|
|
344
344
|
"metadata": {},
|
|
345
345
|
"source": [
|
|
346
346
|
"## 🦜 LLM-generated columns\n",
|
|
@@ -355,7 +355,7 @@
|
|
|
355
355
|
{
|
|
356
356
|
"cell_type": "code",
|
|
357
357
|
"execution_count": null,
|
|
358
|
-
"id": "
|
|
358
|
+
"id": "d8232495",
|
|
359
359
|
"metadata": {},
|
|
360
360
|
"outputs": [],
|
|
361
361
|
"source": [
|
|
@@ -386,12 +386,12 @@
|
|
|
386
386
|
" )\n",
|
|
387
387
|
")\n",
|
|
388
388
|
"\n",
|
|
389
|
-
"
|
|
389
|
+
"data_designer.validate(config_builder)"
|
|
390
390
|
]
|
|
391
391
|
},
|
|
392
392
|
{
|
|
393
393
|
"cell_type": "markdown",
|
|
394
|
-
"id": "
|
|
394
|
+
"id": "9105ddf2",
|
|
395
395
|
"metadata": {},
|
|
396
396
|
"source": [
|
|
397
397
|
"### 🔁 Iteration is key – preview the dataset!\n",
|
|
@@ -408,7 +408,7 @@
|
|
|
408
408
|
{
|
|
409
409
|
"cell_type": "code",
|
|
410
410
|
"execution_count": null,
|
|
411
|
-
"id": "
|
|
411
|
+
"id": "a6b02b74",
|
|
412
412
|
"metadata": {},
|
|
413
413
|
"outputs": [],
|
|
414
414
|
"source": [
|
|
@@ -418,7 +418,7 @@
|
|
|
418
418
|
{
|
|
419
419
|
"cell_type": "code",
|
|
420
420
|
"execution_count": null,
|
|
421
|
-
"id": "
|
|
421
|
+
"id": "74a4a386",
|
|
422
422
|
"metadata": {},
|
|
423
423
|
"outputs": [],
|
|
424
424
|
"source": [
|
|
@@ -429,7 +429,7 @@
|
|
|
429
429
|
{
|
|
430
430
|
"cell_type": "code",
|
|
431
431
|
"execution_count": null,
|
|
432
|
-
"id": "
|
|
432
|
+
"id": "b1be4d95",
|
|
433
433
|
"metadata": {},
|
|
434
434
|
"outputs": [],
|
|
435
435
|
"source": [
|
|
@@ -439,7 +439,7 @@
|
|
|
439
439
|
},
|
|
440
440
|
{
|
|
441
441
|
"cell_type": "markdown",
|
|
442
|
-
"id": "
|
|
442
|
+
"id": "c2871df4",
|
|
443
443
|
"metadata": {},
|
|
444
444
|
"source": [
|
|
445
445
|
"### 📊 Analyze the generated data\n",
|
|
@@ -452,7 +452,7 @@
|
|
|
452
452
|
{
|
|
453
453
|
"cell_type": "code",
|
|
454
454
|
"execution_count": null,
|
|
455
|
-
"id": "
|
|
455
|
+
"id": "b2beb476",
|
|
456
456
|
"metadata": {},
|
|
457
457
|
"outputs": [],
|
|
458
458
|
"source": [
|
|
@@ -462,7 +462,7 @@
|
|
|
462
462
|
},
|
|
463
463
|
{
|
|
464
464
|
"cell_type": "markdown",
|
|
465
|
-
"id": "
|
|
465
|
+
"id": "765fb038",
|
|
466
466
|
"metadata": {},
|
|
467
467
|
"source": [
|
|
468
468
|
"### 🆙 Scale up!\n",
|
|
@@ -475,7 +475,7 @@
|
|
|
475
475
|
{
|
|
476
476
|
"cell_type": "code",
|
|
477
477
|
"execution_count": null,
|
|
478
|
-
"id": "
|
|
478
|
+
"id": "f4fc625e",
|
|
479
479
|
"metadata": {},
|
|
480
480
|
"outputs": [],
|
|
481
481
|
"source": [
|
|
@@ -485,7 +485,7 @@
|
|
|
485
485
|
{
|
|
486
486
|
"cell_type": "code",
|
|
487
487
|
"execution_count": null,
|
|
488
|
-
"id": "
|
|
488
|
+
"id": "58989731",
|
|
489
489
|
"metadata": {},
|
|
490
490
|
"outputs": [],
|
|
491
491
|
"source": [
|
|
@@ -498,7 +498,7 @@
|
|
|
498
498
|
{
|
|
499
499
|
"cell_type": "code",
|
|
500
500
|
"execution_count": null,
|
|
501
|
-
"id": "
|
|
501
|
+
"id": "80351a24",
|
|
502
502
|
"metadata": {},
|
|
503
503
|
"outputs": [],
|
|
504
504
|
"source": [
|
|
@@ -510,7 +510,7 @@
|
|
|
510
510
|
},
|
|
511
511
|
{
|
|
512
512
|
"cell_type": "markdown",
|
|
513
|
-
"id": "
|
|
513
|
+
"id": "cc79ae74",
|
|
514
514
|
"metadata": {},
|
|
515
515
|
"source": [
|
|
516
516
|
"## ⏭️ Next Steps\n",
|
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
"cells": [
|
|
3
3
|
{
|
|
4
4
|
"cell_type": "markdown",
|
|
5
|
-
"id": "
|
|
5
|
+
"id": "166f4a41",
|
|
6
6
|
"metadata": {},
|
|
7
7
|
"source": [
|
|
8
8
|
"# 🎨 Data Designer Tutorial: Structured Outputs and Jinja Expressions\n",
|
|
@@ -16,7 +16,7 @@
|
|
|
16
16
|
},
|
|
17
17
|
{
|
|
18
18
|
"cell_type": "markdown",
|
|
19
|
-
"id": "
|
|
19
|
+
"id": "00a139eb",
|
|
20
20
|
"metadata": {},
|
|
21
21
|
"source": [
|
|
22
22
|
"### ⚡ Colab Setup\n",
|
|
@@ -27,7 +27,7 @@
|
|
|
27
27
|
{
|
|
28
28
|
"cell_type": "code",
|
|
29
29
|
"execution_count": null,
|
|
30
|
-
"id": "
|
|
30
|
+
"id": "a60a4a4e",
|
|
31
31
|
"metadata": {},
|
|
32
32
|
"outputs": [],
|
|
33
33
|
"source": [
|
|
@@ -38,7 +38,7 @@
|
|
|
38
38
|
{
|
|
39
39
|
"cell_type": "code",
|
|
40
40
|
"execution_count": null,
|
|
41
|
-
"id": "
|
|
41
|
+
"id": "14fc001f",
|
|
42
42
|
"metadata": {},
|
|
43
43
|
"outputs": [],
|
|
44
44
|
"source": [
|
|
@@ -55,7 +55,7 @@
|
|
|
55
55
|
},
|
|
56
56
|
{
|
|
57
57
|
"cell_type": "markdown",
|
|
58
|
-
"id": "
|
|
58
|
+
"id": "22c4fe6b",
|
|
59
59
|
"metadata": {},
|
|
60
60
|
"source": [
|
|
61
61
|
"### 📦 Import the essentials\n",
|
|
@@ -66,7 +66,7 @@
|
|
|
66
66
|
{
|
|
67
67
|
"cell_type": "code",
|
|
68
68
|
"execution_count": null,
|
|
69
|
-
"id": "
|
|
69
|
+
"id": "b2f8e13d",
|
|
70
70
|
"metadata": {},
|
|
71
71
|
"outputs": [],
|
|
72
72
|
"source": [
|
|
@@ -87,7 +87,7 @@
|
|
|
87
87
|
},
|
|
88
88
|
{
|
|
89
89
|
"cell_type": "markdown",
|
|
90
|
-
"id": "
|
|
90
|
+
"id": "e644b2a8",
|
|
91
91
|
"metadata": {},
|
|
92
92
|
"source": [
|
|
93
93
|
"### ⚙️ Initialize the Data Designer interface\n",
|
|
@@ -100,7 +100,7 @@
|
|
|
100
100
|
{
|
|
101
101
|
"cell_type": "code",
|
|
102
102
|
"execution_count": null,
|
|
103
|
-
"id": "
|
|
103
|
+
"id": "74b146e7",
|
|
104
104
|
"metadata": {},
|
|
105
105
|
"outputs": [],
|
|
106
106
|
"source": [
|
|
@@ -109,7 +109,7 @@
|
|
|
109
109
|
},
|
|
110
110
|
{
|
|
111
111
|
"cell_type": "markdown",
|
|
112
|
-
"id": "
|
|
112
|
+
"id": "7471f914",
|
|
113
113
|
"metadata": {},
|
|
114
114
|
"source": [
|
|
115
115
|
"### 🎛️ Define model configurations\n",
|
|
@@ -126,7 +126,7 @@
|
|
|
126
126
|
{
|
|
127
127
|
"cell_type": "code",
|
|
128
128
|
"execution_count": null,
|
|
129
|
-
"id": "
|
|
129
|
+
"id": "ea1fcee5",
|
|
130
130
|
"metadata": {},
|
|
131
131
|
"outputs": [],
|
|
132
132
|
"source": [
|
|
@@ -156,7 +156,7 @@
|
|
|
156
156
|
},
|
|
157
157
|
{
|
|
158
158
|
"cell_type": "markdown",
|
|
159
|
-
"id": "
|
|
159
|
+
"id": "53855c58",
|
|
160
160
|
"metadata": {},
|
|
161
161
|
"source": [
|
|
162
162
|
"### 🏗️ Initialize the Data Designer Config Builder\n",
|
|
@@ -171,7 +171,7 @@
|
|
|
171
171
|
{
|
|
172
172
|
"cell_type": "code",
|
|
173
173
|
"execution_count": null,
|
|
174
|
-
"id": "
|
|
174
|
+
"id": "74064875",
|
|
175
175
|
"metadata": {},
|
|
176
176
|
"outputs": [],
|
|
177
177
|
"source": [
|
|
@@ -180,7 +180,7 @@
|
|
|
180
180
|
},
|
|
181
181
|
{
|
|
182
182
|
"cell_type": "markdown",
|
|
183
|
-
"id": "
|
|
183
|
+
"id": "808534e9",
|
|
184
184
|
"metadata": {},
|
|
185
185
|
"source": [
|
|
186
186
|
"### 🧑🎨 Designing our data\n",
|
|
@@ -207,7 +207,7 @@
|
|
|
207
207
|
{
|
|
208
208
|
"cell_type": "code",
|
|
209
209
|
"execution_count": null,
|
|
210
|
-
"id": "
|
|
210
|
+
"id": "26d84a29",
|
|
211
211
|
"metadata": {},
|
|
212
212
|
"outputs": [],
|
|
213
213
|
"source": [
|
|
@@ -235,7 +235,7 @@
|
|
|
235
235
|
},
|
|
236
236
|
{
|
|
237
237
|
"cell_type": "markdown",
|
|
238
|
-
"id": "
|
|
238
|
+
"id": "624111a6",
|
|
239
239
|
"metadata": {},
|
|
240
240
|
"source": [
|
|
241
241
|
"Next, let's design our product review dataset using a few more tricks compared to the previous notebook.\n"
|
|
@@ -244,7 +244,7 @@
|
|
|
244
244
|
{
|
|
245
245
|
"cell_type": "code",
|
|
246
246
|
"execution_count": null,
|
|
247
|
-
"id": "
|
|
247
|
+
"id": "c63fbc58",
|
|
248
248
|
"metadata": {},
|
|
249
249
|
"outputs": [],
|
|
250
250
|
"source": [
|
|
@@ -353,7 +353,7 @@
|
|
|
353
353
|
},
|
|
354
354
|
{
|
|
355
355
|
"cell_type": "markdown",
|
|
356
|
-
"id": "
|
|
356
|
+
"id": "60832414",
|
|
357
357
|
"metadata": {},
|
|
358
358
|
"source": [
|
|
359
359
|
"Next, we will use more advanced Jinja expressions to create new columns.\n",
|
|
@@ -370,7 +370,7 @@
|
|
|
370
370
|
{
|
|
371
371
|
"cell_type": "code",
|
|
372
372
|
"execution_count": null,
|
|
373
|
-
"id": "
|
|
373
|
+
"id": "0964aff9",
|
|
374
374
|
"metadata": {},
|
|
375
375
|
"outputs": [],
|
|
376
376
|
"source": [
|
|
@@ -418,12 +418,12 @@
|
|
|
418
418
|
" )\n",
|
|
419
419
|
")\n",
|
|
420
420
|
"\n",
|
|
421
|
-
"
|
|
421
|
+
"data_designer.validate(config_builder)"
|
|
422
422
|
]
|
|
423
423
|
},
|
|
424
424
|
{
|
|
425
425
|
"cell_type": "markdown",
|
|
426
|
-
"id": "
|
|
426
|
+
"id": "a818e85f",
|
|
427
427
|
"metadata": {},
|
|
428
428
|
"source": [
|
|
429
429
|
"### 🔁 Iteration is key – preview the dataset!\n",
|
|
@@ -440,7 +440,7 @@
|
|
|
440
440
|
{
|
|
441
441
|
"cell_type": "code",
|
|
442
442
|
"execution_count": null,
|
|
443
|
-
"id": "
|
|
443
|
+
"id": "4af25c1e",
|
|
444
444
|
"metadata": {},
|
|
445
445
|
"outputs": [],
|
|
446
446
|
"source": [
|
|
@@ -450,7 +450,7 @@
|
|
|
450
450
|
{
|
|
451
451
|
"cell_type": "code",
|
|
452
452
|
"execution_count": null,
|
|
453
|
-
"id": "
|
|
453
|
+
"id": "2594a896",
|
|
454
454
|
"metadata": {},
|
|
455
455
|
"outputs": [],
|
|
456
456
|
"source": [
|
|
@@ -461,7 +461,7 @@
|
|
|
461
461
|
{
|
|
462
462
|
"cell_type": "code",
|
|
463
463
|
"execution_count": null,
|
|
464
|
-
"id": "
|
|
464
|
+
"id": "bfffec10",
|
|
465
465
|
"metadata": {},
|
|
466
466
|
"outputs": [],
|
|
467
467
|
"source": [
|
|
@@ -471,7 +471,7 @@
|
|
|
471
471
|
},
|
|
472
472
|
{
|
|
473
473
|
"cell_type": "markdown",
|
|
474
|
-
"id": "
|
|
474
|
+
"id": "54ce7f5d",
|
|
475
475
|
"metadata": {},
|
|
476
476
|
"source": [
|
|
477
477
|
"### 📊 Analyze the generated data\n",
|
|
@@ -484,7 +484,7 @@
|
|
|
484
484
|
{
|
|
485
485
|
"cell_type": "code",
|
|
486
486
|
"execution_count": null,
|
|
487
|
-
"id": "
|
|
487
|
+
"id": "841f74c7",
|
|
488
488
|
"metadata": {},
|
|
489
489
|
"outputs": [],
|
|
490
490
|
"source": [
|
|
@@ -494,7 +494,7 @@
|
|
|
494
494
|
},
|
|
495
495
|
{
|
|
496
496
|
"cell_type": "markdown",
|
|
497
|
-
"id": "
|
|
497
|
+
"id": "14573ebb",
|
|
498
498
|
"metadata": {},
|
|
499
499
|
"source": [
|
|
500
500
|
"### 🆙 Scale up!\n",
|
|
@@ -507,7 +507,7 @@
|
|
|
507
507
|
{
|
|
508
508
|
"cell_type": "code",
|
|
509
509
|
"execution_count": null,
|
|
510
|
-
"id": "
|
|
510
|
+
"id": "49b43121",
|
|
511
511
|
"metadata": {},
|
|
512
512
|
"outputs": [],
|
|
513
513
|
"source": [
|
|
@@ -517,7 +517,7 @@
|
|
|
517
517
|
{
|
|
518
518
|
"cell_type": "code",
|
|
519
519
|
"execution_count": null,
|
|
520
|
-
"id": "
|
|
520
|
+
"id": "d74648e8",
|
|
521
521
|
"metadata": {},
|
|
522
522
|
"outputs": [],
|
|
523
523
|
"source": [
|
|
@@ -530,7 +530,7 @@
|
|
|
530
530
|
{
|
|
531
531
|
"cell_type": "code",
|
|
532
532
|
"execution_count": null,
|
|
533
|
-
"id": "
|
|
533
|
+
"id": "c811b234",
|
|
534
534
|
"metadata": {},
|
|
535
535
|
"outputs": [],
|
|
536
536
|
"source": [
|
|
@@ -542,7 +542,7 @@
|
|
|
542
542
|
},
|
|
543
543
|
{
|
|
544
544
|
"cell_type": "markdown",
|
|
545
|
-
"id": "
|
|
545
|
+
"id": "56509580",
|
|
546
546
|
"metadata": {},
|
|
547
547
|
"source": [
|
|
548
548
|
"## ⏭️ Next Steps\n",
|