dvt-core 1.11.0b4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of dvt-core might be problematic. Click here for more details.

Files changed (261) hide show
  1. dvt/__init__.py +7 -0
  2. dvt/_pydantic_shim.py +26 -0
  3. dvt/adapters/__init__.py +16 -0
  4. dvt/adapters/multi_adapter_manager.py +268 -0
  5. dvt/artifacts/__init__.py +0 -0
  6. dvt/artifacts/exceptions/__init__.py +1 -0
  7. dvt/artifacts/exceptions/schemas.py +31 -0
  8. dvt/artifacts/resources/__init__.py +116 -0
  9. dvt/artifacts/resources/base.py +68 -0
  10. dvt/artifacts/resources/types.py +93 -0
  11. dvt/artifacts/resources/v1/analysis.py +10 -0
  12. dvt/artifacts/resources/v1/catalog.py +23 -0
  13. dvt/artifacts/resources/v1/components.py +275 -0
  14. dvt/artifacts/resources/v1/config.py +282 -0
  15. dvt/artifacts/resources/v1/documentation.py +11 -0
  16. dvt/artifacts/resources/v1/exposure.py +52 -0
  17. dvt/artifacts/resources/v1/function.py +53 -0
  18. dvt/artifacts/resources/v1/generic_test.py +32 -0
  19. dvt/artifacts/resources/v1/group.py +22 -0
  20. dvt/artifacts/resources/v1/hook.py +11 -0
  21. dvt/artifacts/resources/v1/macro.py +30 -0
  22. dvt/artifacts/resources/v1/metric.py +173 -0
  23. dvt/artifacts/resources/v1/model.py +146 -0
  24. dvt/artifacts/resources/v1/owner.py +10 -0
  25. dvt/artifacts/resources/v1/saved_query.py +112 -0
  26. dvt/artifacts/resources/v1/seed.py +42 -0
  27. dvt/artifacts/resources/v1/semantic_layer_components.py +72 -0
  28. dvt/artifacts/resources/v1/semantic_model.py +315 -0
  29. dvt/artifacts/resources/v1/singular_test.py +14 -0
  30. dvt/artifacts/resources/v1/snapshot.py +92 -0
  31. dvt/artifacts/resources/v1/source_definition.py +85 -0
  32. dvt/artifacts/resources/v1/sql_operation.py +10 -0
  33. dvt/artifacts/resources/v1/unit_test_definition.py +78 -0
  34. dvt/artifacts/schemas/__init__.py +0 -0
  35. dvt/artifacts/schemas/base.py +191 -0
  36. dvt/artifacts/schemas/batch_results.py +24 -0
  37. dvt/artifacts/schemas/catalog/__init__.py +12 -0
  38. dvt/artifacts/schemas/catalog/v1/__init__.py +0 -0
  39. dvt/artifacts/schemas/catalog/v1/catalog.py +60 -0
  40. dvt/artifacts/schemas/freshness/__init__.py +1 -0
  41. dvt/artifacts/schemas/freshness/v3/__init__.py +0 -0
  42. dvt/artifacts/schemas/freshness/v3/freshness.py +159 -0
  43. dvt/artifacts/schemas/manifest/__init__.py +2 -0
  44. dvt/artifacts/schemas/manifest/v12/__init__.py +0 -0
  45. dvt/artifacts/schemas/manifest/v12/manifest.py +212 -0
  46. dvt/artifacts/schemas/results.py +148 -0
  47. dvt/artifacts/schemas/run/__init__.py +2 -0
  48. dvt/artifacts/schemas/run/v5/__init__.py +0 -0
  49. dvt/artifacts/schemas/run/v5/run.py +184 -0
  50. dvt/artifacts/schemas/upgrades/__init__.py +4 -0
  51. dvt/artifacts/schemas/upgrades/upgrade_manifest.py +174 -0
  52. dvt/artifacts/schemas/upgrades/upgrade_manifest_dbt_version.py +2 -0
  53. dvt/artifacts/utils/validation.py +153 -0
  54. dvt/cli/__init__.py +1 -0
  55. dvt/cli/context.py +16 -0
  56. dvt/cli/exceptions.py +56 -0
  57. dvt/cli/flags.py +558 -0
  58. dvt/cli/main.py +971 -0
  59. dvt/cli/option_types.py +121 -0
  60. dvt/cli/options.py +79 -0
  61. dvt/cli/params.py +803 -0
  62. dvt/cli/requires.py +478 -0
  63. dvt/cli/resolvers.py +32 -0
  64. dvt/cli/types.py +40 -0
  65. dvt/clients/__init__.py +0 -0
  66. dvt/clients/checked_load.py +82 -0
  67. dvt/clients/git.py +164 -0
  68. dvt/clients/jinja.py +206 -0
  69. dvt/clients/jinja_static.py +245 -0
  70. dvt/clients/registry.py +192 -0
  71. dvt/clients/yaml_helper.py +68 -0
  72. dvt/compilation.py +833 -0
  73. dvt/compute/__init__.py +26 -0
  74. dvt/compute/base.py +288 -0
  75. dvt/compute/engines/__init__.py +13 -0
  76. dvt/compute/engines/duckdb_engine.py +368 -0
  77. dvt/compute/engines/spark_engine.py +273 -0
  78. dvt/compute/query_analyzer.py +212 -0
  79. dvt/compute/router.py +483 -0
  80. dvt/config/__init__.py +4 -0
  81. dvt/config/catalogs.py +95 -0
  82. dvt/config/compute_config.py +406 -0
  83. dvt/config/profile.py +411 -0
  84. dvt/config/profiles_v2.py +464 -0
  85. dvt/config/project.py +893 -0
  86. dvt/config/renderer.py +232 -0
  87. dvt/config/runtime.py +491 -0
  88. dvt/config/selectors.py +209 -0
  89. dvt/config/utils.py +78 -0
  90. dvt/connectors/.gitignore +6 -0
  91. dvt/connectors/README.md +306 -0
  92. dvt/connectors/catalog.yml +217 -0
  93. dvt/connectors/download_connectors.py +300 -0
  94. dvt/constants.py +29 -0
  95. dvt/context/__init__.py +0 -0
  96. dvt/context/base.py +746 -0
  97. dvt/context/configured.py +136 -0
  98. dvt/context/context_config.py +350 -0
  99. dvt/context/docs.py +82 -0
  100. dvt/context/exceptions_jinja.py +179 -0
  101. dvt/context/macro_resolver.py +195 -0
  102. dvt/context/macros.py +171 -0
  103. dvt/context/manifest.py +73 -0
  104. dvt/context/providers.py +2198 -0
  105. dvt/context/query_header.py +14 -0
  106. dvt/context/secret.py +59 -0
  107. dvt/context/target.py +74 -0
  108. dvt/contracts/__init__.py +0 -0
  109. dvt/contracts/files.py +413 -0
  110. dvt/contracts/graph/__init__.py +0 -0
  111. dvt/contracts/graph/manifest.py +1904 -0
  112. dvt/contracts/graph/metrics.py +98 -0
  113. dvt/contracts/graph/model_config.py +71 -0
  114. dvt/contracts/graph/node_args.py +42 -0
  115. dvt/contracts/graph/nodes.py +1806 -0
  116. dvt/contracts/graph/semantic_manifest.py +233 -0
  117. dvt/contracts/graph/unparsed.py +812 -0
  118. dvt/contracts/project.py +417 -0
  119. dvt/contracts/results.py +53 -0
  120. dvt/contracts/selection.py +23 -0
  121. dvt/contracts/sql.py +86 -0
  122. dvt/contracts/state.py +69 -0
  123. dvt/contracts/util.py +46 -0
  124. dvt/deprecations.py +347 -0
  125. dvt/deps/__init__.py +0 -0
  126. dvt/deps/base.py +153 -0
  127. dvt/deps/git.py +196 -0
  128. dvt/deps/local.py +80 -0
  129. dvt/deps/registry.py +131 -0
  130. dvt/deps/resolver.py +149 -0
  131. dvt/deps/tarball.py +121 -0
  132. dvt/docs/source/_ext/dbt_click.py +118 -0
  133. dvt/docs/source/conf.py +32 -0
  134. dvt/env_vars.py +64 -0
  135. dvt/event_time/event_time.py +40 -0
  136. dvt/event_time/sample_window.py +60 -0
  137. dvt/events/__init__.py +16 -0
  138. dvt/events/base_types.py +37 -0
  139. dvt/events/core_types_pb2.py +2 -0
  140. dvt/events/logging.py +109 -0
  141. dvt/events/types.py +2534 -0
  142. dvt/exceptions.py +1487 -0
  143. dvt/flags.py +89 -0
  144. dvt/graph/__init__.py +11 -0
  145. dvt/graph/cli.py +248 -0
  146. dvt/graph/graph.py +172 -0
  147. dvt/graph/queue.py +213 -0
  148. dvt/graph/selector.py +375 -0
  149. dvt/graph/selector_methods.py +976 -0
  150. dvt/graph/selector_spec.py +223 -0
  151. dvt/graph/thread_pool.py +18 -0
  152. dvt/hooks.py +21 -0
  153. dvt/include/README.md +49 -0
  154. dvt/include/__init__.py +3 -0
  155. dvt/include/global_project.py +4 -0
  156. dvt/include/starter_project/.gitignore +4 -0
  157. dvt/include/starter_project/README.md +15 -0
  158. dvt/include/starter_project/__init__.py +3 -0
  159. dvt/include/starter_project/analyses/.gitkeep +0 -0
  160. dvt/include/starter_project/dvt_project.yml +36 -0
  161. dvt/include/starter_project/macros/.gitkeep +0 -0
  162. dvt/include/starter_project/models/example/my_first_dbt_model.sql +27 -0
  163. dvt/include/starter_project/models/example/my_second_dbt_model.sql +6 -0
  164. dvt/include/starter_project/models/example/schema.yml +21 -0
  165. dvt/include/starter_project/seeds/.gitkeep +0 -0
  166. dvt/include/starter_project/snapshots/.gitkeep +0 -0
  167. dvt/include/starter_project/tests/.gitkeep +0 -0
  168. dvt/internal_deprecations.py +27 -0
  169. dvt/jsonschemas/__init__.py +3 -0
  170. dvt/jsonschemas/jsonschemas.py +309 -0
  171. dvt/jsonschemas/project/0.0.110.json +4717 -0
  172. dvt/jsonschemas/project/0.0.85.json +2015 -0
  173. dvt/jsonschemas/resources/0.0.110.json +2636 -0
  174. dvt/jsonschemas/resources/0.0.85.json +2536 -0
  175. dvt/jsonschemas/resources/latest.json +6773 -0
  176. dvt/links.py +4 -0
  177. dvt/materializations/__init__.py +0 -0
  178. dvt/materializations/incremental/__init__.py +0 -0
  179. dvt/materializations/incremental/microbatch.py +235 -0
  180. dvt/mp_context.py +8 -0
  181. dvt/node_types.py +37 -0
  182. dvt/parser/__init__.py +23 -0
  183. dvt/parser/analysis.py +21 -0
  184. dvt/parser/base.py +549 -0
  185. dvt/parser/common.py +267 -0
  186. dvt/parser/docs.py +52 -0
  187. dvt/parser/fixtures.py +51 -0
  188. dvt/parser/functions.py +30 -0
  189. dvt/parser/generic_test.py +100 -0
  190. dvt/parser/generic_test_builders.py +334 -0
  191. dvt/parser/hooks.py +119 -0
  192. dvt/parser/macros.py +137 -0
  193. dvt/parser/manifest.py +2204 -0
  194. dvt/parser/models.py +574 -0
  195. dvt/parser/partial.py +1179 -0
  196. dvt/parser/read_files.py +445 -0
  197. dvt/parser/schema_generic_tests.py +423 -0
  198. dvt/parser/schema_renderer.py +111 -0
  199. dvt/parser/schema_yaml_readers.py +936 -0
  200. dvt/parser/schemas.py +1467 -0
  201. dvt/parser/search.py +149 -0
  202. dvt/parser/seeds.py +28 -0
  203. dvt/parser/singular_test.py +20 -0
  204. dvt/parser/snapshots.py +44 -0
  205. dvt/parser/sources.py +557 -0
  206. dvt/parser/sql.py +63 -0
  207. dvt/parser/unit_tests.py +622 -0
  208. dvt/plugins/__init__.py +20 -0
  209. dvt/plugins/contracts.py +10 -0
  210. dvt/plugins/exceptions.py +2 -0
  211. dvt/plugins/manager.py +164 -0
  212. dvt/plugins/manifest.py +21 -0
  213. dvt/profiler.py +20 -0
  214. dvt/py.typed +1 -0
  215. dvt/runners/__init__.py +2 -0
  216. dvt/runners/exposure_runner.py +7 -0
  217. dvt/runners/no_op_runner.py +46 -0
  218. dvt/runners/saved_query_runner.py +7 -0
  219. dvt/selected_resources.py +8 -0
  220. dvt/task/__init__.py +0 -0
  221. dvt/task/base.py +504 -0
  222. dvt/task/build.py +197 -0
  223. dvt/task/clean.py +57 -0
  224. dvt/task/clone.py +162 -0
  225. dvt/task/compile.py +151 -0
  226. dvt/task/compute.py +366 -0
  227. dvt/task/debug.py +650 -0
  228. dvt/task/deps.py +280 -0
  229. dvt/task/docs/__init__.py +3 -0
  230. dvt/task/docs/generate.py +408 -0
  231. dvt/task/docs/index.html +250 -0
  232. dvt/task/docs/serve.py +28 -0
  233. dvt/task/freshness.py +323 -0
  234. dvt/task/function.py +122 -0
  235. dvt/task/group_lookup.py +46 -0
  236. dvt/task/init.py +374 -0
  237. dvt/task/list.py +237 -0
  238. dvt/task/printer.py +176 -0
  239. dvt/task/profiles.py +256 -0
  240. dvt/task/retry.py +175 -0
  241. dvt/task/run.py +1146 -0
  242. dvt/task/run_operation.py +142 -0
  243. dvt/task/runnable.py +802 -0
  244. dvt/task/seed.py +104 -0
  245. dvt/task/show.py +150 -0
  246. dvt/task/snapshot.py +57 -0
  247. dvt/task/sql.py +111 -0
  248. dvt/task/test.py +464 -0
  249. dvt/tests/fixtures/__init__.py +1 -0
  250. dvt/tests/fixtures/project.py +620 -0
  251. dvt/tests/util.py +651 -0
  252. dvt/tracking.py +529 -0
  253. dvt/utils/__init__.py +3 -0
  254. dvt/utils/artifact_upload.py +151 -0
  255. dvt/utils/utils.py +408 -0
  256. dvt/version.py +249 -0
  257. dvt_core-1.11.0b4.dist-info/METADATA +252 -0
  258. dvt_core-1.11.0b4.dist-info/RECORD +261 -0
  259. dvt_core-1.11.0b4.dist-info/WHEEL +5 -0
  260. dvt_core-1.11.0b4.dist-info/entry_points.txt +2 -0
  261. dvt_core-1.11.0b4.dist-info/top_level.txt +1 -0
@@ -0,0 +1,622 @@
1
+ import csv
2
+ import os
3
+ from copy import deepcopy
4
+ from csv import DictReader
5
+ from io import StringIO
6
+ from pathlib import Path
7
+ from typing import Any, Dict, List, Optional, Set
8
+
9
+ from dvt import utils
10
+ from dvt.artifacts.resources import ModelConfig, UnitTestConfig, UnitTestFormat
11
+ from dvt.config import RuntimeConfig
12
+ from dvt.context.context_config import ContextConfig
13
+ from dvt.context.providers import generate_parse_exposure, get_rendered
14
+ from dvt.contracts.files import FileHash, SchemaSourceFile
15
+ from dvt.contracts.graph.manifest import Manifest
16
+ from dvt.contracts.graph.model_config import UnitTestNodeConfig
17
+ from dvt.contracts.graph.nodes import (
18
+ DependsOn,
19
+ ModelNode,
20
+ UnitTestDefinition,
21
+ UnitTestNode,
22
+ UnitTestSourceDefinition,
23
+ )
24
+ from dvt.contracts.graph.unparsed import UnparsedUnitTest
25
+ from dvt.exceptions import InvalidUnitTestGivenInput, ParsingError
26
+ from dvt.graph import UniqueId
27
+ from dvt.node_types import NodeType
28
+ from dvt.parser.schemas import (
29
+ JSONValidationError,
30
+ ParseResult,
31
+ SchemaParser,
32
+ ValidationError,
33
+ YamlBlock,
34
+ YamlParseDictError,
35
+ YamlReader,
36
+ )
37
+ from dvt.utils import get_pseudo_test_path
38
+
39
+ from dbt_common.events.functions import fire_event
40
+ from dbt_common.events.types import SystemStdErr
41
+ from dbt_extractor import ExtractionError, py_extract_from_source # type: ignore
42
+
43
+
44
class UnitTestManifestLoader:
    """Build a separate, unit-test-only Manifest from the selected unit tests.

    For each selected ``UnitTestDefinition`` this creates a ``UnitTestNode``
    wrapping the tested model's SQL, plus one ephemeral "input" model per
    ``given`` fixture, and wires them together through ``depends_on``.
    """

    def __init__(self, manifest, root_project, selected) -> None:
        # The fully parsed "regular" manifest; unit test definitions and the
        # nodes they reference are looked up here.
        self.manifest: Manifest = manifest
        self.root_project: RuntimeConfig = root_project
        # selected comes from the initial selection against a "regular" manifest
        self.selected: Set[UniqueId] = selected
        # The manifest being built. It shares macros with the regular manifest
        # so that rendering can resolve macro calls.
        self.unit_test_manifest = Manifest(macros=manifest.macros)

    def load(self) -> Manifest:
        """Parse every selected, enabled unit test into the unit test manifest."""
        for unique_id in self.selected:
            if unique_id in self.manifest.unit_tests:
                unit_test_case: UnitTestDefinition = self.manifest.unit_tests[unique_id]
                # Disabled tests are skipped here even if they were selected.
                if not unit_test_case.config.enabled:
                    continue
                self.parse_unit_test_case(unit_test_case)
        return self.unit_test_manifest

    def parse_unit_test_case(self, test_case: UnitTestDefinition):
        """Create the UnitTestNode and its fixture input nodes for one test case.

        Side effects: populates ``self.unit_test_manifest.nodes`` (and
        ``.sources`` / ``.functions`` where applicable) and appends input node
        ids to the new node's ``depends_on``.
        """
        # Create unit test node based on the node being tested
        # The tested_node has already been resolved and is in depends_on.nodes
        tested_node_unique_id = test_case.depends_on.nodes[0]
        tested_node = self.manifest.nodes[tested_node_unique_id]
        assert isinstance(tested_node, ModelNode)

        # Create UnitTestNode based on model being tested. Since selection has
        # already been done, we don't have to care about fields that are necessary
        # for selection.
        # Note: no depends_on, that's added later using input nodes
        name = test_case.name
        if tested_node.is_versioned:
            # Versioned models get a suffix so each version's test node is unique.
            name = name + f"_v{tested_node.version}"
        expected_sql: Optional[str] = None
        if test_case.expect.format == UnitTestFormat.SQL:
            # For SQL-format expectations, "rows" actually holds a SQL string.
            expected_rows: List[Dict[str, Any]] = []
            expected_sql = test_case.expect.rows  # type: ignore
        else:
            assert isinstance(test_case.expect.rows, List)
            # Deep copy so later normalization cannot mutate the definition.
            expected_rows = deepcopy(test_case.expect.rows)

        assert isinstance(expected_rows, List)
        unit_test_node = UnitTestNode(
            name=name,
            resource_type=NodeType.Unit,
            package_name=test_case.package_name,
            path=get_pseudo_test_path(name, test_case.original_file_path),
            original_file_path=test_case.original_file_path,
            unique_id=test_case.unique_id,
            config=UnitTestNodeConfig(
                materialized="unit", expected_rows=expected_rows, expected_sql=expected_sql
            ),
            raw_code=tested_node.raw_code,
            database=tested_node.database,
            schema=tested_node.schema,
            alias=name,
            fqn=test_case.unique_id.split("."),
            checksum=FileHash.empty(),
            tested_node_unique_id=tested_node.unique_id,
            overrides=test_case.overrides,
        )

        # Render the tested model's SQL in a parse context so that refs/sources
        # (and macros, via capture_macros) are recorded on unit_test_node.
        ctx = generate_parse_exposure(
            unit_test_node,  # type: ignore
            self.root_project,
            self.manifest,
            test_case.package_name,
        )
        get_rendered(unit_test_node.raw_code, ctx, unit_test_node, capture_macros=True)
        # unit_test_node now has a populated refs/sources

        self.unit_test_manifest.nodes[unit_test_node.unique_id] = unit_test_node
        # Now create input_nodes for the test inputs
        """
        given:
          - input: ref('my_model_a')
            rows: []
          - input: ref('my_model_b')
            rows:
              - {id: 1, b: 2}
              - {id: 2, b: 2}
        """
        # Add the model "input" nodes, consisting of all referenced models in the unit test.
        # This creates an ephemeral model for every input in every test, so there may be multiple
        # input models substituting for the same input ref'd model. Note that since these are
        # always "ephemeral" they just wrap the tested_node SQL in additional CTEs. No actual table
        # or view is created.
        for given in test_case.given:
            # extract the original_input_node from the ref in the "input" key of the given list
            original_input_node = self._get_original_input_node(
                given.input, tested_node, test_case.name
            )
            input_name = original_input_node.name
            common_fields = {
                "resource_type": NodeType.Model,
                # root directory for input and output fixtures
                "original_file_path": unit_test_node.original_file_path,
                "config": ModelConfig(materialized="ephemeral"),
                "database": original_input_node.database,
                "alias": original_input_node.identifier,
                "schema": original_input_node.schema,
                "fqn": original_input_node.fqn,
                "checksum": FileHash.empty(),
                # Fixture rows become a get_fixture_sql macro call (or raw SQL).
                "raw_code": self._build_fixture_raw_code(given.rows, None, given.format),
                "package_name": original_input_node.package_name,
                "unique_id": f"model.{original_input_node.package_name}.{input_name}",
                "name": input_name,
                "path": f"{input_name}.sql",
            }
            resource_type = original_input_node.resource_type

            if resource_type in (
                NodeType.Model,
                NodeType.Seed,
                NodeType.Snapshot,
            ):

                input_node = ModelNode(
                    **common_fields,
                    defer_relation=original_input_node.defer_relation,
                )
                if resource_type == NodeType.Model:
                    # Carry version info so versioned-model lookups still work.
                    if original_input_node.version:
                        input_node.version = original_input_node.version
                    if original_input_node.latest_version:
                        input_node.latest_version = original_input_node.latest_version

            elif resource_type == NodeType.Source:
                # We are reusing the database/schema/identifier from the original source,
                # but that shouldn't matter since this acts as an ephemeral model which just
                # wraps a CTE around the unit test node.
                input_node = UnitTestSourceDefinition(
                    **common_fields,
                    source_name=original_input_node.source_name,  # needed for source lookup
                )
                # Sources need to go in the sources dictionary in order to create the right lookup
                self.unit_test_manifest.sources[input_node.unique_id] = input_node  # type: ignore

            # Both ModelNode and UnitTestSourceDefinition need to go in nodes dictionary
            self.unit_test_manifest.nodes[input_node.unique_id] = input_node

            # Populate this_input_node_unique_id if input fixture represents node being tested
            if original_input_node == tested_node:
                unit_test_node.this_input_node_unique_id = input_node.unique_id

            # Add unique ids of input_nodes to depends_on
            unit_test_node.depends_on.nodes.append(input_node.unique_id)

        # Add functions to the manifest and depends_on
        for unique_id in tested_node.depends_on.nodes:
            if unique_id in self.manifest.functions:
                unit_test_node.depends_on.nodes.append(unique_id)
                self.unit_test_manifest.functions[unique_id] = self.manifest.functions[unique_id]

    def _build_fixture_raw_code(self, rows, column_name_to_data_types, fixture_format) -> str:
        """Return the raw_code for a fixture input node.

        SQL-format fixtures are used verbatim; otherwise the rows are embedded
        in a ``get_fixture_sql`` macro call rendered later at compile time.
        """
        # We're not currently using column_name_to_data_types, but leaving here for
        # possible future use.
        if fixture_format == UnitTestFormat.SQL:
            return rows
        else:
            # The quadruple braces render to literal "{{ ... }}" for Jinja.
            return ("{{{{ get_fixture_sql({rows}, {column_name_to_data_types}) }}}}").format(
                rows=rows, column_name_to_data_types=column_name_to_data_types
            )

    def _get_original_input_node(self, input: str, tested_node: ModelNode, test_case_name: str):
        """
        Returns the original input node as defined in the project given an input reference
        and the node being tested.

        input: str representing how input node is referenced in tested model sql
          * examples:
            - "ref('my_model_a')"
            - "source('my_source_schema', 'my_source_name')"
            - "this"
        tested_node: ModelNode of representing node being tested

        Raises InvalidUnitTestGivenInput if the input string cannot be
        statically parsed as a ref/source, and ParsingError if the referenced
        node is not found in the manifest.
        """
        if input.strip() == "this":
            original_input_node = tested_node
        else:
            try:
                # Wrap the input in Jinja delimiters so the static extractor
                # can pull out the ref()/source() call.
                statically_parsed = py_extract_from_source(f"{{{{ {input} }}}}")
            except ExtractionError:
                raise InvalidUnitTestGivenInput(input=input)

            if statically_parsed["refs"]:
                ref = list(statically_parsed["refs"])[0]
                name = ref.get("name")
                package = ref.get("package")
                version = ref.get("version")
                # TODO: disabled lookup, versioned lookup, public models
                original_input_node = self.manifest.ref_lookup.find(
                    name, package, version, self.manifest
                )
            elif statically_parsed["sources"]:
                source = list(statically_parsed["sources"])[0]
                input_source_name, input_name = source
                original_input_node = self.manifest.source_lookup.find(
                    f"{input_source_name}.{input_name}",
                    None,
                    self.manifest,
                )
            else:
                raise InvalidUnitTestGivenInput(input=input)

        if not original_input_node:
            msg = f"Unit test '{test_case_name}' had an input ({input}) which was not found in the manifest."
            raise ParsingError(msg)

        return original_input_node
251
+
252
+
253
class UnitTestParser(YamlReader):
    """Parses the ``unit_tests:`` key of a schema YAML file into
    ``UnitTestDefinition`` objects and registers them on the manifest."""

    def __init__(self, schema_parser: SchemaParser, yaml: YamlBlock) -> None:
        super().__init__(schema_parser, yaml, "unit_tests")
        self.schema_parser = schema_parser
        self.yaml = yaml

    def parse(self) -> ParseResult:
        """Parse every unit test dict under the ``unit_tests`` key.

        Builds the definition, resolves the tested model when possible,
        normalizes fixture rows, and adds the result to the manifest
        (or to the disabled set when config.enabled is false).
        """
        for data in self.get_key_dicts():
            unit_test: UnparsedUnitTest = self._get_unit_test(data)
            # May be None at this point if model versions aren't processed yet;
            # process_models_for_unit_test resolves those later.
            tested_model_node = find_tested_model_node(
                self.manifest, self.project.project_name, unit_test.model
            )
            unit_test_case_unique_id = (
                f"{NodeType.Unit}.{self.project.project_name}.{unit_test.model}.{unit_test.name}"
            )
            unit_test_fqn = self._build_fqn(
                self.project.project_name,
                self.yaml.path.original_file_path,
                unit_test.model,
                unit_test.name,
            )
            unit_test_config = self._build_unit_test_config(unit_test_fqn, unit_test.config)

            unit_test_definition = UnitTestDefinition(
                name=unit_test.name,
                model=unit_test.model,
                resource_type=NodeType.Unit,
                package_name=self.project.project_name,
                path=self.yaml.path.relative_path,
                original_file_path=self.yaml.path.original_file_path,
                unique_id=unit_test_case_unique_id,
                given=unit_test.given,
                expect=unit_test.expect,
                description=unit_test.description,
                overrides=unit_test.overrides,
                depends_on=DependsOn(),
                fqn=unit_test_fqn,
                config=unit_test_config,
                versions=unit_test.versions,
            )

            if tested_model_node:
                unit_test_definition.depends_on.nodes.append(tested_model_node.unique_id)
                unit_test_definition.schema = tested_model_node.schema

            # Check that format and type of rows matches for each given input,
            # convert rows to a list of dictionaries, and add the unique_id of
            # the unit_test_definition to the fixture source_file for partial parsing.
            self._validate_and_normalize_given(unit_test_definition)
            self._validate_and_normalize_expect(unit_test_definition)

            # for calculating state:modified
            unit_test_definition.build_unit_test_checksum()
            assert isinstance(self.yaml.file, SchemaSourceFile)
            if unit_test_config.enabled:
                self.manifest.add_unit_test(self.yaml.file, unit_test_definition)
            else:
                self.manifest.add_disabled(self.yaml.file, unit_test_definition)

        return ParseResult()

    def _get_unit_test(self, data: Dict[str, Any]) -> UnparsedUnitTest:
        """Validate a raw YAML dict and convert it to an UnparsedUnitTest.

        Raises YamlParseDictError (wrapping the validation failure) on bad input.
        """
        try:
            UnparsedUnitTest.validate(data)
            return UnparsedUnitTest.from_dict(data)
        except (ValidationError, JSONValidationError) as exc:
            raise YamlParseDictError(self.yaml.path, self.key, data, exc)

    def _build_unit_test_config(
        self, unit_test_fqn: List[str], config_dict: Dict[str, Any]
    ) -> UnitTestConfig:
        """Merge project-level config with the test's own config dict,
        render it, and return the resulting UnitTestConfig."""
        config = ContextConfig(
            self.schema_parser.root_project,
            unit_test_fqn,
            NodeType.Unit,
            self.schema_parser.project.project_name,
        )
        unit_test_config_dict = config.build_config_dict(patch_config_dict=config_dict)
        unit_test_config_dict = self.render_entry(unit_test_config_dict)

        return UnitTestConfig.from_dict(unit_test_config_dict)

    def _build_fqn(self, package_name, original_file_path, model_name, test_name):
        """Build the fully-qualified name: package + subdirectories + model + test."""
        # This code comes from "get_fqn" and "get_fqn_prefix" in the base parser.
        # We need to get the directories underneath the model-path.
        path = Path(original_file_path)
        # Strip the first path component (the model-path root itself).
        relative_path = str(path.relative_to(*path.parts[:1]))
        no_ext = os.path.splitext(relative_path)[0]
        fqn = [package_name]
        # Directories only; the file name itself is dropped ([:-1]).
        fqn.extend(utils.split_path(no_ext)[:-1])
        fqn.append(model_name)
        fqn.append(test_name)
        return fqn

    def _get_fixture(self, fixture_name: str, project_name: str):
        """Look up a fixture file object by name; raise ParsingError if missing."""
        fixture_unique_id = f"{NodeType.Fixture}.{project_name}.{fixture_name}"
        if fixture_unique_id in self.manifest.fixtures:
            fixture = self.manifest.fixtures[fixture_unique_id]
            return fixture
        else:
            raise ParsingError(
                f"File not found for fixture '{fixture_name}' in unit tests in {self.yaml.path.original_file_path}"
            )

    def _validate_and_normalize_given(self, unit_test_definition):
        """Normalize every 'given' input fixture in place."""
        for ut_input in unit_test_definition.given:
            self._validate_and_normalize_rows(ut_input, unit_test_definition, "input")

    def _validate_and_normalize_expect(self, unit_test_definition):
        """Normalize the 'expect' fixture in place."""
        self._validate_and_normalize_rows(
            unit_test_definition.expect, unit_test_definition, "expected"
        )

    def _validate_and_normalize_rows(self, ut_fixture, unit_test_definition, fixture_type) -> None:
        """Validate fixture rows against their declared format and normalize
        them to a list of dicts (Dict/CSV) or a SQL string (SQL).

        Mutates ``ut_fixture.rows`` in place; ``fixture_type`` ("input" or
        "expected") is only used for error messages.
        """
        if ut_fixture.format == UnitTestFormat.Dict:
            if ut_fixture.rows is None and ut_fixture.fixture is None:  # This is a seed
                ut_fixture.rows = self._load_rows_from_seed(ut_fixture.input)
            if not isinstance(ut_fixture.rows, list):
                raise ParsingError(
                    f"Unit test {unit_test_definition.name} has {fixture_type} rows "
                    f"which do not match format {ut_fixture.format}"
                )
        elif ut_fixture.format == UnitTestFormat.CSV:
            if not (isinstance(ut_fixture.rows, str) or isinstance(ut_fixture.fixture, str)):
                raise ParsingError(
                    f"Unit test {unit_test_definition.name} has {fixture_type} rows or fixtures "
                    f"which do not match format {ut_fixture.format}. Expected string."
                )

            if ut_fixture.fixture:
                # CSV fixture file (already parsed into rows at load time).
                csv_rows = self.get_fixture_file_rows(
                    ut_fixture.fixture, self.project.project_name, unit_test_definition.unique_id
                )
            else:
                # Inline CSV string.
                csv_rows = self._convert_csv_to_list_of_dicts(ut_fixture.rows)

            # Empty values (e.g. ,,) in a csv fixture should default to null, not ""
            ut_fixture.rows = [
                {k: (None if v == "" else v) for k, v in row.items()} for row in csv_rows
            ]

        elif ut_fixture.format == UnitTestFormat.SQL:
            if not (isinstance(ut_fixture.rows, str) or isinstance(ut_fixture.fixture, str)):
                raise ParsingError(
                    f"Unit test {unit_test_definition.name} has {fixture_type} rows or fixtures "
                    f"which do not match format {ut_fixture.format}. Expected string."
                )

            if ut_fixture.fixture:
                ut_fixture.rows = self.get_fixture_file_rows(
                    ut_fixture.fixture, self.project.project_name, unit_test_definition.unique_id
                )

        # sanitize order of input
        if ut_fixture.rows and (
            ut_fixture.format == UnitTestFormat.Dict or ut_fixture.format == UnitTestFormat.CSV
        ):
            self._promote_first_non_none_row(ut_fixture)

    def _promote_first_non_none_row(self, ut_fixture):
        """
        Promote the first row with no None values to the top of the ut_fixture.rows list.

        This function modifies the ut_fixture object in place.

        Needed for databases like Redshift which uses the first value in a column to determine
        the column type. If the first value is None, the type is assumed to be VARCHAR(1).
        This leads to obscure type mismatch errors centered on a unit test fixture's `expect`.
        See https://github.com/dbt-labs/dbt-redshift/issues/821 for more info.
        """
        non_none_row_index = None

        # Iterate through each row and its index
        for index, row in enumerate(ut_fixture.rows):
            # Check if all values in the row are not None
            if all(value is not None for value in row.values()):
                non_none_row_index = index
                break

        if non_none_row_index is None:
            # No fully-populated row exists; warn rather than fail.
            fire_event(
                SystemStdErr(
                    bmsg="Unit Test fixtures benefit from having at least one row free of Null values to ensure consistent column types. Failure to meet this recommendation can result in type mismatch errors between unit test source models and `expected` fixtures."
                )
            )
        else:
            # Swap the fully-populated row into position 0.
            ut_fixture.rows[0], ut_fixture.rows[non_none_row_index] = (
                ut_fixture.rows[non_none_row_index],
                ut_fixture.rows[0],
            )

    def get_fixture_file_rows(self, fixture_name, project_name, utdef_unique_id):
        """Return the parsed rows of a fixture file, recording the unit test's
        unique_id on the fixture's source file for partial parsing."""
        # find fixture file object and store unit_test_definition unique_id
        fixture = self._get_fixture(fixture_name, project_name)
        fixture_source_file = self.manifest.files[fixture.file_id]
        fixture_source_file.unit_tests.append(utdef_unique_id)
        return fixture.rows

    def _convert_csv_to_list_of_dicts(self, csv_string: str) -> List[Dict[str, Any]]:
        """Parse an inline CSV string into a list of row dicts (header row as keys)."""
        dummy_file = StringIO(csv_string)
        reader = csv.DictReader(dummy_file)
        rows = []
        for row in reader:
            rows.append(row)
        return rows

    def _load_rows_from_seed(self, ref_str: str) -> List[Dict[str, Any]]:
        """Read rows from seed file on disk if not specified in YAML config. If seed file doesn't exist, return empty list."""
        ref = py_extract_from_source("{{ " + ref_str + " }}")["refs"][0]

        rows: List[Dict[str, Any]] = []

        seed_name = ref["name"]
        # Default to the current project when the ref has no package.
        package_name = ref.get("package", self.project.project_name)

        seed_node = self.manifest.ref_lookup.find(seed_name, package_name, None, self.manifest)

        if not seed_node or seed_node.resource_type != NodeType.Seed:
            # Seed not found in custom package specified
            if package_name != self.project.project_name:
                raise ParsingError(
                    f"Unable to find seed '{package_name}.{seed_name}' for unit tests in '{package_name}' package"
                )
            else:
                raise ParsingError(
                    f"Unable to find seed '{package_name}.{seed_name}' for unit tests in directories: {self.project.seed_paths}"
                )

        seed_path = Path(self.project.project_root) / seed_node.original_file_path
        with open(seed_path, "r") as f:
            for row in DictReader(f):
                rows.append(row)

        return rows
487
+
488
+
489
def find_tested_model_node(
    manifest: Manifest, current_project: str, unit_test_model: str
) -> Optional[ModelNode]:
    """Resolve the model node targeted by a unit test's ``model`` field.

    The field is either ``"model_name"`` or ``"model_name v<version>"`` —
    a second whitespace-separated token is treated as the version.
    Returns None when the lookup finds nothing.
    """
    parts = unit_test_model.split()
    version = parts[1] if len(parts) == 2 else None
    return manifest.ref_lookup.find(parts[0], current_project, version, manifest)
498
+
499
+
500
# This is called by the ManifestLoader after other processing has been done,
# so that model versions are available.
def process_models_for_unit_test(
    manifest: Manifest, current_project: str, unit_test_def: UnitTestDefinition, models_to_versions
):
    """Link a UnitTestDefinition to the model node it tests and, for versioned
    models, replace it with one copy per selected model version.

    Raises ParsingError when the tested model (or a requested version of it)
    cannot be resolved, or when incremental-model requirements are not met.
    Mutates ``manifest.unit_tests`` and the owning schema file in place.
    """
    # If the unit tests doesn't have a depends_on.nodes[0] then we weren't able to resolve
    # the model, either because versions hadn't been processed yet, or it's not a valid model name
    if not unit_test_def.depends_on.nodes:
        tested_node = find_tested_model_node(manifest, current_project, unit_test_def.model)
        if not tested_node:
            raise ParsingError(
                f"Unable to find model '{current_project}.{unit_test_def.model}' for "
                f"unit test '{unit_test_def.name}' in {unit_test_def.original_file_path}"
            )
        unit_test_def.depends_on.nodes.append(tested_node.unique_id)
        # The unit test runs in the tested model's schema.
        unit_test_def.schema = tested_node.schema

    # The UnitTestDefinition should only have one "depends_on" at this point,
    # the one that's found by the "model" field.
    target_model_id = unit_test_def.depends_on.nodes[0]
    if target_model_id not in manifest.nodes:
        if target_model_id in manifest.disabled:
            # The model is disabled, so we don't need to do anything (#10540)
            return
        else:
            # If we've reached here and the model is not disabled, throw an error
            raise ParsingError(
                f"Unit test '{unit_test_def.name}' references a model that does not exist: {target_model_id}"
            )

    target_model = manifest.nodes[target_model_id]
    assert isinstance(target_model, ModelNode)

    # A model is "incremental" here iff it depends on the is_incremental macro.
    target_model_is_incremental = "macro.dbt.is_incremental" in target_model.depends_on.macros
    # The override must be an actual bool; a truthy non-bool does not count.
    unit_test_def_has_incremental_override = unit_test_def.overrides and isinstance(
        unit_test_def.overrides.macros.get("is_incremental"), bool
    )

    if target_model_is_incremental and (not unit_test_def_has_incremental_override):
        raise ParsingError(
            f"Boolean override for 'is_incremental' must be provided for unit test '{unit_test_def.name}' in model '{target_model.name}'"
        )

    unit_test_def_incremental_override_true = (
        unit_test_def.overrides and unit_test_def.overrides.macros.get("is_incremental")
    )
    unit_test_def_has_this_input = "this" in [i.input for i in unit_test_def.given]

    # Simulating an incremental run (is_incremental=True) requires a 'this'
    # input fixture for the model's existing table.
    if (
        target_model_is_incremental
        and unit_test_def_incremental_override_true
        and (not unit_test_def_has_this_input)
    ):
        raise ParsingError(
            f"Unit test '{unit_test_def.name}' for incremental model '{target_model.name}' must have a 'this' input"
        )

    # unit_test_versions = unit_test_def.versions
    # We're setting up unit tests for versioned models, so if
    # the model isn't versioned, we don't need to do anything
    if not target_model.is_versioned:
        if unit_test_def.versions and (
            unit_test_def.versions.include or unit_test_def.versions.exclude
        ):
            # If model is not versioned, we should not have an include or exclude
            msg = (
                f"Unit test '{unit_test_def.name}' should not have a versions include or exclude "
                f"when referencing non-versioned model '{target_model.name}'"
            )
            raise ParsingError(msg)
        else:
            return

    # NOTE(review): models_to_versions looks like
    # {package_name: {model_name: [model unique_ids]}} — confirm against the
    # ManifestLoader caller.
    versioned_models = []
    if (
        target_model.package_name in models_to_versions
        and target_model.name in models_to_versions[target_model.package_name]
    ):
        versioned_models = models_to_versions[target_model.package_name][target_model.name]

    # Narrow to the versions selected by the test's include/exclude config;
    # no versions config means every version is tested.
    versions_to_test = []
    if unit_test_def.versions is None:
        versions_to_test = versioned_models
    elif unit_test_def.versions.exclude:
        for model_unique_id in versioned_models:
            model = manifest.nodes[model_unique_id]
            assert isinstance(model, ModelNode)
            if model.version in unit_test_def.versions.exclude:
                continue
            else:
                versions_to_test.append(model.unique_id)
    elif unit_test_def.versions.include:
        for model_unique_id in versioned_models:
            model = manifest.nodes[model_unique_id]
            assert isinstance(model, ModelNode)
            if model.version in unit_test_def.versions.include:
                versions_to_test.append(model.unique_id)
            else:
                continue

    if not versions_to_test:
        msg = (
            f"Unit test '{unit_test_def.name}' referenced a version of '{target_model.name}' "
            "which was not found."
        )
        raise ParsingError(msg)
    else:
        # Create unit test definitions that match the model versions
        # The original (unversioned) definition is removed from the manifest
        # and its schema file before the per-version copies are added.
        original_unit_test_def = manifest.unit_tests.pop(unit_test_def.unique_id)
        original_unit_test_dict = original_unit_test_def.to_dict()
        schema_file = manifest.files[original_unit_test_def.file_id]
        assert isinstance(schema_file, SchemaSourceFile)
        schema_file.unit_tests.remove(original_unit_test_def.unique_id)
        for versioned_model_unique_id in versions_to_test:
            versioned_model = manifest.nodes[versioned_model_unique_id]
            assert isinstance(versioned_model, ModelNode)
            # Unique id gets a "_v<version>" suffix to distinguish the copies.
            versioned_unit_test_unique_id = f"{NodeType.Unit}.{unit_test_def.package_name}.{unit_test_def.model}.{unit_test_def.name}_v{versioned_model.version}"
            new_unit_test_def = UnitTestDefinition.from_dict(original_unit_test_dict)
            new_unit_test_def.unique_id = versioned_unit_test_unique_id
            new_unit_test_def.depends_on.nodes[0] = versioned_model_unique_id
            new_unit_test_def.version = versioned_model.version
            schema_file.unit_tests.append(versioned_unit_test_unique_id)
            # fqn?
            manifest.unit_tests[versioned_unit_test_unique_id] = new_unit_test_def
@@ -0,0 +1,20 @@
1
+ from typing import Optional
2
+
3
+ # these are just exports, they need "noqa" so flake8 will not complain.
4
+ from .manager import PluginManager, dbt_hook, dbtPlugin # noqa
5
+
6
# Process-wide singleton; populated lazily by set_up_plugin_manager().
PLUGIN_MANAGER: Optional[PluginManager] = None
7
+
8
+
9
def set_up_plugin_manager(project_name: str):
    """(Re)build the module-level PLUGIN_MANAGER from installed plugin modules."""
    global PLUGIN_MANAGER
    PLUGIN_MANAGER = PluginManager.from_modules(project_name)
12
+
13
+
14
def get_plugin_manager(project_name: str) -> PluginManager:
    """Return the process-wide PluginManager, constructing it on first use."""
    # Reading the module global needs no `global` declaration; set_up_plugin_manager
    # performs the assignment when the singleton is not yet (or falsely) set.
    if not PLUGIN_MANAGER:
        set_up_plugin_manager(project_name)
    assert PLUGIN_MANAGER
    return PLUGIN_MANAGER
@@ -0,0 +1,10 @@
1
+ from typing import Dict
2
+
3
+ # just exports, they need "noqa" so flake8 will not complain.
4
+ from dvt.artifacts.schemas.base import ArtifactMixin as PluginArtifact # noqa
5
+ from dvt.artifacts.schemas.base import BaseArtifactMetadata # noqa
6
+ from dvt.artifacts.schemas.base import schema_version # noqa
7
+
8
+ from dbt_common.dataclass_schema import ExtensibleDbtClassMixin, dbtClassMixin # noqa
9
+
10
# Type alias: plugin-produced artifacts keyed by string.
# NOTE(review): keys are presumably artifact names/paths — confirm against PluginManager usage.
PluginArtifacts = Dict[str, PluginArtifact]
@@ -0,0 +1,2 @@
1
+ # just exports, they need "noqa" so flake8 will not complain.
2
+ from dvt.exceptions import dbtPluginError # noqa