dbt-labs · MichelleArk · Nov 2, 2023 · Oct 25, 2023 · Nov 1, 2023 · Nov 1, 2023
diff --git a/.changes/unreleased/Features-20231101-101845.yaml b/.changes/unreleased/Features-20231101-101845.yaml
@@ -0,0 +1,6 @@
+kind: Features
+body: Support unit testing incremental models
+time: 2023-11-01T10:18:45.341781-04:00
+custom:
+  Author: michelleark
+  Issue: "8422"
diff --git a/core/dbt/context/providers.py b/core/dbt/context/providers.py
@@ -1541,6 +1541,14 @@ def env_var(self, var: str, default: Optional[str] = None) -> str:
         else:
             return super().env_var(var, default)
 
+    @contextproperty()
+    def this(self) -> Optional[str]:
+        if self.model.this:
+            # TODO: RuntimeRefResolver.set_cte also passes None as second argument.
+            self.model.set_cte(self.model.this.unique_id, None)  # type: ignore
+            return self.adapter.Relation.add_ephemeral_prefix(self.model.this.name)
+        return None
+
 
 # This is called by '_context_for', used in 'render_with_context'
 def generate_parser_model_context(

diff --git a/core/dbt/contracts/graph/nodes.py b/core/dbt/contracts/graph/nodes.py
@@ -1068,6 +1068,7 @@ class UnitTestNode(CompiledNode):
     attached_node: Optional[str] = None
     overrides: Optional[UnitTestOverrides] = None
     config: UnitTestNodeConfig = field(default_factory=UnitTestNodeConfig)
+    this: Optional[ModelNode] = None
 
 
 @dataclass

diff --git a/core/dbt/exceptions.py b/core/dbt/exceptions.py
@@ -1220,6 +1220,12 @@
         super().__init__(msg=msg)
 
 
+class InvalidUnitTestGivenInput(ParsingError):
+    def __init__(self, input: str) -> None:
+        msg = f"Unit test given inputs must be either a 'ref', 'source' or 'this' call. Got: '{input}'."
+        super().__init__(msg=msg)
+
+
 class SameKeyNestedError(CompilationError):
     def __init__(self) -> None:
         msg = "Test cannot have the same key at the top-level and in config"

diff --git a/core/dbt/parser/unit_tests.py b/core/dbt/parser/unit_tests.py
@@ -9,13 +9,12 @@
 from dbt.contracts.graph.nodes import (
     ModelNode,
     UnitTestNode,
-    RefArgs,
     UnitTestDefinition,
     DependsOn,
     UnitTestConfig,
 )
 from dbt.contracts.graph.unparsed import UnparsedUnitTestSuite
-from dbt.exceptions import ParsingError
+from dbt.exceptions import ParsingError, InvalidUnitTestGivenInput
 from dbt.graph import UniqueId
 from dbt.node_types import NodeType
 from dbt.parser.schemas import (
@@ -28,7 +27,7 @@
     ParseResult,
 )
 from dbt.utils import get_pseudo_test_path
-from dbt_extractor import py_extract_from_source  # type: ignore
+from dbt_extractor import py_extract_from_source, ExtractionError  # type: ignore
 
 
 class UnitTestManifestLoader:
@@ -53,6 +52,7 @@
         actual_node = self.manifest.ref_lookup.perform_lookup(
             f"model.{package_name}.{test_case.model}", self.manifest
         )
+        assert isinstance(actual_node, ModelNode)
 
         # Create UnitTestNode based on model being tested. Since selection has
         # already been done, we don't have to care about fields that are necessary
@@ -106,7 +106,7 @@
         # input models substituting for the same input ref'd model.
         for given in test_case.given:
             # extract the original_input_node from the ref in the "input" key of the given list
-            original_input_node = self._get_original_input_node(given.input)
+            original_input_node = self._get_original_input_node(given.input, actual_node)
 
             original_input_node_columns = None
             if (
@@ -117,11 +117,13 @@
                     column.name: column.data_type for column in original_input_node.columns
                 }
 
-            # TODO: package_name?
-            input_name = f"{test_case.model}__{test_case.name}__{original_input_node.name}"
+            # TODO: include package_name?
+            input_name = f"{unit_test_node.name}__{original_input_node.name}"
             input_unique_id = f"model.{package_name}.{input_name}"
             input_node = ModelNode(
-                raw_code=self._build_raw_code(given.get_rows(), original_input_node_columns),
+                raw_code=self._build_fixture_raw_code(
+                    given.get_rows(), original_input_node_columns
+                ),
                 resource_type=NodeType.Model,
                 package_name=package_name,
                 path=original_input_node.path,
@@ -136,37 +138,55 @@
                 checksum=FileHash.empty(),
             )
             self.unit_test_manifest.nodes[input_node.unique_id] = input_node
+
+            # Store input_node on unit_test_node for ease of access in UnitTestContext.this
+            if original_input_node == actual_node:
+                unit_test_node.this = input_node
+
             # Add unique ids of input_nodes to depends_on
             unit_test_node.depends_on.nodes.append(input_node.unique_id)
 
-    def _build_raw_code(self, rows, column_name_to_data_types) -> str:
+    def _build_fixture_raw_code(self, rows, column_name_to_data_types) -> str:
         return ("{{{{ get_fixture_sql({rows}, {column_name_to_data_types}) }}}}").format(
             rows=rows, column_name_to_data_types=column_name_to_data_types
         )
 
-    def _get_original_input_node(self, input: str):
-        """input: ref('my_model_a')"""
-        # Exract the ref or sources
-        statically_parsed = py_extract_from_source(f"{{{{ {input} }}}}")
-        if statically_parsed["refs"]:
-            # set refs and sources on the node object
-            refs: List[RefArgs] = []
-            for ref in statically_parsed["refs"]:
-                name = ref.get("name")
-                package = ref.get("package")
-                version = ref.get("version")
-                refs.append(RefArgs(name, package, version))
-                # TODO: disabled lookup, versioned lookup, public models
-                original_input_node = self.manifest.ref_lookup.find(
-                    name, package, version, self.manifest
-                )
-        elif statically_parsed["sources"]:
-            input_package_name, input_source_name = statically_parsed["sources"][0]
-            original_input_node = self.manifest.source_lookup.find(
-                input_source_name, input_package_name, self.manifest
-            )
+    def _get_original_input_node(self, input: str, tested_node: ModelNode):
+        """
+        Returns the original input node as defined in the project given an input reference
+        and the node being tested.
+
+        input: str representing how the input node is referenced in the tested model's SQL
+          * examples:
+            - "ref('my_model_a')"
+            - "source('my_source_schema', 'my_source_name')"
+            - "this"
+        tested_node: ModelNode representing the node being tested
+        """
+        if input.strip() == "this":
+            original_input_node = tested_node
         else:
-            raise ParsingError("given input must be ref or source")
+            try:
+                statically_parsed = py_extract_from_source(f"{{{{ {input} }}}}")
+            except ExtractionError:
+                raise InvalidUnitTestGivenInput(input=input)
+
+            if statically_parsed["refs"]:
+                for ref in statically_parsed["refs"]:
+                    name = ref.get("name")
+                    package = ref.get("package")
+                    version = ref.get("version")
+                    # TODO: disabled lookup, versioned lookup, public models
+                    original_input_node = self.manifest.ref_lookup.find(
+                        name, package, version, self.manifest
+                    )
+            elif statically_parsed["sources"]:
+                input_package_name, input_source_name = statically_parsed["sources"][0]
+                original_input_node = self.manifest.source_lookup.find(
+                    input_source_name, input_package_name, self.manifest
+                )
+            else:
+                raise InvalidUnitTestGivenInput(input=input)
 
         return original_input_node
 

diff --git a/tests/functional/unit_testing/test_unit_testing.py b/tests/functional/unit_testing/test_unit_testing.py
@@ -331,3 +331,77 @@ def test_basic(self, project):
         )
         with pytest.raises(ParsingError):
             results = run_dbt(["unit-test", "--select", "my_model"], expect_pass=False)
+
+
+event_sql = """
+select DATE '2020-01-01' as event_time, 1 as event
+union all
+select DATE '2020-01-02' as event_time, 2 as event
+union all
+select DATE '2020-01-03' as event_time, 3 as event
+"""
+
+my_incremental_model_sql = """
+{{
+    config(
+        materialized='incremental'
+    )
+}}
+
+select * from {{ ref('events') }}
+{% if is_incremental() %}
+where event_time > (select max(event_time) from {{ this }})
+{% endif %}
+"""
+
+test_my_model_incremental_yml = """
+unit:
+  - model: my_incremental_model
+    tests:
+      - name: incremental_false
+        overrides:
+          macros:
+            is_incremental: false
+        given:
+          - input: ref('events')
+            rows:
+              - {event_time: "2020-01-01", event: 1}
+        expect:
+          rows:
+            - {event_time: "2020-01-01", event: 1}
+      - name: incremental_true
+        overrides:
+          macros:
+            is_incremental: true
+        given:
+          - input: ref('events')
+            rows:
+              - {event_time: "2020-01-01", event: 1}
+              - {event_time: "2020-01-02", event: 2}
+              - {event_time: "2020-01-03", event: 3}
+          - input: this
+            rows:
+              - {event_time: "2020-01-01", event: 1}
+        expect:
+          rows:
+            - {event_time: "2020-01-02", event: 2}
+            - {event_time: "2020-01-03", event: 3}
+"""
+
+
+class TestUnitTestIncrementalModel:
+    @pytest.fixture(scope="class")
+    def models(self):
+        return {
+            "my_incremental_model.sql": my_incremental_model_sql,
+            "events.sql": event_sql,
+            "test_my_incremental_model.yml": test_my_model_incremental_yml,
+        }
+
+    def test_basic(self, project):
+        results = run_dbt(["run"])
+        assert len(results) == 2
+
+        # Select by model name
+        results = run_dbt(["unit-test", "--select", "my_incremental_model"], expect_pass=True)
+        assert len(results) == 2