Merged
6 changes: 6 additions & 0 deletions .changes/unreleased/Features-20230313-135917.yaml
@@ -0,0 +1,6 @@
kind: Features
body: Make model contracts agnostic to ordering
time: 2023-03-13T13:59:17.255368-04:00
custom:
Author: gshank
Issue: 6975 7064
2 changes: 1 addition & 1 deletion core/dbt/clients/jinja.py
@@ -483,7 +483,7 @@ def get_environment(
native: bool = False,
) -> jinja2.Environment:
args: Dict[str, List[Union[str, Type[jinja2.ext.Extension]]]] = {
"extensions": ["jinja2.ext.do"]
"extensions": ["jinja2.ext.do", "jinja2.ext.loopcontrols"]
}

if capture_macros:
6 changes: 6 additions & 0 deletions core/dbt/context/exceptions_jinja.py
@@ -23,6 +23,7 @@
PropertyYMLError,
NotImplementedError,
RelationWrongTypeError,
ContractError,
ColumnTypeMissingError,
)

@@ -66,6 +67,10 @@ def raise_compiler_error(msg, node=None) -> NoReturn:
raise CompilationError(msg, node)


def raise_contract_error(yaml_columns, sql_columns) -> NoReturn:
raise ContractError(yaml_columns, sql_columns)


def raise_database_error(msg, node=None) -> NoReturn:
raise DbtDatabaseError(msg, node)

@@ -124,6 +129,7 @@ def column_type_missing(column_names) -> NoReturn:
raise_invalid_property_yml_version,
raise_not_implemented,
relation_wrong_type,
raise_contract_error,
column_type_missing,
]
}
17 changes: 17 additions & 0 deletions core/dbt/exceptions.py
@@ -2124,6 +2124,23 @@ def get_message(self) -> str:
return msg


class ContractError(CompilationError):
def __init__(self, yaml_columns, sql_columns):
self.yaml_columns = yaml_columns
self.sql_columns = sql_columns
super().__init__(msg=self.get_message())

def get_message(self) -> str:
msg = (
"Contracts are enabled for this model. "
"Please ensure the name, data_type, and number of columns in your `yml` file "
"match the columns in your SQL file.\n"
f"Schema File Columns: {self.yaml_columns}\n"
Contributor:

It might be useful to sort these both alphabetically (message only) so that it's easier for the user to spot the difference.

f"SQL File Columns: {self.sql_columns}"
)
return msg
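
A minimal sketch of the reviewer's alphabetical-sort suggestion (a hypothetical helper, not part of this diff; display-only, the comparison logic is unchanged):

def format_contract_mismatch(yaml_columns: str, sql_columns: str) -> str:
    # Sort the comma-separated "name data_type" entries so matching columns line up;
    # assumes no commas appear inside individual data types (nested types would need smarter splitting).
    def sort_cols(cols: str) -> str:
        return ", ".join(sorted(c.strip() for c in cols.split(",")))
    return (
        "Contracts are enabled for this model. "
        "Please ensure the name, data_type, and number of columns in your `yml` file "
        "match the columns in your SQL file.\n"
        f"Schema File Columns: {sort_cols(yaml_columns)}\n"
        f"SQL File Columns: {sort_cols(sql_columns)}"
    )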


# not modifying these since rpc should be deprecated soon
class UnknownAsyncIDException(Exception):
CODE = 10012
@@ -37,13 +37,32 @@
{#--Obtain the column schema provided by the schema file by generating an 'empty schema' query from the model's columns. #}
{%- set schema_file_provided_columns = get_column_schema_from_query(get_empty_schema_sql(model['columns'])) -%}

{%- set sql_file_provided_columns_formatted = format_columns(sql_file_provided_columns) -%}
{%- set schema_file_provided_columns_formatted = format_columns(schema_file_provided_columns) -%}
{#-- For compiler error msg #}
{%- set sql_columns = (format_columns(sql_file_provided_columns)|trim) -%}
{%- set yaml_columns = (format_columns(schema_file_provided_columns)|trim) -%}

{%- if sql_file_provided_columns_formatted != schema_file_provided_columns_formatted -%}
{%- do exceptions.raise_compiler_error('Please ensure the name, data_type, order, and number of columns in your `yml` file match the columns in your SQL file.\nSchema File Columns: ' ~ (schema_file_provided_columns_formatted|trim) ~ '\n\nSQL File Columns: ' ~ (sql_file_provided_columns_formatted|trim) ~ ' ' ) %}
{%- if sql_file_provided_columns|length != schema_file_provided_columns|length -%}
{%- do exceptions.raise_contract_error(yaml_columns, sql_columns) -%}
{%- endif -%}

{%- for sql_col in sql_file_provided_columns -%}
{%- set yaml_col = [] -%}
{%- for schema_col in schema_file_provided_columns -%}
{%- if schema_col.name == sql_col.name -%}
{%- do yaml_col.append(schema_col) -%}
{%- break -%}
{%- endif -%}
{%- endfor -%}
{%- if not yaml_col -%}
{#-- Column with name not found in yaml --#}
{%- do exceptions.raise_contract_error(yaml_columns, sql_columns) -%}
{%- endif -%}
{%- if sql_col.dtype != yaml_col[0].dtype -%}
Contributor:

Previously column types were compared based on their formatted representation, which could be data platform specific as implemented by the <adapter>__format_column macro.

For example, BigQuery's format_column implementation compares data_type values by column.data_type as opposed to column.dtype in order to make comparisons on nested data types.

Strictly comparing SQL and yml data_type values by dtype would allow the following contract to be accepted in BigQuery:

SELECT
STRUCT("test" AS name, [1.0,2.0] AS laps) as some_struct
models:
  - name: test_schema
    config:
      contract: true
    columns:
      - name: some_struct
        data_type: STRUCT<name FLOAT64, laps STRING> #wrong! but accepted because dtype == STRUCT for both SQL and schema.yml

One workaround would be to do this comparison using format_column instead, i.e: adapter.dispatch('format_column', 'dbt')(sql_col) != adapter.dispatch('format_column', 'dbt')(yaml_col[0]). This would also ensure the comparison and error messaging are using consistent logic. An alternative would be to implement a default__compare_data_types macro to enable adapter-specific implementations.
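
A small self-contained Python illustration of this concern (hypothetical values, not adapter code): both columns report dtype == "STRUCT", so a dtype-only comparison passes even though the full data_type strings disagree.

sql_col = {"name": "some_struct", "dtype": "STRUCT",
           "data_type": "STRUCT<name STRING, laps ARRAY<FLOAT64>>"}
yml_col = {"name": "some_struct", "dtype": "STRUCT",
           "data_type": "STRUCT<name FLOAT64, laps STRING>"}
assert sql_col["dtype"] == yml_col["dtype"]           # dtype-only check: passes
assert sql_col["data_type"] != yml_col["data_type"]   # full data_type check: catches the mismatch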

Contributor Author:

I looked at using format_column but the default implementation of that just uses the dtype. Is that different in the other adapters?

Contributor Author:

I don't actually see any implementations of format_column in the adapters.

Contributor Author:

Oh, I was on the wrong bigquery branch. Bigquery is the only adapter that implements it.

Contributor Author:

Could we include the formatted column in the Column structures returned by "get_column_schema_from_query"?

Contributor Author:

Or concatenate the other parts of the column structure for comparison?

Contributor:

This looks like a lot of logic to put in a jinja template. Could we put this in a python function and then wrap that python function in this macro? I'm cutting corners, but this is what's in my head:

columns_spec_ddl.sql

{% macro assert_columns_equivalent(sql) %}

  {% set sql_schema = get_column_schema_from_query(sql) %}

  {% set model_contract = model_contract(model['columns']) %}

  {% do assert_schema_meets_contract(sql_schema, model_contract) %}

{% endmacro %}

dbt/adapters/base/impl.py (for lack of a better spot)

# these are defined elsewhere, but look something like this
ModelContract = List[ColumnContract]
Schema = List[Column]


def model_contract(model) -> ModelContract:
    # I assume we have a way of creating a model contract from a `schema.yml` file
    return ModelContract(model)


def assert_schema_meets_contract(schema: Schema, model_contract: ModelContract):
    if len(schema) != len(model_contract):
        raise ContractError(msg)
    for schema_column, contract_column in zip(sorted(schema), sorted(model_contract)):
        try:
            assert schema_column.name == contract_column.name
            assert schema_column.dtype == contract_column.dtype
        except AssertionError:
            raise ContractError(msg)

I think the python version would be much easier to unit test.

{#-- Column data types don't match --#}
{%- do exceptions.raise_contract_error(yaml_columns, sql_columns) -%}
{%- endif -%}
{%- endfor -%}

{% endmacro %}

{% macro format_columns(columns) %}
@@ -25,11 +25,26 @@

Contributor:

I'm thinking through what this might look like across all potential adapters, and if we need to add contract-related items in the future. With that context, I have the following questions:

  1. Do you think this could benefit from becoming a "dispatch" method? The goal of this would be to create a hard divide between contracted models and non-contracted models.
  2. Do we need to include the column select statement in default__get_select_subquery if we already validated get_assert_columns_equivalent? We validate that the number of columns are the same, and the names are the same. So I think the subquery already limits to just the columns that we want.
  3. It looks like get_assert_columns_equivalent might have been renamed assert_columns_equivalent.

With my assumptions (not necessarily true of course):

{% macro default__create_table_as(temporary, relation, sql) -%}
  {% if config.get('contract', False) %}
    {{ default__create_table_as_with_contract(temporary, relation, sql) }}
  {% else %}
    {{ default__create_table_as_without_contract(temporary, relation, sql) }}
  {% endif %}
{% endmacro %}

{% macro default__create_table_as_with_contract(temporary, relation, sql) %}
  {{ get_assert_columns_equivalent(sql) }}
  
  create {% if temporary: -%}temporary{%- endif %} table
    {{ relation.include(database=(not temporary), schema=(not temporary)) }}
    {{ get_columns_spec_ddl() }}
  as ({{ sql }})

{% endmacro %}

{% macro default__create_table_as_without_contract(temporary, relation, sql) %}
  create {% if temporary: -%}temporary{%- endif %} table
    {{ relation.include(database=(not temporary), schema=(not temporary)) }}
  as ({{ sql }})
{% endmacro %}

This would maintain backwards compatibility because we're keeping the macro create_table_as, which is what would have been overridden. And if we need to update only one of these in the future, it isolates the updates, instead of impacting all "create table" workflows. I'm open to feedback and I'm just trying to communicate a thought here. Please let me know what you think of these recommendations.

Contributor Author:

We need the get_select_subquery in order to put the columns in the right order. We removed validating the order because we added the subquery. As far as splitting out the macro into two, probably @jtcohen6 and @MichelleArk should weigh in on that.
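
A quick Python illustration of this point (hypothetical values; only the model_subq alias is taken from the macro below): names and count match, so the equivalence check passes, and the wrapping subquery re-projects the columns into the yaml contract's order.

contract_columns = ["id", "color", "date_day"]  # order declared in schema.yml
inner_sql = "select 'blue' as color, 1 as id, cast('2019-01-01' as date) as date_day"
reordered_sql = "select " + ", ".join(contract_columns) + " from ( " + inner_sql + " ) as model_subq"
print(reordered_sql)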

create {% if temporary: -%}temporary{%- endif %} table
{{ relation.include(database=(not temporary), schema=(not temporary)) }}
{% if config.get('contract', False) %}
{{ get_assert_columns_equivalent(sql) }}
{{ get_columns_spec_ddl() }}
{% endif %}
{% if config.get('contract', False) %}
{{ get_assert_columns_equivalent(sql) }}
{{ get_columns_spec_ddl() }}
{%- set sql = get_select_subquery(sql) %}
{% endif %}
as (
{{ sql }}
);
{%- endmacro %}

{% macro get_select_subquery(sql) %}
{{ return(adapter.dispatch('get_select_subquery', 'dbt')(sql)) }}
{% endmacro %}

{% macro default__get_select_subquery(sql) %}
select
{% for column in model['columns'] %}
{{ column }}{{ ", " if not loop.last }}
{% endfor %}
from (
{{ sql }}
) as model_subq
{%- endmacro %}
7 changes: 4 additions & 3 deletions plugins/postgres/dbt/include/postgres/macros/adapters.sql
@@ -13,10 +13,11 @@
{{ get_assert_columns_equivalent(sql) }}
{{ get_columns_spec_ddl() }} ;
insert into {{ relation }} {{ get_column_names() }}
{% else %}
as
{%- set sql = get_select_subquery(sql) %}
{% else %}
as
{% endif %}
(
(
{{ sql }}
);
{%- endmacro %}
39 changes: 18 additions & 21 deletions tests/adapter/dbt/tests/adapter/constraints/test_constraints.py
@@ -65,8 +65,9 @@ def data_types(self, schema_int_type, int_type, string_type):
]

def test__constraints_wrong_column_order(self, project, string_type, int_type):
# This no longer causes an error, since we enforce yaml column order
results, log_output = run_dbt_and_capture(
["run", "-s", "my_model_wrong_order"], expect_pass=False
["run", "-s", "my_model_wrong_order"], expect_pass=True
)
manifest = get_manifest(project.project_root)
model_id = "model.test.my_model_wrong_order"
@@ -75,18 +76,6 @@ def test__constraints_wrong_column_order(self, project, string_type, int_type):

assert contract_actual_config is True

expected_compile_error = "Please ensure the name, data_type, order, and number of columns in your `yml` file match the columns in your SQL file."
expected_schema_file_columns = (
f"Schema File Columns: id {int_type}, color {string_type}, date_day DATE"
)
expected_sql_file_columns = (
f"SQL File Columns: color {string_type}, id {int_type}, date_day DATE"
)

assert expected_compile_error in log_output
assert expected_schema_file_columns in log_output
assert expected_sql_file_columns in log_output

def test__constraints_wrong_column_names(self, project, string_type, int_type):
results, log_output = run_dbt_and_capture(
["run", "-s", "my_model_wrong_name"], expect_pass=False
@@ -98,7 +87,7 @@ def test__constraints_wrong_column_names(self, project, string_type, int_type):

assert contract_actual_config is True

expected_compile_error = "Please ensure the name, data_type, order, and number of columns in your `yml` file match the columns in your SQL file."
expected_compile_error = "Please ensure the name, data_type, and number of columns in your `yml` file match the columns in your SQL file."
expected_schema_file_columns = (
f"Schema File Columns: id {int_type}, color {string_type}, date_day DATE"
)
@@ -147,7 +136,7 @@ def test__constraints_wrong_column_data_types(

assert contract_actual_config is True

expected_compile_error = "Please ensure the name, data_type, order, and number of columns in your `yml` file match the columns in your SQL file."
expected_compile_error = "Please ensure the name, data_type, and number of columns in your `yml` file match the columns in your SQL file."
expected_sql_file_columns = (
f"SQL File Columns: wrong_data_type_column_name {error_data_type}"
)
@@ -196,11 +185,19 @@ def test__constraints_correct_column_data_types(self, project, data_types):
id ,
color ,
date_day
) (
)
(
select
1 as id,
'blue' as color,
cast('2019-01-01' as date) as date_day
id,
color,
date_day
from
(
select
1 as id,
'blue' as color,
cast('2019-01-01' as date) as date_day
) as model_subq
);
"""

@@ -248,10 +245,10 @@ def test__constraints_ddl(self, project, expected_sql):
expected_sql_check == generated_sql_check
), f"""
-- GENERATED SQL
{generated_sql}
{generated_sql_check}

-- EXPECTED SQL
{expected_sql}
{expected_sql_check}
"""

def test__constraints_enforcement_rollback(
@@ -1,6 +1,6 @@
import pytest
from dbt.exceptions import ParsingError
from dbt.tests.util import run_dbt, get_manifest, run_dbt_and_capture
from dbt.tests.util import run_dbt, get_manifest, get_artifact, run_dbt_and_capture

my_model_sql = """
{{
@@ -10,8 +10,8 @@
}}

select
1 as id,
'blue' as color,
1 as id,
cast('2019-01-01' as date) as date_day
"""

@@ -29,7 +29,7 @@
cast('2019-01-01' as date) as date_day
"""

my_model_constraints_disabled_sql = """
my_model_contract_disabled_sql = """
{{
config(
materialized = "table",
@@ -171,7 +171,7 @@ def model(dbt, _):
"""


class TestModelLevelConstraintsEnabledConfigs:
class TestModelLevelContractEnabledConfigs:
@pytest.fixture(scope="class")
def models(self):
return {
@@ -180,11 +180,12 @@ def models(self):
}

def test__model_contract_true(self, project):
run_dbt(["parse"])
run_dbt(["run"])
manifest = get_manifest(project.project_root)
model_id = "model.test.my_model"
my_model_columns = manifest.nodes[model_id].columns
my_model_config = manifest.nodes[model_id].config
model = manifest.nodes[model_id]
my_model_columns = model.columns
my_model_config = model.config
contract_actual_config = my_model_config.contract

assert contract_actual_config is True
@@ -193,8 +194,17 @@ def test__model_contract_true(self, project):

assert expected_columns == str(my_model_columns)

# compiled fields aren't in the manifest above because it only has parsed fields
manifest_json = get_artifact(project.project_root, "target", "manifest.json")
compiled_code = manifest_json["nodes"][model_id]["compiled_code"]
cleaned_code = " ".join(compiled_code.split())
assert (
"select 'blue' as color, 1 as id, cast('2019-01-01' as date) as date_day"
== cleaned_code
)


class TestProjectConstraintsEnabledConfigs:
class TestProjectContractEnabledConfigs:
@pytest.fixture(scope="class")
def project_config_update(self):
return {
@@ -221,7 +231,7 @@ def test_defined_column_type(self, project):
assert contract_actual_config is True


class TestProjectConstraintsEnabledConfigsError:
class TestProjectContractEnabledConfigsError:
@pytest.fixture(scope="class")
def project_config_update(self):
return {
@@ -253,7 +263,7 @@ def test_undefined_column_type(self, project):
assert expected_compile_error in log_output


class TestModelConstraintsEnabledConfigs:
class TestModelContractEnabledConfigs:
@pytest.fixture(scope="class")
def models(self):
return {"my_model.sql": my_model_contract_sql, "constraints_schema.yml": model_schema_yml}
@@ -267,7 +277,7 @@ def test__model_contract(self, project):
assert contract_actual_config is True


class TestModelConstraintsEnabledConfigsMissingDataTypes:
class TestModelContractEnabledConfigsMissingDataTypes:
@pytest.fixture(scope="class")
def models(self):
return {
@@ -289,11 +299,11 @@ def test_undefined_column_type(self, project):
assert expected_compile_error in log_output


class TestModelLevelConstraintsDisabledConfigs:
class TestModelLevelContractDisabledConfigs:
@pytest.fixture(scope="class")
def models(self):
return {
"my_model.sql": my_model_constraints_disabled_sql,
"my_model.sql": my_model_contract_disabled_sql,
"constraints_schema.yml": model_schema_yml,
}

@@ -308,7 +318,7 @@ def test__model_contract_false(self, project):
assert contract_actual_config is False


class TestModelLevelConstraintsErrorMessages:
class TestModelLevelContractErrorMessages:
@pytest.fixture(scope="class")
def models(self):
return {
@@ -330,7 +340,7 @@ def test__config_errors(self, project):
assert expected_empty_data_type_error not in str(exc_str)


class TestSchemaConstraintsEnabledConfigs:
class TestSchemaContractEnabledConfigs:
@pytest.fixture(scope="class")
def models(self):
return {
@@ -347,7 +357,7 @@ def test__schema_error(self, project):
assert schema_error_expected in str(exc_str)


class TestPythonModelLevelConstraintsErrorMessages:
class TestPythonModelLevelContractErrorMessages:
@pytest.fixture(scope="class")
def models(self):
return {