use adapter to execute sql

create incremental test directory in adapter zone
v2 based on feedback on the base version of the tests, plus a small change removing a leftover breakpoint
2025-12-17 19:31:34 +00:00 · 2022-04-01 16:18:13 -04:00 · 2022-04-01 09:21:43 -05:00 · 2022-03-31 17:07:23 -05:00 · 2022-03-30 16:10:15 -05:00 · 2022-03-30 09:57:02 -05:00
20 changed files with 565 additions and 570 deletions
--- a/.changes/unreleased/Features-20220328-150812.yaml
+++ b/.changes/unreleased/Features-20220328-150812.yaml
@@ -0,0 +1,7 @@
+kind: Features
+body: converting unique key as list tests to new pytest format
+time: 2022-03-28T15:08:12.70006-05:00
+custom:
+  Author: McKnight-42
+  Issue: "4882"
+  PR: "4958"
--- a/core/dbt/tests/tables.py
+++ b/core/dbt/tests/tables.py
@@ -1,8 +1,7 @@
 from dbt.context import providers
 from unittest.mock import patch
 from contextlib import contextmanager
-from dbt.events.functions import fire_event
-from dbt.events.test_types import IntegrationTestDebug
+from dbt.tests.util import run_sql_with_adapter

 # This code was copied from the earlier test framework in test/integration/base.py
 # The goal is to vastly simplify this and replace it with calls to macros.
@@ -309,38 +308,7 @@ class TableComparison:

    # This duplicates code in the TestProjInfo class.
    def run_sql(self, sql, fetch=None):
-        if sql.strip() == "":
-            return
-        # substitute schema and database in sql
-        adapter = self.adapter
-        kwargs = {
-            "schema": self.unique_schema,
-            "database": adapter.quote(self.default_database),
-        }
-        sql = sql.format(**kwargs)
-
-        with self.get_connection("__test") as conn:
-            msg = f'test connection "{conn.name}" executing: {sql}'
-            fire_event(IntegrationTestDebug(msg=msg))
-            with conn.handle.cursor() as cursor:
-                try:
-                    cursor.execute(sql)
-                    conn.handle.commit()
-                    conn.handle.commit()
-                    if fetch == "one":
-                        return cursor.fetchone()
-                    elif fetch == "all":
-                        return cursor.fetchall()
-                    else:
-                        return
-                except BaseException as e:
-                    if conn.handle and not getattr(conn.handle, "closed", True):
-                        conn.handle.rollback()
-                    print(sql)
-                    print(e)
-                    raise
-                finally:
-                    conn.transaction_open = False
+        return run_sql_with_adapter(self.adapter, sql, fetch=fetch)

    def get_tables_in_schema(self):
        sql = """
--- a/test/integration/076_incremental_unique_id_test/models/duplicated_unary_unique_key_list.sql
+++ b/test/integration/076_incremental_unique_id_test/models/duplicated_unary_unique_key_list.sql
@@ -1,17 +0,0 @@
-{{
-    config(
-        materialized='incremental',
-        unique_key=['state', 'state']
-    )
-}}
-
-select
-    state::varchar(2) as state,
-    county::varchar(12) as county,
-    city::varchar(12) as city,
-    last_visit_date::date as last_visit_date
-from {{ ref('seed') }}
-
-{% if is_incremental() %}
-    where last_visit_date > (select max(last_visit_date) from {{ this }})
-{% endif %}
--- a/test/integration/076_incremental_unique_id_test/models/empty_str_unique_key.sql
+++ b/test/integration/076_incremental_unique_id_test/models/empty_str_unique_key.sql
@@ -1,16 +0,0 @@
-- ensure model with empty string unique key should build normally
-
-{{
-    config(
-        materialized='incremental',
-        unique_key=''
-    )
-}}
-
-select
-    *
-from {{ ref('seed') }}
-
-{% if is_incremental() %}
-    where last_visit_date > (select max(last_visit_date) from {{ this }})
-{% endif %}
--- a/test/integration/076_incremental_unique_id_test/models/empty_unique_key_list.sql
+++ b/test/integration/076_incremental_unique_id_test/models/empty_unique_key_list.sql
@@ -1,14 +0,0 @@
-- model with empty list unique key should build normally
-
-{{
-    config(
-        materialized='incremental',
-        unique_key=[]
-    )
-}}
-
-select * from {{ ref('seed') }}
-
-{% if is_incremental() %}
-    where last_visit_date > (select max(last_visit_date) from {{ this }})
-{% endif %}
--- a/test/integration/076_incremental_unique_id_test/models/expected/one_str__overwrite.sql
+++ b/test/integration/076_incremental_unique_id_test/models/expected/one_str__overwrite.sql
@@ -1,21 +0,0 @@
-{{
-    config(
-        materialized='table'
-    )
-}}
-
-select
-    'CT'::varchar(2) as state,
-    'Hartford'::varchar(12) as county,
-    'Hartford'::varchar(12) as city,
-    '2022-02-14'::date as last_visit_date
-union all
-select 'MA'::varchar(2),'Suffolk'::varchar(12),'Boston'::varchar(12),'2020-02-12'::date
-union all
-select 'NJ'::varchar(2),'Mercer'::varchar(12),'Trenton'::varchar(12),'2022-01-01'::date
-union all
-select 'NY'::varchar(2),'Kings'::varchar(12),'Brooklyn'::varchar(12),'2021-04-02'::date
-union all
-select 'NY'::varchar(2),'New York'::varchar(12),'Manhattan'::varchar(12),'2021-04-01'::date
-union all
-select 'PA'::varchar(2),'Philadelphia'::varchar(12),'Philadelphia'::varchar(12),'2021-05-21'::date
--- a/test/integration/076_incremental_unique_id_test/models/expected/unique_key_list__inplace_overwrite.sql
+++ b/test/integration/076_incremental_unique_id_test/models/expected/unique_key_list__inplace_overwrite.sql
@@ -1,21 +0,0 @@
-{{
-    config(
-        materialized='table'
-    )
-}}
-
-select
-    'CT'::varchar(2) as state,
-    'Hartford'::varchar(12) as county,
-    'Hartford'::varchar(12) as city,
-    '2022-02-14'::date as last_visit_date
-union all
-select 'MA'::varchar(2),'Suffolk'::varchar(12),'Boston'::varchar(12),'2020-02-12'::date
-union all
-select 'NJ'::varchar(2),'Mercer'::varchar(12),'Trenton'::varchar(12),'2022-01-01'::date
-union all
-select 'NY'::varchar(2),'Kings'::varchar(12),'Brooklyn'::varchar(12),'2021-04-02'::date
-union all
-select 'NY'::varchar(2),'New York'::varchar(12),'Manhattan'::varchar(12),'2021-04-01'::date
-union all
-select 'PA'::varchar(2),'Philadelphia'::varchar(12),'Philadelphia'::varchar(12),'2021-05-21'::date
--- a/test/integration/076_incremental_unique_id_test/models/no_unique_key.sql
+++ b/test/integration/076_incremental_unique_id_test/models/no_unique_key.sql
@@ -1,15 +0,0 @@
-- no specified unique key should cause no special build behavior
-
-{{
-    config(
-        materialized='incremental'
-    )
-}}
-
-select
-    *
-from {{ ref('seed') }}
-
-{% if is_incremental() %}
-    where last_visit_date > (select max(last_visit_date) from {{ this }})
-{% endif %}
--- a/test/integration/076_incremental_unique_id_test/models/nontyped_trinary_unique_key_list.sql
+++ b/test/integration/076_incremental_unique_id_test/models/nontyped_trinary_unique_key_list.sql
@@ -1,21 +0,0 @@
-- a multi-argument unique key list should see overwriting on rows in the model
--   where all unique key fields apply
--   N.B. needed for direct comparison with seed
-
-{{
-    config(
-        materialized='incremental',
-        unique_key=['state', 'county', 'city']
-    )
-}}
-
-select
-    state as state,
-    county as county,
-    city as city,
-    last_visit_date as last_visit_date
-from {{ ref('seed') }}
-
-{% if is_incremental() %}
-    where last_visit_date > (select max(last_visit_date) from {{ this }})
-{% endif %}
--- a/test/integration/076_incremental_unique_id_test/models/not_found_unique_key.sql
+++ b/test/integration/076_incremental_unique_id_test/models/not_found_unique_key.sql
@@ -1,16 +0,0 @@
-- a model with a unique key not found in the table itself will error out
-
-{{
-    config(
-        materialized='incremental',
-        unique_key='thisisnotacolumn'
-    )
-}}
-
-select
-    *
-from {{ ref('seed') }}
-
-{% if is_incremental() %}
-    where last_visit_date > (select max(last_visit_date) from {{ this }})
-{% endif %}
--- a/test/integration/076_incremental_unique_id_test/models/not_found_unique_key_list.sql
+++ b/test/integration/076_incremental_unique_id_test/models/not_found_unique_key_list.sql
@@ -1,10 +0,0 @@
-- a unique key list with any element not in the model itself should error out
-
-{{
-    config(
-        materialized='incremental',
-        unique_key=['state', 'thisisnotacolumn']
-    )
-}}
-
-select * from {{ ref('seed') }}
--- a/test/integration/076_incremental_unique_id_test/models/str_unique_key.sql
+++ b/test/integration/076_incremental_unique_id_test/models/str_unique_key.sql
@@ -1,21 +0,0 @@
-- a unique key with a string should trigger to overwrite behavior when
--   the source has entries in conflict (i.e. more than one row per unique key
--   combination)
-
-{{
-    config(
-        materialized='incremental',
-        unique_key='state'
-    )
-}}
-
-select
-    state::varchar(2) as state,
-    county::varchar(12) as county,
-    city::varchar(12) as city,
-    last_visit_date::date as last_visit_date
-from {{ ref('seed') }}
-
-{% if is_incremental() %}
-    where last_visit_date > (select max(last_visit_date) from {{ this }})
-{% endif %}
--- a/test/integration/076_incremental_unique_id_test/models/trinary_unique_key_list.sql
+++ b/test/integration/076_incremental_unique_id_test/models/trinary_unique_key_list.sql
@@ -1,20 +0,0 @@
-- a multi-argument unique key list should see overwriting on rows in the model
--   where all unique key fields apply
-
-{{
-    config(
-        materialized='incremental',
-        unique_key=['state', 'county', 'city']
-    )
-}}
-
-select
-    state::varchar(2) as state,
-    county::varchar(12) as county,
-    city::varchar(12) as city,
-    last_visit_date::date as last_visit_date
-from {{ ref('seed') }}
-
-{% if is_incremental() %}
-    where last_visit_date > (select max(last_visit_date) from {{ this }})
-{% endif %}
--- a/test/integration/076_incremental_unique_id_test/models/unary_unique_key_list.sql
+++ b/test/integration/076_incremental_unique_id_test/models/unary_unique_key_list.sql
@@ -1,20 +0,0 @@
-- a one argument unique key list should result in overwritting semantics for
--   that one matching field
-
-{{
-    config(
-        materialized='incremental',
-        unique_key=['state']
-    )
-}}
-
-select
-    state::varchar(2) as state,
-    county::varchar(12) as county,
-    city::varchar(12) as city,
-    last_visit_date::date as last_visit_date
-from {{ ref('seed') }}
-
-{% if is_incremental() %}
-    where last_visit_date > (select max(last_visit_date) from {{ this }})
-{% endif %}
--- a/test/integration/076_incremental_unique_id_test/seeds/add_new_rows.sql
+++ b/test/integration/076_incremental_unique_id_test/seeds/add_new_rows.sql
@@ -1,12 +0,0 @@
-- Insert statement which when applied to seed.csv sees incremental model
--   grow in size while not (necessarily) diverging from the seed itself.
-
-- insert two new rows, both of which should be in incremental model
--   with any unique columns
-insert into {schema}.seed
-    (state, county, city, last_visit_date)
-values ('WA','King','Seattle','2022-02-01');
-
-insert into {schema}.seed
-    (state, county, city, last_visit_date)
-values ('CA','Los Angeles','Los Angeles','2022-02-01');
--- a/test/integration/076_incremental_unique_id_test/seeds/duplicate_insert.sql
+++ b/test/integration/076_incremental_unique_id_test/seeds/duplicate_insert.sql
@@ -1,9 +0,0 @@
-- Insert statement which when applied to seed.csv triggers the inplace
--   overwrite strategy of incremental models. Seed and incremental model
--   diverge.
-
-- insert new row, which should not be in incremental model
--  with primary or first three columns unique
-insert into {schema}.seed
-    (state, county, city, last_visit_date)
-values ('CT','Hartford','Hartford','2022-02-14');
--- a/test/integration/076_incremental_unique_id_test/seeds/seed.csv
+++ b/test/integration/076_incremental_unique_id_test/seeds/seed.csv
@@ -1,7 +0,0 @@
-state,county,city,last_visit_date
-CT,Hartford,Hartford,2020-09-23
-MA,Suffolk,Boston,2020-02-12
-NJ,Mercer,Trenton,2022-01-01
-NY,Kings,Brooklyn,2021-04-02
-NY,New York,Manhattan,2021-04-01
-PA,Philadelphia,Philadelphia,2021-05-21
--- a/test/integration/076_incremental_unique_id_test/test_incremental_unique_id.py
+++ b/test/integration/076_incremental_unique_id_test/test_incremental_unique_id.py
@@ -1,295 +0,0 @@
-from dbt.contracts.results import RunStatus
-from test.integration.base import DBTIntegrationTest, use_profile
-from collections import namedtuple
-from pathlib import Path
-
-
-TestResults = namedtuple(
-    'TestResults',
-    ['seed_count', 'model_count', 'seed_rows', 'inc_test_model_count',
-     'opt_model_count', 'relation'],
-)
-
-
-class TestIncrementalUniqueKeyBase(DBTIntegrationTest):
-    @property
-    def schema(self):
-        return 'incremental_unique_key'
-
-    @property
-    def models(self):
-        return 'models'
-
-    def update_incremental_model(self, incremental_model):
-        '''update incremental model after the seed table has been updated'''
-        model_result_set = self.run_dbt(['run', '--select', incremental_model])
-        return len(model_result_set)
-
-    def setup_test(self, seed, incremental_model, update_sql_file):
-        '''build a test case and return values for assertions
-        [INFO] Models must be in place to test incremental model
-        construction and merge behavior. Database touches are side
-        effects to extract counts (which speak to health of unique keys).'''
-        #idempotently create some number of seeds and incremental models'''
-        seed_count = len(self.run_dbt(
-            ['seed', '--select', seed, '--full-refresh']
-        ))
-        model_count = len(self.run_dbt(
-            ['run', '--select', incremental_model, '--full-refresh']
-        ))
-
-        # update seed in anticipation of incremental model update
-        row_count_query = 'select * from {}.{}'.format(
-            self.unique_schema(),
-            seed
-        )
-        self.run_sql_file(Path('seeds') / Path(update_sql_file + '.sql'))
-        seed_rows = len(self.run_sql(row_count_query, fetch='all'))
-
-        # propagate seed state to incremental model according to unique keys
-        inc_test_model_count = self.update_incremental_model(
-            incremental_model=incremental_model
-        )
-
-        return (seed_count, model_count, seed_rows, inc_test_model_count)
-
-    def test_scenario_correctness(self, expected_fields, test_case_fields):
-        '''Invoke assertions to verify correct build functionality'''
-        # 1. test seed(s) should build afresh
-        self.assertEqual(
-            expected_fields.seed_count, test_case_fields.seed_count
-        )
-        # 2. test model(s) should build afresh
-        self.assertEqual(
-            expected_fields.model_count, test_case_fields.model_count
-        )
-        # 3. seeds should have intended row counts post update
-        self.assertEqual(
-            expected_fields.seed_rows, test_case_fields.seed_rows
-        )
-        # 4. incremental test model(s) should be updated
-        self.assertEqual(
-            expected_fields.inc_test_model_count,
-            test_case_fields.inc_test_model_count
-        )
-        # 5. extra incremental model(s) should be built; optional since
-        #   comparison may be between an incremental model and seed
-        if (expected_fields.opt_model_count and
-            test_case_fields.opt_model_count):
-            self.assertEqual(
-                expected_fields.opt_model_count,
-                test_case_fields.opt_model_count
-            )
-        # 6. result table should match intended result set (itself a relation)
-        self.assertTablesEqual(
-            expected_fields.relation, test_case_fields.relation
-        )
-
-    def stub_expected_fields(
-        self, relation, seed_rows, opt_model_count=None
-    ):
-        return TestResults(
-            seed_count=1, model_count=1, seed_rows=seed_rows,
-            inc_test_model_count=1, opt_model_count=opt_model_count,
-            relation=relation
-        )
-
-    def fail_to_build_inc_missing_unique_key_column(self, incremental_model_name):
-        '''should pass back error state when trying build an incremental
-           model whose unique key or keylist includes a column missing
-           from the incremental model'''
-        seed_count = len(self.run_dbt(
-            ['seed', '--select', 'seed', '--full-refresh']
-        ))
-        # unique keys are not applied on first run, so two are needed
-        self.run_dbt(
-            ['run', '--select', incremental_model_name, '--full-refresh'],
-            expect_pass=True
-        )
-        run_result = self.run_dbt(
-            ['run', '--select', incremental_model_name],
-            expect_pass=False
-        ).results[0]
-
-        return run_result.status, run_result.message
-
-
-class TestIncrementalWithoutUniqueKey(TestIncrementalUniqueKeyBase):
-    @use_profile('postgres')
-    def test__postgres_no_unique_keys(self):
-        '''with no unique keys, seed and model should match'''
-        seed='seed'
-        seed_rows=8
-        incremental_model='no_unique_key'
-        update_sql_file='add_new_rows'
-
-        expected_fields = self.stub_expected_fields(
-            relation=seed, seed_rows=seed_rows
-        )
-        test_case_fields = TestResults(
-            *self.setup_test(seed, incremental_model, update_sql_file),
-            opt_model_count=None, relation=incremental_model
-        )
-
-        self.test_scenario_correctness(expected_fields, test_case_fields)
-
-
-class TestIncrementalStrUniqueKey(TestIncrementalUniqueKeyBase):
-    @use_profile('postgres')
-    def test__postgres_empty_str_unique_key(self):
-        '''with empty string for unique key, seed and model should match'''
-        seed='seed'
-        seed_rows=8
-        incremental_model='empty_str_unique_key'
-        update_sql_file='add_new_rows'
-
-        expected_fields = self.stub_expected_fields(
-            relation=seed, seed_rows=seed_rows
-        )
-        test_case_fields = TestResults(
-            *self.setup_test(seed, incremental_model, update_sql_file),
-            opt_model_count=None, relation=incremental_model
-        )
-
-        self.test_scenario_correctness(expected_fields, test_case_fields)
-
-    @use_profile('postgres')
-    def test__postgres_one_unique_key(self):
-        '''with one unique key, model will overwrite existing row'''
-        seed='seed'
-        seed_rows=7
-        incremental_model='str_unique_key'
-        update_sql_file='duplicate_insert'
-        expected_model='one_str__overwrite'
-
-        expected_fields = self.stub_expected_fields(
-            relation=expected_model, seed_rows=seed_rows, opt_model_count=1
-        )
-        test_case_fields = TestResults(
-            *self.setup_test(seed, incremental_model, update_sql_file),
-            opt_model_count=self.update_incremental_model(expected_model),
-            relation=incremental_model
-        )
-
-        self.test_scenario_correctness(expected_fields, test_case_fields)
-
-    @use_profile('postgres')
-    def test__postgres_bad_unique_key(self):
-        '''expect compilation error from unique key not being a column'''
-
-        (status, exc) = self.fail_to_build_inc_missing_unique_key_column(
-            incremental_model_name='not_found_unique_key'
-        )
-
-        self.assertEqual(status, RunStatus.Error)
-        self.assertTrue("thisisnotacolumn" in exc.lower())
-
-
-class TestIncrementalListUniqueKey(TestIncrementalUniqueKeyBase):
-    @use_profile('postgres')
-    def test__postgres_empty_unique_key_list(self):
-        '''with no unique keys, seed and model should match'''
-        seed='seed'
-        seed_rows=8
-        incremental_model='empty_unique_key_list'
-        update_sql_file='add_new_rows'
-
-        expected_fields = self.stub_expected_fields(
-            relation=seed, seed_rows=seed_rows
-        )
-        test_case_fields = TestResults(
-            *self.setup_test(seed, incremental_model, update_sql_file),
-            opt_model_count=None, relation=incremental_model
-        )
-
-        self.test_scenario_correctness(expected_fields, test_case_fields)
-
-    @use_profile('postgres')
-    def test__postgres_unary_unique_key_list(self):
-        '''with one unique key, model will overwrite existing row'''
-        seed='seed'
-        seed_rows=7
-        incremental_model='unary_unique_key_list'
-        update_sql_file='duplicate_insert'
-        expected_model='unique_key_list__inplace_overwrite'
-
-        expected_fields = self.stub_expected_fields(
-            relation=expected_model, seed_rows=seed_rows, opt_model_count=1
-        )
-        test_case_fields = TestResults(
-            *self.setup_test(seed, incremental_model, update_sql_file),
-            opt_model_count=self.update_incremental_model(expected_model),
-            relation=incremental_model
-        )
-
-        self.test_scenario_correctness(expected_fields, test_case_fields)
-
-    @use_profile('postgres')
-    def test__postgres_duplicated_unary_unique_key_list(self):
-        '''with two of the same unique key, model will overwrite existing row'''
-        seed='seed'
-        seed_rows=7
-        incremental_model='duplicated_unary_unique_key_list'
-        update_sql_file='duplicate_insert'
-        expected_model='unique_key_list__inplace_overwrite'
-
-        expected_fields = self.stub_expected_fields(
-            relation=expected_model, seed_rows=seed_rows, opt_model_count=1
-        )
-        test_case_fields = TestResults(
-            *self.setup_test(seed, incremental_model, update_sql_file),
-            opt_model_count=self.update_incremental_model(expected_model),
-            relation=incremental_model
-        )
-
-        self.test_scenario_correctness(expected_fields, test_case_fields)
-
-    @use_profile('postgres')
-    def test__postgres_trinary_unique_key_list(self):
-        '''with three unique keys, model will overwrite existing row'''
-        seed='seed'
-        seed_rows=7
-        incremental_model='trinary_unique_key_list'
-        update_sql_file='duplicate_insert'
-        expected_model='unique_key_list__inplace_overwrite'
-
-        expected_fields = self.stub_expected_fields(
-            relation=expected_model, seed_rows=seed_rows, opt_model_count=1
-        )
-        test_case_fields = TestResults(
-            *self.setup_test(seed, incremental_model, update_sql_file),
-            opt_model_count=self.update_incremental_model(expected_model),
-            relation=incremental_model
-        )
-
-        self.test_scenario_correctness(expected_fields, test_case_fields)
-
-    @use_profile('postgres')
-    def test__postgres_trinary_unique_key_list_no_update(self):
-        '''even with three unique keys, adding distinct rows to seed does not
-           cause seed and model to diverge'''
-        seed='seed'
-        seed_rows=8
-        incremental_model='nontyped_trinary_unique_key_list'
-        update_sql_file='add_new_rows'
-
-        expected_fields = self.stub_expected_fields(
-            relation=seed, seed_rows=seed_rows
-        )
-        test_case_fields = TestResults(
-            *self.setup_test(seed, incremental_model, update_sql_file),
-            opt_model_count=None, relation=incremental_model
-        )
-
-        self.test_scenario_correctness(expected_fields, test_case_fields)
-
-    @use_profile('postgres')
-    def test__postgres_bad_unique_key_list(self):
-        '''expect compilation error from unique key not being a column'''
-
-        (status, exc) = self.fail_to_build_inc_missing_unique_key_column(
-            incremental_model_name='not_found_unique_key_list'
-        )
-
-        self.assertEqual(status, RunStatus.Error)
-        self.assertTrue("thisisnotacolumn" in exc.lower())
--- a/tests/adapter/dbt/tests/adapter/incremental/test_incremental_unique_id.py
+++ b/tests/adapter/dbt/tests/adapter/incremental/test_incremental_unique_id.py
@@ -0,0 +1,556 @@
+import pytest
+from dbt.tests.util import run_dbt
+from dbt.tests.tables import TableComparison
+from dbt.contracts.results import RunStatus
+from collections import namedtuple
+from pathlib import Path
+
+models__trinary_unique_key_list_sql = """
+-- a multi-argument unique key list should see overwriting on rows in the model
+--   where all unique key fields apply
+
+{{
+    config(
+        materialized='incremental',
+        unique_key=['state', 'county', 'city']
+    )
+}}
+
+select
+    state::varchar(2) as state,
+    county::varchar(12) as county,
+    city::varchar(12) as city,
+    last_visit_date::date as last_visit_date
+from {{ ref('seed') }}
+
+{% if is_incremental() %}
+    where last_visit_date > (select max(last_visit_date) from {{ this }})
+{% endif %}
+
+"""
+
+models__nontyped_trinary_unique_key_list_sql = """
+-- a multi-argument unique key list should see overwriting on rows in the model
+--   where all unique key fields apply
+--   N.B. needed for direct comparison with seed
+
+{{
+    config(
+        materialized='incremental',
+        unique_key=['state', 'county', 'city']
+    )
+}}
+
+select
+    state as state,
+    county as county,
+    city as city,
+    last_visit_date as last_visit_date
+from {{ ref('seed') }}
+
+{% if is_incremental() %}
+    where last_visit_date > (select max(last_visit_date) from {{ this }})
+{% endif %}
+
+"""
+
+models__unary_unique_key_list_sql = """
+-- a one argument unique key list should result in overwritting semantics for
+--   that one matching field
+
+{{
+    config(
+        materialized='incremental',
+        unique_key=['state']
+    )
+}}
+
+select
+    state::varchar(2) as state,
+    county::varchar(12) as county,
+    city::varchar(12) as city,
+    last_visit_date::date as last_visit_date
+from {{ ref('seed') }}
+
+{% if is_incremental() %}
+    where last_visit_date > (select max(last_visit_date) from {{ this }})
+{% endif %}
+
+"""
+
+models__not_found_unique_key_sql = """
+-- a model with a unique key not found in the table itself will error out
+
+{{
+    config(
+        materialized='incremental',
+        unique_key='thisisnotacolumn'
+    )
+}}
+
+select
+    *
+from {{ ref('seed') }}
+
+{% if is_incremental() %}
+    where last_visit_date > (select max(last_visit_date) from {{ this }})
+{% endif %}
+
+"""
+
+models__empty_unique_key_list_sql = """
+-- model with empty list unique key should build normally
+
+{{
+    config(
+        materialized='incremental',
+        unique_key=[]
+    )
+}}
+
+select * from {{ ref('seed') }}
+
+{% if is_incremental() %}
+    where last_visit_date > (select max(last_visit_date) from {{ this }})
+{% endif %}
+
+"""
+
+models__no_unique_key_sql = """
+-- no specified unique key should cause no special build behavior
+
+{{
+    config(
+        materialized='incremental'
+    )
+}}
+
+select
+    *
+from {{ ref('seed') }}
+
+{% if is_incremental() %}
+    where last_visit_date > (select max(last_visit_date) from {{ this }})
+{% endif %}
+
+"""
+
+models__empty_str_unique_key_sql = """
+-- ensure model with empty string unique key should build normally
+
+{{
+    config(
+        materialized='incremental',
+        unique_key=''
+    )
+}}
+
+select
+    *
+from {{ ref('seed') }}
+
+{% if is_incremental() %}
+    where last_visit_date > (select max(last_visit_date) from {{ this }})
+{% endif %}
+
+"""
+
+models__str_unique_key_sql = """
+-- a unique key with a string should trigger to overwrite behavior when
+--   the source has entries in conflict (i.e. more than one row per unique key
+--   combination)
+
+{{
+    config(
+        materialized='incremental',
+        unique_key='state'
+    )
+}}
+
+select
+    state::varchar(2) as state,
+    county::varchar(12) as county,
+    city::varchar(12) as city,
+    last_visit_date::date as last_visit_date
+from {{ ref('seed') }}
+
+{% if is_incremental() %}
+    where last_visit_date > (select max(last_visit_date) from {{ this }})
+{% endif %}
+
+"""
+
+models__duplicated_unary_unique_key_list_sql = """
+{{
+    config(
+        materialized='incremental',
+        unique_key=['state', 'state']
+    )
+}}
+
+select
+    state::varchar(2) as state,
+    county::varchar(12) as county,
+    city::varchar(12) as city,
+    last_visit_date::date as last_visit_date
+from {{ ref('seed') }}
+
+{% if is_incremental() %}
+    where last_visit_date > (select max(last_visit_date) from {{ this }})
+{% endif %}
+
+"""
+
+models__not_found_unique_key_list_sql = """
+-- a unique key list with any element not in the model itself should error out
+
+{{
+    config(
+        materialized='incremental',
+        unique_key=['state', 'thisisnotacolumn']
+    )
+}}
+
+select * from {{ ref('seed') }}
+
+"""
+
+models__expected__one_str__overwrite_sql = """
+{{
+    config(
+        materialized='table'
+    )
+}}
+
+select
+    'CT'::varchar(2) as state,
+    'Hartford'::varchar(12) as county,
+    'Hartford'::varchar(12) as city,
+    '2022-02-14'::date as last_visit_date
+union all
+select 'MA'::varchar(2),'Suffolk'::varchar(12),'Boston'::varchar(12),'2020-02-12'::date
+union all
+select 'NJ'::varchar(2),'Mercer'::varchar(12),'Trenton'::varchar(12),'2022-01-01'::date
+union all
+select 'NY'::varchar(2),'Kings'::varchar(12),'Brooklyn'::varchar(12),'2021-04-02'::date
+union all
+select 'NY'::varchar(2),'New York'::varchar(12),'Manhattan'::varchar(12),'2021-04-01'::date
+union all
+select 'PA'::varchar(2),'Philadelphia'::varchar(12),'Philadelphia'::varchar(12),'2021-05-21'::date
+
+"""
+
+models__expected__unique_key_list__inplace_overwrite_sql = """
+{{
+    config(
+        materialized='table'
+    )
+}}
+
+select
+    'CT'::varchar(2) as state,
+    'Hartford'::varchar(12) as county,
+    'Hartford'::varchar(12) as city,
+    '2022-02-14'::date as last_visit_date
+union all
+select 'MA'::varchar(2),'Suffolk'::varchar(12),'Boston'::varchar(12),'2020-02-12'::date
+union all
+select 'NJ'::varchar(2),'Mercer'::varchar(12),'Trenton'::varchar(12),'2022-01-01'::date
+union all
+select 'NY'::varchar(2),'Kings'::varchar(12),'Brooklyn'::varchar(12),'2021-04-02'::date
+union all
+select 'NY'::varchar(2),'New York'::varchar(12),'Manhattan'::varchar(12),'2021-04-01'::date
+union all
+select 'PA'::varchar(2),'Philadelphia'::varchar(12),'Philadelphia'::varchar(12),'2021-05-21'::date
+
+"""
+
+seeds__duplicate_insert_sql = """
+-- Insert statement which when applied to seed.csv triggers the inplace
+--   overwrite strategy of incremental models. Seed and incremental model
+--   diverge.
+
+-- insert new row, which should not be in incremental model
+--  with primary or first three columns unique
+insert into {schema}.seed
+    (state, county, city, last_visit_date)
+values ('CT','Hartford','Hartford','2022-02-14');
+
+"""
+
+seeds__seed_csv = """state,county,city,last_visit_date
+CT,Hartford,Hartford,2020-09-23
+MA,Suffolk,Boston,2020-02-12
+NJ,Mercer,Trenton,2022-01-01
+NY,Kings,Brooklyn,2021-04-02
+NY,New York,Manhattan,2021-04-01
+PA,Philadelphia,Philadelphia,2021-05-21
+"""
+
+seeds__add_new_rows_sql = """
+-- Insert statement which when applied to seed.csv sees incremental model
+--   grow in size while not (necessarily) diverging from the seed itself.
+
+-- insert two new rows, both of which should be in incremental model
+--   with any unique columns
+insert into {schema}.seed
+    (state, county, city, last_visit_date)
+values ('WA','King','Seattle','2022-02-01');
+
+insert into {schema}.seed
+    (state, county, city, last_visit_date)
+values ('CA','Los Angeles','Los Angeles','2022-02-01');
+
+"""
+
+
+ResultHolder = namedtuple(
+    "ResultHolder",
+    [
+        "seed_count",
+        "model_count",
+        "seed_rows",
+        "inc_test_model_count",
+        "opt_model_count",
+        "relation",
+    ],
+)
+
+
+class BaseIncrementalUniqueKey:
+    """Shared scenarios for incremental models configured with ``unique_key``.
+
+    Each scenario builds the seed, fully refreshes one incremental model,
+    applies an insert script to the seed table, re-runs the model
+    incrementally and compares the result with an expected relation.
+    """
+
+    @pytest.fixture(scope="class")
+    def models(self):
+        """Map model file names to their SQL, including the ``expected`` models."""
+        return {
+            "trinary_unique_key_list.sql": models__trinary_unique_key_list_sql,
+            "nontyped_trinary_unique_key_list.sql": models__nontyped_trinary_unique_key_list_sql,
+            "unary_unique_key_list.sql": models__unary_unique_key_list_sql,
+            "not_found_unique_key.sql": models__not_found_unique_key_sql,
+            "empty_unique_key_list.sql": models__empty_unique_key_list_sql,
+            "no_unique_key.sql": models__no_unique_key_sql,
+            "empty_str_unique_key.sql": models__empty_str_unique_key_sql,
+            "str_unique_key.sql": models__str_unique_key_sql,
+            "duplicated_unary_unique_key_list.sql": models__duplicated_unary_unique_key_list_sql,
+            "not_found_unique_key_list.sql": models__not_found_unique_key_list_sql,
+            "expected": {
+                "one_str__overwrite.sql": models__expected__one_str__overwrite_sql,
+                "unique_key_list__inplace_overwrite.sql": models__expected__unique_key_list__inplace_overwrite_sql,
+            },
+        }
+
+    @pytest.fixture(scope="class")
+    def seeds(self):
+        """Map seed-directory file names to their contents (seed CSV plus insert scripts)."""
+        return {
+            "duplicate_insert.sql": seeds__duplicate_insert_sql,
+            "seed.csv": seeds__seed_csv,
+            "add_new_rows.sql": seeds__add_new_rows_sql,
+        }
+
+    def update_incremental_model(self, incremental_model):
+        """Run ``incremental_model`` without a full refresh.
+
+        Intended to be called after the seed table has been updated.
+
+        Returns:
+            The number of results returned by the dbt run.
+        """
+        model_result_set = run_dbt(["run", "--select", incremental_model])
+        return len(model_result_set)
+
+    def get_test_fields(
+        self, project, seed, incremental_model, update_sql_file, opt_model_count=None
+    ):
+        """Build one scenario and return the observed values for assertions.
+
+        Models must be in place to test incremental model construction and
+        merge behavior. Database touches are side effects used to extract
+        counts (which speak to the health of unique keys).
+
+        Args:
+            project: project fixture; supplies ``test_schema``, ``run_sql``
+                and ``run_sql_file``.
+            seed: name of the seed to build and then modify.
+            incremental_model: name of the incremental model under test.
+            update_sql_file: stem of the ``.sql`` file under ``seeds`` that
+                modifies the seed table.
+            opt_model_count: optional count for an extra model built by the
+                caller; passed through unchanged.
+
+        Returns:
+            A ``ResultHolder`` with the observed counts; its ``relation`` is
+            the name of the incremental model.
+        """
+        # idempotently create the seed and the incremental model
+        seed_count = len(run_dbt(["seed", "--select", seed, "--full-refresh"]))
+        model_count = len(run_dbt(["run", "--select", incremental_model, "--full-refresh"]))
+
+        # update seed in anticipation of incremental model update
+        row_count_query = "select * from {}.{}".format(project.test_schema, seed)
+        project.run_sql_file(Path("seeds") / Path(update_sql_file + ".sql"))
+        seed_rows = len(project.run_sql(row_count_query, fetch="all"))
+
+        # propagate seed state to incremental model according to unique keys
+        inc_test_model_count = self.update_incremental_model(incremental_model=incremental_model)
+
+        return ResultHolder(
+            seed_count=seed_count,
+            model_count=model_count,
+            seed_rows=seed_rows,
+            inc_test_model_count=inc_test_model_count,
+            opt_model_count=opt_model_count,
+            relation=incremental_model,
+        )
+
+    def check_scenario_correctness(self, expected_fields, test_case_fields, project):
+        """Invoke assertions to verify correct build functionality.
+
+        Args:
+            expected_fields: ``ResultHolder`` with the expected values.
+            test_case_fields: ``ResultHolder`` with the observed values.
+            project: project fixture; supplies the adapter, schema and
+                database used for the table comparison.
+        """
+        # 1. test seed(s) should build afresh
+        assert expected_fields.seed_count == test_case_fields.seed_count
+        # 2. test model(s) should build afresh
+        assert expected_fields.model_count == test_case_fields.model_count
+        # 3. seeds should have intended row counts post update
+        assert expected_fields.seed_rows == test_case_fields.seed_rows
+        # 4. incremental test model(s) should be updated
+        assert expected_fields.inc_test_model_count == test_case_fields.inc_test_model_count
+        # 5. extra incremental model(s) should be built; optional since
+        #   comparison may be between an incremental model and seed.
+        #   Compare against None rather than relying on truthiness so that
+        #   a count of 0 is still checked instead of silently skipped.
+        if (
+            expected_fields.opt_model_count is not None
+            and test_case_fields.opt_model_count is not None
+        ):
+            assert expected_fields.opt_model_count == test_case_fields.opt_model_count
+        # 6. result table should match intended result set (itself a relation)
+        table_comp = TableComparison(
+            adapter=project.adapter, unique_schema=project.test_schema, database=project.database
+        )
+        table_comp.assert_tables_equal(expected_fields.relation, test_case_fields.relation)
+
+    def get_expected_fields(self, relation, seed_rows, opt_model_count=None):
+        """Return the expected ``ResultHolder`` for a scenario.
+
+        Every build count is expected to be 1; only the relation to compare
+        against, the seed row count and the optional extra-model count vary.
+        """
+        return ResultHolder(
+            seed_count=1,
+            model_count=1,
+            seed_rows=seed_rows,
+            inc_test_model_count=1,
+            opt_model_count=opt_model_count,
+            relation=relation,
+        )
+
+    def fail_to_build_inc_missing_unique_key_column(self, incremental_model_name):
+        """Return the error state of a failing incremental run.
+
+        Used when trying to build an incremental model whose unique key or
+        key list includes a column missing from the incremental model.
+
+        Returns:
+            A ``(status, message)`` tuple taken from the first result of the
+            second (incremental) run.
+        """
+        run_dbt(["seed", "--select", "seed", "--full-refresh"])
+        # unique keys are not applied on first run, so two are needed
+        run_dbt(
+            ["run", "--select", incremental_model_name, "--full-refresh"],
+            expect_pass=True,
+        )
+        run_result = run_dbt(
+            ["run", "--select", incremental_model_name], expect_pass=False
+        ).results[0]
+
+        return run_result.status, run_result.message
+
+    # no unique_key test
+    def test__no_unique_keys(self, project):
+        """with no unique keys, seed and model should match"""
+
+        expected_fields = self.get_expected_fields(relation="seed", seed_rows=8)
+        test_case_fields = self.get_test_fields(
+            project, seed="seed", incremental_model="no_unique_key", update_sql_file="add_new_rows"
+        )
+        self.check_scenario_correctness(expected_fields, test_case_fields, project)
+
+    # unique_key as str tests
+    def test__empty_str_unique_key(self, project):
+        """with empty string for unique key, seed and model should match"""
+
+        expected_fields = self.get_expected_fields(relation="seed", seed_rows=8)
+        test_case_fields = self.get_test_fields(
+            project,
+            seed="seed",
+            incremental_model="empty_str_unique_key",
+            update_sql_file="add_new_rows",
+        )
+        self.check_scenario_correctness(expected_fields, test_case_fields, project)
+
+    def test__one_unique_key(self, project):
+        """with one unique key, model will overwrite existing row"""
+
+        expected_fields = self.get_expected_fields(
+            relation="one_str__overwrite", seed_rows=7, opt_model_count=1
+        )
+        test_case_fields = self.get_test_fields(
+            project,
+            seed="seed",
+            incremental_model="str_unique_key",
+            update_sql_file="duplicate_insert",
+            opt_model_count=self.update_incremental_model("one_str__overwrite"),
+        )
+        self.check_scenario_correctness(expected_fields, test_case_fields, project)
+
+    def test__bad_unique_key(self, project):
+        """expect an error naming the unique key that is not a column"""
+
+        (status, message) = self.fail_to_build_inc_missing_unique_key_column(
+            incremental_model_name="not_found_unique_key"
+        )
+
+        assert status == RunStatus.Error
+        assert "thisisnotacolumn" in message.lower()
+
+    # test unique_key as list
+    def test__empty_unique_key_list(self, project):
+        """with an empty unique key list, seed and model should match"""
+
+        expected_fields = self.get_expected_fields(relation="seed", seed_rows=8)
+        test_case_fields = self.get_test_fields(
+            project,
+            seed="seed",
+            incremental_model="empty_unique_key_list",
+            update_sql_file="add_new_rows",
+        )
+        self.check_scenario_correctness(expected_fields, test_case_fields, project)
+
+    def test__unary_unique_key_list(self, project):
+        """with one unique key in a list, model will overwrite existing row"""
+
+        expected_fields = self.get_expected_fields(
+            relation="unique_key_list__inplace_overwrite", seed_rows=7, opt_model_count=1
+        )
+        test_case_fields = self.get_test_fields(
+            project,
+            seed="seed",
+            incremental_model="unary_unique_key_list",
+            update_sql_file="duplicate_insert",
+            opt_model_count=self.update_incremental_model("unique_key_list__inplace_overwrite"),
+        )
+        self.check_scenario_correctness(expected_fields, test_case_fields, project)
+
+    def test__duplicated_unary_unique_key_list(self, project):
+        """with two of the same unique key, model will overwrite existing row"""
+
+        expected_fields = self.get_expected_fields(
+            relation="unique_key_list__inplace_overwrite", seed_rows=7, opt_model_count=1
+        )
+        test_case_fields = self.get_test_fields(
+            project,
+            seed="seed",
+            incremental_model="duplicated_unary_unique_key_list",
+            update_sql_file="duplicate_insert",
+            opt_model_count=self.update_incremental_model("unique_key_list__inplace_overwrite"),
+        )
+        self.check_scenario_correctness(expected_fields, test_case_fields, project)
+
+    def test__trinary_unique_key_list(self, project):
+        """with three unique keys, model will overwrite existing row"""
+
+        expected_fields = self.get_expected_fields(
+            relation="unique_key_list__inplace_overwrite", seed_rows=7, opt_model_count=1
+        )
+        test_case_fields = self.get_test_fields(
+            project,
+            seed="seed",
+            incremental_model="trinary_unique_key_list",
+            update_sql_file="duplicate_insert",
+            opt_model_count=self.update_incremental_model("unique_key_list__inplace_overwrite"),
+        )
+        self.check_scenario_correctness(expected_fields, test_case_fields, project)
+
+    def test__trinary_unique_key_list_no_update(self, project):
+        """even with three unique keys, adding distinct rows to seed does not
+        cause seed and model to diverge"""
+
+        expected_fields = self.get_expected_fields(relation="seed", seed_rows=8)
+        test_case_fields = self.get_test_fields(
+            project,
+            seed="seed",
+            incremental_model="nontyped_trinary_unique_key_list",
+            update_sql_file="add_new_rows",
+        )
+        self.check_scenario_correctness(expected_fields, test_case_fields, project)
+
+    def test__bad_unique_key_list(self, project):
+        """expect an error naming the unique key list entry that is not a column"""
+
+        (status, message) = self.fail_to_build_inc_missing_unique_key_column(
+            incremental_model_name="not_found_unique_key_list"
+        )
+
+        assert status == RunStatus.Error
+        assert "thisisnotacolumn" in message.lower()
+
+
+class TestIncrementalUniqueKey(BaseIncrementalUniqueKey):
+    """Concrete test class; adds nothing beyond what BaseIncrementalUniqueKey defines."""
--- a/tests/functional/permission/test_permissions.py
+++ b/tests/functional/permission/test_permissions.py
@@ -64,7 +64,6 @@ class TestPermissions:
        project,
    ):
        # now it should work!
-        # breakpoint()
        project.run_sql("grant create on database {} to noaccess".format(project.database))
        project.run_sql(
            'grant usage, create on schema "{}" to noaccess'.format(project.test_schema)
Author	SHA1	Message	Date
Kyle Wigley	eae14e1be7	use adapter to execute sql	2022-04-01 16:18:13 -04:00
Matthew McKnight	32f0a30b58	create incremental test directory in adapter zone	2022-04-01 09:21:43 -05:00
Matthew McKnight	f430efc56a	v2 based on feedback for base version of testing, plus small removal of leftover breakpoint	2022-03-31 17:07:23 -05:00
Matthew McKnight	0b263604a2	Merge branch 'main' of github.com:dbt-labs/dbt into mcknight/convert_unique_key	2022-03-30 16:10:15 -05:00
Matthew McKnight	9282b4cc7a	uncommenting seed_count	2022-03-30 09:57:02 -05:00
Matthew McKnight	b8f79149be	removed commented out code	2022-03-29 16:20:38 -05:00
Matthew McKnight	50c7ba1e92	remove older test_unique_key tests	2022-03-29 15:50:35 -05:00
Matthew McKnight	970d57d433	taking in chenyu's changes to fixtures	2022-03-28 16:47:13 -05:00
Matthew McKnight	ae12ccf2e8	moving tests to base class and inheriting in a simple class	2022-03-28 16:27:12 -05:00
Matthew McKnight	053910cb1b	removed unused fixture	2022-03-28 16:02:45 -05:00
Matthew McKnight	d3451a6041	minor changes to the bad_unique_key tests	2022-03-28 15:47:42 -05:00
Matthew McKnight	3dec58f592	moving non basic test up one directory to be more broadly part of adapter zone	2022-03-28 15:24:15 -05:00
Matthew McKnight	f8d93b0524	adding changelog entry	2022-03-28 15:08:41 -05:00
Matthew McKnight	bd15abf502	testing cause of failure	2022-03-28 11:33:42 -05:00
Matthew McKnight	1e52c9c134	Merge branch 'main' of github.com:dbt-labs/dbt into mcknight/convert_unique_key	2022-03-25 15:45:10 -05:00
Matthew McKnight	17b5d11c8b	init push up of converted unique_key tests	2022-03-25 11:48:25 -05:00