dbt-labs · soksamnanglim · Oct 4, 2023 · Oct 4, 2023 · Oct 4, 2023 · Oct 4, 2023
@@ -0,0 +1,6 @@
+kind: Features
+body: 'Add support for specifying groups and roles in grant statements'
+time: 2023-10-04T10:39:38.680813-07:00
+custom:
+  Author: soksamnanglim
+  Issue: "415"
@@ -57,7 +57,7 @@ To confirm you have correct `dbt-core` and adapter versions installed please run
 
 `dbt-redshift` contains [unit](https://github.com/dbt-labs/dbt-redshift/tree/main/tests/unit) and [functional](https://github.com/dbt-labs/dbt-redshift/tree/main/tests/functional) tests. Functional tests require testing against an actual Redshift warehouse. We have CI set up to test against a Redshift warehouse during PR checks.
 
-In order to run functional tests locally, you will need a `test.env` file in the root of the repository that contains credentials for your Redshift warehouse.
+In order to run functional tests locally, you will need a `test.env` file in the root of the repository that contains credentials for your Redshift warehouse. Your `test.env` must define every variable listed in `test.env.example` (including the test users, groups, and roles) for all the tests to pass.
 
 Note: This `test.env` file is git-ignored, but please be extra careful to never check in credentials or other sensitive information when developing. To create your `test.env` file, copy the provided example file, then supply your relevant credentials.
 

@@ -1,5 +1,19 @@
 .DEFAULT_GOAL:=help
 
+# Environment variable assignments for test/CI runs.
+# Every entry has the form VAR=$(if $(VAR),$(VAR),default): when VAR is already
+# set to a non-empty value that value is kept, otherwise the default is used.
+# NOTE(review): presumably prefixed onto test commands further down; the usage
+# is not visible in this hunk - confirm.
+CI_FLAGS =\
+	DBT_TEST_USER_1=$(if $(DBT_TEST_USER_1),$(DBT_TEST_USER_1),dbt_test_user_1)\
+	DBT_TEST_USER_2=$(if $(DBT_TEST_USER_2),$(DBT_TEST_USER_2),dbt_test_user_2)\
+	DBT_TEST_USER_3=$(if $(DBT_TEST_USER_3),$(DBT_TEST_USER_3),dbt_test_user_3)\
+	DBT_TEST_GROUP_1=$(if $(DBT_TEST_GROUP_1),$(DBT_TEST_GROUP_1),dbt_test_group_1)\
+	DBT_TEST_GROUP_2=$(if $(DBT_TEST_GROUP_2),$(DBT_TEST_GROUP_2),dbt_test_group_2)\
+	DBT_TEST_GROUP_3=$(if $(DBT_TEST_GROUP_3),$(DBT_TEST_GROUP_3),dbt_test_group_3)\
+	DBT_TEST_ROLE_1=$(if $(DBT_TEST_ROLE_1),$(DBT_TEST_ROLE_1),dbt_test_role_1)\
+	DBT_TEST_ROLE_2=$(if $(DBT_TEST_ROLE_2),$(DBT_TEST_ROLE_2),dbt_test_role_2)\
+	DBT_TEST_ROLE_3=$(if $(DBT_TEST_ROLE_3),$(DBT_TEST_ROLE_3),dbt_test_role_3)\
+	RUSTFLAGS=$(if $(RUSTFLAGS),$(RUSTFLAGS),"-D warnings")\
+	LOG_DIR=$(if $(LOG_DIR),$(LOG_DIR),./logs)\
+	DBT_LOG_FORMAT=$(if $(DBT_LOG_FORMAT),$(DBT_LOG_FORMAT),json)
+
 .PHONY: dev
 dev: ## Installs adapter in develop mode along with development dependencies
 	@\

@@ -187,3 +187,93 @@ def generate_python_submission_response(self, submission_result: Any) -> Adapter
     def debug_query(self):
         """Override for DebugTask method"""
         self.execute("select 1 as id")
+
+    # grant-related methods
+    @available
+    def standardize_grants_dict(self, grants_table):
+        """
+        Override for standardize_grants_dict.
+
+        Folds the rows of ``grants_table`` into a nested mapping of
+        privilege -> grantee type -> list of grantees. Every row is read
+        through its "grantee_type", "grantee" and "privilege_type" keys, and
+        grantees keep the order in which their rows appear.
+        """
+        by_privilege = {}  # Dict[str, Dict[str, List[str]]]
+        for record in grants_table:
+            kind = record["grantee_type"]
+            name = record["grantee"]
+            priv = record["privilege_type"]
+            # create the privilege and grantee-type buckets on first sight
+            by_privilege.setdefault(priv, {}).setdefault(kind, []).append(name)
+
+        return by_privilege
+
+    @available
+    def diff_of_two_nested_dicts(self, dict_a, dict_b):
+        """
+        Given two dictionaries of type Dict[str, Dict[str, List[str]]]:
+            dict_a = {'select': {'user': ['USER_1', 'user_2']}, 'INSERT': {'group': ['group_1']}}
+            dict_b = {'SELECT': {'user': ['user_1']}}
+        Return the same dictionary representation of dict_a MINUS dict_b,
+        performing a case-insensitive comparison between the strings in each
+        (top-level keys, sub-keys and list values alike).
+        All keys and values returned will be in the original case of dict_a.
+            returns {'select': {'user': ['user_2']}, 'INSERT': {'group': ['group_1']}}
+
+        Sub-keys whose remaining list is empty, and top-level keys left with no
+        sub-keys, are omitted. The returned lists are new objects, so mutating
+        the result never touches dict_a.
+        """
+        # Casefold dict_b once so membership tests are case-insensitive on BOTH
+        # sides; folding only dict_a's side misses matches whenever dict_b
+        # carries upper-case names.
+        folded_b = {}
+        for key_b, sub_dict_b in dict_b.items():
+            folded_sub = folded_b.setdefault(key_b.casefold(), {})
+            for sub_key_b, values_b in sub_dict_b.items():
+                folded_sub.setdefault(sub_key_b.casefold(), set()).update(
+                    value.casefold() for value in (values_b or [])
+                )
+
+        dict_diff = {}
+        for key_a, sub_dict_a in dict_a.items():
+            # a key missing from dict_b behaves like an empty sub-dictionary
+            sub_b = folded_b.get(key_a.casefold(), {})
+            for sub_key_a, values_a in sub_dict_a.items():
+                seen_in_b = sub_b.get(sub_key_a.casefold(), set())
+                remaining = [v for v in (values_a or []) if v.casefold() not in seen_in_b]
+                if remaining:
+                    dict_diff.setdefault(key_a, {})[sub_key_a] = remaining
+
+        return dict_diff
+
+    @available
+    def process_grant_dicts(self, unknown_dict):
+        """
+        Normalize a grants config into Dict[str, Dict[str, List[str]]]
+        (privilege -> grantee type -> grantee names).
+
+        Each privilege's value may be either:
+        - List[str]: plain grantee names, which are filed under "user"
+        - List[Dict[str, List[str]]]: one or more mappings of grantee type
+          ("user", "group", "role", ...) to names; all mappings are merged
+
+        The shape is decided per entry rather than from the first privilege
+        only, so an empty first value can no longer misclassify the rest, and
+        every dict in a list is honoured instead of just the first one.
+        Empty grantee lists, empty names and privileges left without any
+        grantee are dropped. An empty or None input returns {}.
+        """
+        processed = {}
+        for privilege, entries in (unknown_dict or {}).items():
+            # tolerate a bare string / bare mapping that was not wrapped in a list
+            if isinstance(entries, (str, dict)):
+                entries = [entries]
+
+            by_type = {}
+            for entry in entries or []:
+                if isinstance(entry, dict):
+                    for grantee_type, grantees in entry.items():
+                        if isinstance(grantees, str):
+                            grantees = [grantees]
+                        if grantees:
+                            by_type.setdefault(grantee_type, []).extend(grantees)
+                elif entry:
+                    # a plain name carries no type information: treat it as a user
+                    by_type.setdefault("user", []).append(entry)
+
+            if by_type:
+                processed[privilege] = by_type
+
+        return processed
@@ -1,5 +1,42 @@
-{% macro redshift__get_show_grant_sql(relation) %}
+{# ------- DCL STATEMENT TEMPLATES ------- #}
+
+{%- macro redshift__get_grant_sql(relation, privilege, grantee_dict) -%}
+    {#-- generates one grant statement covering every user, group, and role in grantee_dict --#}
+    {#-- grantee_dict maps a grantee type ('user', 'group', 'role') to a list of names --#}
+    {#-- users are listed bare; groups and roles are prefixed with their keyword --#}
+    {%- set grantee_prefixes = {'user': '', 'group': 'group ', 'role': 'role '} -%}
+    {#-- collect the clauses first so commas only ever appear BETWEEN grantees, --#}
+    {#-- even when a grantee type is unknown or its list is empty --#}
+    {%- set grantee_clauses = [] -%}
+    {%- for grantee_type, grantees in grantee_dict.items() -%}
+        {%- if grantee_type in grantee_prefixes and grantees -%}
+            {%- for grantee in grantees -%}
+                {%- do grantee_clauses.append(grantee_prefixes[grantee_type] ~ grantee) -%}
+            {%- endfor -%}
+        {%- endif -%}
+    {%- endfor -%}
+    grant {{ privilege }} on {{ relation }} to {{ grantee_clauses | join(', ') }}
+{%- endmacro -%}
+
+{%- macro redshift__get_revoke_sql(relation, privilege, revokee_dict) -%}
+    {#-- generates one revoke statement covering every user, group, and role in revokee_dict --#}
+    {#-- revokee_dict maps a grantee type ('user', 'group', 'role') to a list of names --#}
+    {#-- users are listed bare; groups and roles are prefixed with their keyword --#}
+    {%- set revokee_prefixes = {'user': '', 'group': 'group ', 'role': 'role '} -%}
+    {#-- collect the clauses first so commas only ever appear BETWEEN revokees, --#}
+    {#-- even when a grantee type is unknown or its list is empty --#}
+    {%- set revokee_clauses = [] -%}
+    {%- for revokee_type, revokees in revokee_dict.items() -%}
+        {%- if revokee_type in revokee_prefixes and revokees -%}
+            {%- for revokee in revokees -%}
+                {%- do revokee_clauses.append(revokee_prefixes[revokee_type] ~ revokee) -%}
+            {%- endfor -%}
+        {%- endif -%}
+    {%- endfor -%}
+    revoke {{ privilege }} on {{ relation }} from {{ revokee_clauses | join(', ') }}
+{%- endmacro -%}
 
+
+{% macro redshift__get_show_grant_sql(relation) %}
+{#-- shows the privilege grants on a table for users, groups, and roles --#}
 with privileges as (
 
     -- valid options per https://docs.aws.amazon.com/redshift/latest/dg/r_HAS_TABLE_PRIVILEGE.html
@@ -16,6 +53,7 @@ with privileges as (
 )
 
 select
+    'user' as grantee_type,
     u.usename as grantee,
     p.privilege_type
 from pg_user u
@@ -24,4 +62,72 @@ where has_table_privilege(u.usename, '{{ relation }}', privilege_type)
     and u.usename != current_user
     and not u.usesuper
 
+union all
+-- check that group has table privilege
+select
+    'group' as grantee_type,
+    g.groname as grantee,
+    p.privilege_type
+from pg_group g
+cross join privileges p
+where exists(
+    select *
+    from information_schema.table_privileges tp
+    where tp.grantee=g.groname
+    and tp.table_schema=replace(split_part('{{ relation }}', '.', 2), '"', '')
+    and tp.table_name=replace(split_part('{{ relation }}', '.', 3), '"', '')
+    and LOWER(tp.privilege_type)=p.privilege_type
-    and tp.table_schema=replace(split_part('{{ relation }}', '.', 2), '"', '')
-    and tp.table_name=replace(split_part('{{ relation }}', '.', 3), '"', '')
+    and tp.table_schema = '{{ relation.schema }}'
+    and tp.table_name = '{{ relation.identifier }}'
-    and tp.table_schema=replace(split_part('{{ relation }}', '.', 2), '"', '')
-    and tp.table_name=replace(split_part('{{ relation }}', '.', 3), '"', '')
+    and tp.table_schema = '{{ relation.schema }}'
+    and tp.table_name = '{{ relation.identifier }}'
+)
+
+union all
+-- check that role has table privilege
+select
+    'role' as grantee_type,
+    r.role_name as grantee,
+    p.privilege_type
+from svv_roles r
+cross join privileges p
+where exists(
+    select *
+    from svv_relation_privileges rp
+    where rp.identity_name=r.role_name
+    and rp.namespace_name=replace(split_part('{{ relation }}', '.', 2), '"', '')
+    and rp.relation_name=replace(split_part('{{ relation }}', '.', 3), '"', '')
+    and LOWER(rp.privilege_type)=p.privilege_type
-    and rp.namespace_name=replace(split_part('{{ relation }}', '.', 2), '"', '')
-    and rp.relation_name=replace(split_part('{{ relation }}', '.', 3), '"', '')
+    and rp.namespace_name = '{{ relation.schema }}'
+    and rp.relation_name = '{{ relation.identifier }}'
-    and rp.namespace_name=replace(split_part('{{ relation }}', '.', 2), '"', '')
-    and rp.relation_name=replace(split_part('{{ relation }}', '.', 3), '"', '')
+    and rp.namespace_name = '{{ relation.schema }}'
+    and rp.relation_name = '{{ relation.identifier }}'
+)
+
+{% endmacro %}
+
+{% macro redshift__apply_grants(relation, grant_config, should_revoke=True) %}
+    {#-- Override for apply grants --#}
+    {#-- relation: the relation the privileges are applied to --#}
+    {#-- grant_config: configured grants, normalized below via adapter.process_grant_dicts --#}
+    {#-- should_revoke: when true, compare against the current grants and only apply the differences --#}
+    {#-- If grant_config is {} or None, this is a no-op --#}
+    {% if grant_config %}
+        {#-- change grant_config to Dict[str, Dict[str, List[str]] format --#}
+        {% set grant_config = adapter.process_grant_dicts(grant_config) %}
+
+        {% if should_revoke %}
+            {#-- We think that there is a chance that grants are carried over. --#}
+            {#-- Show the current grants for users, roles, and groups and calculate the diffs. --#}
+            {% set current_grants_table = run_query(get_show_grant_sql(relation)) %}
+            {% set current_grants_dict = adapter.standardize_grants_dict(current_grants_table) %}
+            {#-- configured minus current = still to grant; current minus configured = to revoke --#}
+            {% set needs_granting = adapter.diff_of_two_nested_dicts(grant_config, current_grants_dict) %}
+            {% set needs_revoking = adapter.diff_of_two_nested_dicts(current_grants_dict, grant_config) %}
+            {% if not (needs_granting or needs_revoking) %}
+                {{ log('On ' ~ relation ~': All grants are in place, no revocation or granting needed.')}}
+            {% endif %}
+        {% else %}
+            {#-- We don't think there's any chance of previous grants having carried over. --#}
+            {#-- Jump straight to granting what the user has configured. --#}
+            {% set needs_revoking = {} %}
+            {% set needs_granting = grant_config %}
+        {% endif %}
+        {% if needs_granting or needs_revoking %}
+            {#-- revoke statements are placed ahead of grant statements in the combined list --#}
+            {% set revoke_statement_list = get_dcl_statement_list(relation, needs_revoking, get_revoke_sql) %}
+            {% set grant_statement_list = get_dcl_statement_list(relation, needs_granting, get_grant_sql) %}
+            {% set dcl_statement_list = revoke_statement_list + grant_statement_list %}
+            {% if dcl_statement_list %}
+                {{ call_dcl_statements(dcl_statement_list) }}
+            {% endif %}
+        {% endif %}
+    {% endif %}
 {% endmacro %}
@@ -1,4 +1,55 @@
 import pytest
+import os
+
+from dbt_common.exceptions import DbtDatabaseError
+
+# This is a hack to prevent the fixture from running more than once
+GRANTS_AND_ROLES_SETUP = False
+
+GROUPS = {
+    "DBT_TEST_GROUP_1": "dbt_test_group_1",
+    "DBT_TEST_GROUP_2": "dbt_test_group_2",
+    "DBT_TEST_GROUP_3": "dbt_test_group_3",
+}
+ROLES = {
+    "DBT_TEST_ROLE_1": "dbt_test_role_1",
+    "DBT_TEST_ROLE_2": "dbt_test_role_2",
+    "DBT_TEST_ROLE_3": "dbt_test_role_3",
+}
+
+
+def _create_if_missing(adapter, object_type, name):
+    """Run ``CREATE <object_type> <name>``, tolerating a database error such as "already exists"."""
+    statement = f"CREATE {object_type} {name}"
+    try:
+        print(statement)
+        adapter.execute(statement)
+    except DbtDatabaseError as exc:
+        # Expected when the group/role already exists. Echo the error so an
+        # unexpected failure (e.g. missing privileges) is visible in the output
+        # instead of being swallowed silently.
+        print(f"Skipped {statement}: {exc}")
+
+
+@pytest.fixture(scope="class", autouse=True)
+def setup_grants_and_roles(project):
+    """
+    Export the test group/role names as environment variables and make sure
+    the groups and roles exist in the warehouse.
+
+    The environment variables are (re)set for every test class. The CREATE
+    statements run only until they have completed once in this process:
+    GRANTS_AND_ROLES_SETUP records that, restoring the guard that had been
+    stubbed out with ``if True:``.
+    """
+    global GRANTS_AND_ROLES_SETUP
+    print("Start setup for groups and roles")
+
+    for env_name, env_var in {**GROUPS, **ROLES}.items():
+        os.environ[env_name] = env_var
+
+    if not GRANTS_AND_ROLES_SETUP:
+        print("Create groups and roles")
+        with project.adapter.connection_named("__test"):
+            for group in GROUPS.values():
+                _create_if_missing(project.adapter, "GROUP", group)
+
+            for role in ROLES.values():
+                _create_if_missing(project.adapter, "ROLE", role)
+
+            # only mark as done once every statement has been attempted
+            GRANTS_AND_ROLES_SETUP = True
+
+    print("End setup for groups and roles")
 
 
 @pytest.fixture

@@ -0,0 +1,79 @@
+import pytest
+import os
+
+from dbt.tests.util import (
+    relation_from_name,
+    get_connection,
+)
+
+TEST_USER_ENV_VARS = ["DBT_TEST_USER_1", "DBT_TEST_USER_2", "DBT_TEST_USER_3"]
+TEST_GROUP_ENV_VARS = ["DBT_TEST_GROUP_1", "DBT_TEST_GROUP_2", "DBT_TEST_GROUP_3"]
+TEST_ROLE_ENV_VARS = ["DBT_TEST_ROLE_1", "DBT_TEST_ROLE_2", "DBT_TEST_ROLE_3"]
+
+
+def replace_all(text, dic):
+    """Return ``text`` with each key of ``dic`` replaced by its value, applied in dict order."""
+    result = text
+    for needle, replacement in dic.items():
+        # later replacements see the output of earlier ones
+        result = result.replace(needle, replacement)
+    return result
+
+
+class BaseGrantsRedshift:
+    """Shared helpers and fixtures for grant tests that cover users, groups, and roles."""
+
+    def privilege_grantee_name_overrides(self):
+        """
+        Map the placeholder privilege and grantee names used in test YAML to
+        the names to substitute for them. The default is an identity mapping;
+        override it to translate, e.g. "select" --> "other_select_name".
+        """
+        placeholders = ("select", "insert", "fake_privilege", "invalid_user")
+        return {placeholder: placeholder for placeholder in placeholders}
+
+    def interpolate_name_overrides(self, yaml_text):
+        """Apply ``privilege_grantee_name_overrides`` to ``yaml_text`` via ``replace_all``."""
+        overrides = self.privilege_grantee_name_overrides()
+        return replace_all(yaml_text, overrides)
+
+    @pytest.fixture(scope="class", autouse=True)
+    def get_test_groups(self, project):
+        """Names read from TEST_GROUP_ENV_VARS, skipping variables that are unset or empty."""
+        return [name for name in map(os.getenv, TEST_GROUP_ENV_VARS) if name]
+
+    @pytest.fixture(scope="class", autouse=True)
+    def get_test_roles(self, project):
+        """Names read from TEST_ROLE_ENV_VARS, skipping variables that are unset or empty."""
+        return [name for name in map(os.getenv, TEST_ROLE_ENV_VARS) if name]
+
+    @pytest.fixture(scope="class", autouse=True)
+    def get_test_users(self, project):
+        """Names read from TEST_USER_ENV_VARS, skipping variables that are unset or empty."""
+        return [name for name in map(os.getenv, TEST_USER_ENV_VARS) if name]
+
+    def get_grants_on_relation(self, project, relation_name):
+        """
+        Render the ``get_show_grant_sql`` macro for the named relation, execute
+        the resulting SQL with ``fetch=True`` and return the rows passed through
+        ``adapter.standardize_grants_dict``.
+        """
+        adapter = project.adapter
+        target = relation_from_name(adapter, relation_name)
+        with get_connection(adapter):
+            sql = adapter.execute_macro("get_show_grant_sql", kwargs={"relation": target})
+            _, rows = adapter.execute(sql, fetch=True)
+            return adapter.standardize_grants_dict(rows)
+
+    # This is an override of the BaseGrants class
+    def assert_expected_grants_match_actual(self, project, actual_grants, expected_grants):
+        """Assert that neither grants dict contains anything the other lacks."""
+        adapter = project.adapter
+        # a plain "expected == actual" cannot be used: the adapter's diff helper
+        # is relied on for the case-insensitive comparison, once in each direction
+        unexpected = adapter.diff_of_two_nested_dicts(actual_grants, expected_grants)
+        missing = adapter.diff_of_two_nested_dicts(expected_grants, actual_grants)
+        assert unexpected == {} and missing == {}