From 9a56ae58780384109f8f50d5200d9103bacb6abc Mon Sep 17 00:00:00 2001 From: Damian Owsianny Date: Tue, 15 Oct 2024 14:32:45 +0200 Subject: [PATCH] Add file_format and table_format configurations --- dbt/include/trino/macros/adapters.sql | 33 +++++ .../adapter/test_table_properties.py | 116 ++++++++++++++++++ 2 files changed, 149 insertions(+) diff --git a/dbt/include/trino/macros/adapters.sql b/dbt/include/trino/macros/adapters.sql index 3ac4a725..98bc4161 100644 --- a/dbt/include/trino/macros/adapters.sql +++ b/dbt/include/trino/macros/adapters.sql @@ -79,6 +79,39 @@ {% macro properties() %} {%- set _properties = config.get('properties') -%} + {%- set table_format = config.get('table_format') -%} + {%- set file_format = config.get('file_format') -%} + + {%- if file_format -%} + {%- if _properties -%} + {%- if _properties.format -%} + {% set msg %} + You can specify either 'file_format' or 'properties.format' configurations, but not both. + {% endset %} + {% do exceptions.raise_compiler_error(msg) %} + {%- else -%} + {%- do _properties.update({'format': file_format}) -%} + {%- endif -%} + {%- else -%} + {%- set _properties = {'format': file_format} -%} + {%- endif -%} + {%- endif -%} + + {%- if table_format -%} + {%- if _properties -%} + {%- if _properties.type -%} + {% set msg %} + You can specify either 'table_format' or 'properties.type' configurations, but not both. + {% endset %} + {% do exceptions.raise_compiler_error(msg) %} + {%- else -%} + {%- do _properties.update({'type': table_format}) -%} + {%- endif -%} + {%- else -%} + {%- set _properties = {'type': table_format} -%} + {%- endif -%} + {%- endif -%} + {%- if _properties is not none -%} WITH ( {%- for key, value in _properties.items() -%} diff --git a/tests/functional/adapter/test_table_properties.py b/tests/functional/adapter/test_table_properties.py index 459c8cef..218b654a 100644 --- a/tests/functional/adapter/test_table_properties.py +++ b/tests/functional/adapter/test_table_properties.py @@ -47,3 +47,119 @@ def test_table_properties(self, project): assert "WITH (" in logs assert "format = 'PARQUET'" in logs assert "location = 's3://datalake/custom_location'" in logs + + +@pytest.mark.iceberg +class TestFileFormatConfig(BaseTableProperties): + # Configuration in dbt_project.yml + @pytest.fixture(scope="class") + def project_config_update(self): + return { + "name": "properties_test", + "models": { + "+materialized": "table", + "file_format": "'PARQUET'", + }, + } + + def test_table_properties(self, project): + # Seed seed + results = run_dbt(["seed"], expect_pass=True) + assert len(results) == 1 + + # Create model with properties + results, logs = run_dbt_and_capture(["--debug", "run"], expect_pass=True) + assert len(results) == 1 + assert "WITH (" in logs + assert "format = 'PARQUET'" in logs + + +@pytest.mark.iceberg +class TestFileFormatConfigAndFormatTablePropertyFail(BaseTableProperties): + # Configuration in dbt_project.yml + @pytest.fixture(scope="class") + def project_config_update(self): + return { + "name": "properties_test", + "models": { + "+materialized": "table", + "+properties": { + "format": "'PARQUET'", + }, + "file_format": "'ORC'", + }, + } + + def test_table_properties(self, project): + # Seed seed + results = run_dbt(["seed"], expect_pass=True) + assert len(results) == 1 + + # Create model with properties + results, logs = run_dbt_and_capture(["--debug", "run"], expect_pass=False) + assert len(results) == 1 + assert ( + "You can specify either 'file_format' or 'properties.format' configurations, but not both." + in logs + ) + + +@pytest.mark.hive +# Setting `type` property is available only in Starburst Galaxy +# https://docs.starburst.io/starburst-galaxy/data-engineering/working-with-data-lakes/table-formats/gl-iceberg.html +@pytest.mark.skip_profile("trino_starburst") +class TestTableFormatConfig(BaseTableProperties): + # Configuration in dbt_project.yml + @pytest.fixture(scope="class") + def project_config_update(self): + return { + "name": "properties_test", + "models": { + "+materialized": "table", + "table_format": "'iceberg'", + }, + } + + def test_table_properties(self, project): + # Seed seed + results = run_dbt(["seed"], expect_pass=True) + assert len(results) == 1 + + # Create model with properties + results, logs = run_dbt_and_capture(["--debug", "run"], expect_pass=True) + assert len(results) == 1 + assert "WITH (" in logs + assert "type = 'iceberg'" in logs + + +@pytest.mark.hive +# Setting `type` property is available only in Starburst Galaxy +# https://docs.starburst.io/starburst-galaxy/data-engineering/working-with-data-lakes/table-formats/gl-iceberg.html +@pytest.mark.skip_profile("trino_starburst") +class TestTableFormatConfigAndTypeTablePropertyFail(BaseTableProperties): + # Configuration in dbt_project.yml + @pytest.fixture(scope="class") + def project_config_update(self): + return { + "name": "properties_test", + "models": { + "+materialized": "table", + "+properties": { + "type": "'iceberg'", + }, + "table_format": "'iceberg'", + }, + } + + def test_table_properties(self, project): + # Seed seed + results = run_dbt(["seed"], expect_pass=True) + assert len(results) == 1 + + # Create model with properties + results, logs = run_dbt_and_capture(["--debug", "run"], expect_pass=False) + assert len(results) == 1 + assert ( + "You can specify either 'table_format' or 'properties.type' configurations, but not both." + in logs + )