dbt-labs · jon-rtr · Apr 7, 2018 · Jul 11, 2018 · drewbanin · Apr 8, 2018
diff --git a/dbt/include/global_project/macros/adapters/snowflake.sql b/dbt/include/global_project/macros/adapters/snowflake.sql
@@ -1,7 +1,33 @@
+{% macro clusterby(_clusterby) %}
+  {#- Render a Snowflake `cluster by (...)` clause from `_clusterby`, which
+      may be a single string or a list of strings. Nothing is rendered when
+      the value is none or empty. Items are emitted verbatim (not wrapped in
+      double quotes) so expressions such as `ad_group_id % 10` stay valid
+      and plain column names keep Snowflake's case-insensitive matching. -#}
+  {%- if _clusterby -%}
+    {%- if _clusterby is string -%}
+      {%- set _clusterby = [_clusterby] -%}
+    {%- endif -%}
+    cluster by ({{ _clusterby | join(', ') }})
+  {%- endif -%}
+{%- endmacro -%}
+
 {% macro snowflake__create_table_as(temporary, relation, sql) -%}
+  {%- set _clusterby = config.get('clusterby') -%}
+
   {% if temporary %}
     use schema {{ schema }};
   {% endif %}
 
-  {{ default__create_table_as(temporary, relation, sql) }}
+  {# FIXME: We cannot call default__create_table_as here as it terminates
+            the returned SQL with a semicolon, so its DDL is copied below
+            (a potential source of drift). Snowflake's CTAS grammar expects
+            the `cluster by (...)` clause before `as <query>`, not after. #}
+  create {% if temporary: -%}temporary{%- endif %} table
+    {{ relation.include(schema=(not temporary)) }}
+  {{ clusterby(_clusterby) }}
+  as (
+    {{ sql }}
+  )
+  ;
 {% endmacro %}
diff --git a/dbt/model.py b/dbt/model.py
@@ -18,12 +18,13 @@ class SourceConfig(object):
         'schema',
         'enabled',
         'materialized',
-        'dist',
-        'sort',
+        'dist',         # redshift
+        'sort',         # redshift
+        'clusterby',    # snowflake
         'sql_where',
         'unique_key',
-        'sort_type',
-        'bind'
+        'sort_type',    # redshift
+        'bind'          # redshift
     ]
 
     def __init__(self, active_project, own_project, fqn, node_type):

diff --git a/dbt/utils.py b/dbt/utils.py
@@ -20,11 +20,12 @@
     'schema',
     'enabled',
     'materialized',
-    'dist',
-    'sort',
+    'dist',         # redshift
+    'sort',         # redshift
+    'clusterby',    # snowflake
     'sql_where',
     'unique_key',
-    'sort_type',
+    'sort_type',    # redshift
     'pre-hook',
     'post-hook',
     'vars',

diff --git a/sample.dbt_project.yml b/sample.dbt_project.yml
@@ -120,6 +120,7 @@ models:
             adwords_ads:
                 enabled: true
                 materialized: table
+                clusterby: ["date_day", "ad_group_id % 10"]  # snowflake only: columns/expressions to cluster by
 
         # Applies to all SQL files found under ./models/snowplow/
         snowplow:

diff --git a/test/integration/018_adapter_ddl_tests/models/materialized.sql b/test/integration/018_adapter_ddl_tests/models/materialized.sql
@@ -2,7 +2,8 @@
   config(
     materialized = "table",
     sort = 'first_name',
-    dist = 'first_name'
+    dist = 'first_name',
+    clusterby = 'first_name',
   )
 }}
 

diff --git a/test/integration/018_adapter_ddl_tests/test_adapter_ddl.py b/test/integration/018_adapter_ddl_tests/test_adapter_ddl.py
@@ -10,14 +10,14 @@ def setUp(self):
 
     @property
     def schema(self):
-        return "adaper_ddl_018"
+        return "adapter_ddl_018"
 
     @property
     def models(self):
         return "test/integration/018_adapter_ddl_tests/models"
 
     @attr(type='postgres')
-    def test_sort_and_dist_keys_are_nops_on_postgres(self):
+    def test_clusterby_and_sort_and_dist_keys_are_nops_on_postgres(self):
         self.run_dbt(['run'])
 
         self.assertTablesEqual("seed","materialized")