fsc-utils/macros/datashares.sql

174 lines
7.0 KiB
SQL

{%- macro get_ancestors(node, include_depth=false, exclude_source=false) -%}
{#
Emit the ancestors of a node as a run of double-quoted, comma-terminated strings.

node.depends_on.nodes is de-duplicated with `unique` and walked with a
recursive Jinja loop. Each emitted entry has the form
    "[<depth>-]<materialized>-<dep>",
where <depth> is loop.depth0 (present only when include_depth is true),
<materialized> is node.config.materialized of the node passed to this macro
(not of the dependency), and <dep> is the dependency's identifier.

- A dependency that starts with "model." and does not contain "bronze__" is
  emitted and then expanded through graph.nodes[dep].depends_on.nodes.
- Any other dependency is emitted without being expanded, and only when
  exclude_source is false.

The result is text, not a list object, and every entry ends with a comma, so
a caller has to drop the trailing comma before parsing the output as a list.

node: graph node exposing depends_on.nodes and config.materialized
include_depth: when true, prefix each entry with its recursion depth
exclude_source: when true, skip the dependencies that are not expanded
#}
{%- for dep in node.depends_on.nodes | unique | list recursive %}
{% if dep.startswith("model.") and "bronze__" not in dep %}
"{{- loop.depth0 ~ '-'if include_depth else '' }}{{node.config.materialized }}-{{ dep -}}",
{{- loop(graph.nodes[dep].depends_on.nodes) -}}
{% elif not exclude_source %}
"{{- loop.depth0 ~ '-'if include_depth else '' }}{{node.config.materialized }}-{{ dep -}}",
{%- endif -%}
{%- endfor %}
{%- endmacro -%}
{% macro get_view_ddl() %}
{#
Return a JSON object that maps "SCHEMA.VIEW_NAME" to the definition of that view.

Views are read from INFORMATION_SCHEMA.VIEWS of target.database. The
INFORMATION_SCHEMA and STREAMLINE schemas are skipped, and so is every schema
whose name starts with the literal prefix "TEST_".
The prefix is tested with STARTSWITH rather than LIKE 'TEST_%': in a LIKE
pattern the underscore matches any single character, so the LIKE form also
discarded schemas such as TESTNET or TESTS.

Each "$$" in a definition is rewritten to "\$\$" so that the text is escaped
for use in a Snowflake query.
The result is serialized with tojson so that a calling macro can read it back
with fromjson.
Nothing is emitted when `execute` is false; the query is only run while dbt is
executing.
#}
{% if execute %}
{% set query %}
SELECT
    CONCAT_WS('.', TABLE_SCHEMA, TABLE_NAME) AS VIEW_NAME,
    VIEW_DEFINITION
FROM {{ target.database }}.INFORMATION_SCHEMA.VIEWS
WHERE TABLE_SCHEMA NOT IN ('INFORMATION_SCHEMA', 'STREAMLINE')
    AND NOT STARTSWITH(TABLE_SCHEMA, 'TEST_')
{%- endset -%}
{%- set results = run_query(query) -%}
{% set ddl = {} %}
{% for key, value in results.rows %}
{%- do ddl.update({key: value|replace("$$", "\$\$")}) -%}
{%- endfor -%}
{{- tojson(ddl) -}}
{%- endif -%}
{%- endmacro -%}
{% macro replace_database_references(references_to_replace, ddl, new_database) %}
{#
Rewrite the database qualifiers inside a DDL statement and return the new text.

references_to_replace: iterable of names that must be re-pointed at new_database
ddl: the DDL text to rewrite
new_database: database name placed in front of every listed reference

For each listed name, "<target.database>.<name>" is searched with the name in
upper case and then in lower case, and every hit becomes
"<new_database>.<name as given>".
Afterwards any remaining "<target.database>." prefix, in upper or lower case,
becomes "__SOURCE__.".
#}
{% set state = namespace(text=ddl) %}
{% for ref_name in references_to_replace %}
{%- set qualified = new_database ~ "." ~ ref_name -%}
{%- for cased in [ref_name.upper(), ref_name.lower()] -%}
{%- set state.text = state.text|replace(target.database ~ "." ~ cased, qualified) -%}
{%- endfor -%}
{%- endfor -%}
{% set leftover_prefixes = [target.database.upper() ~ ".", target.database.lower() ~ "."] %}
{% for prefix in leftover_prefixes %}
{%- set state.text = state.text|replace(prefix, "__SOURCE__.") -%}
{%- endfor %}
{{- state.text -}}
{%- endmacro -%}
{% macro generate_view_ddl(dag, schema) %}
{#
Build the YAML list of statements that recreate the views found in a DAG.

dag: mapping whose values are lists of node identifiers
schema: schema names; each one yields a CREATE SCHEMA IF NOT EXISTS statement

The schema statements come first. Then, for every identifier in the DAG, the
last dot-separated segment is taken, "__" is turned into "." and the result is
upper-cased to form the lookup key into the output of get_view_ddl. Each key
that has a definition is emitted once, in the order it is first met, after
replace_database_references has rewritten it against "__NEW__".
#}
{%- set view_definitions = fromjson(fsc_utils.get_view_ddl()) -%}
{%- set statements = [] -%}
{%- for schema_name in schema -%}
    {%- do statements.append("CREATE SCHEMA IF NOT EXISTS __NEW__." ~ schema_name ~ ";") -%}
{%- endfor -%}
{%- set emitted = [] -%}
{%- for lineage in dag.values() -%}
    {%- for node_id in lineage -%}
        {%- set lookup_key = node_id.split(".")[-1].replace("__", ".").upper() -%}
        {%- if view_definitions.get(lookup_key) and lookup_key not in emitted -%}
            {%- do statements.append(
                fsc_utils.replace_database_references(view_definitions.keys(), view_definitions[lookup_key], "__NEW__")
            ) -%}
            {%- do emitted.append(lookup_key) -%}
        {%- endif -%}
    {%- endfor -%}
{%- endfor -%}
{{- toyaml(statements) -}}
{%- endmacro -%}
{% macro generate_dag_and_schemas(node_paths, materializations) %}
{#
Return, as JSON, {"dag": ..., "schema": ...} for the selected graph nodes.

node_paths: fqn segments; a node qualifies when its fqn shares at least one
materializations: accepted values of config.materialized

A node is selected when it has refs, matches node_paths and materializations,
is enabled, has no sources, and its identifier does not end in "_create_gold".

"dag" maps the upper-cased "<schema>.<alias>" of each selected node to a list
of identifiers: the node's ancestors from get_ancestors (sources excluded)
followed by the node itself, reversed so that the node comes last. A node
without ancestors maps to a list holding only its own identifier.

"schema" collects, without duplicates, the text before "__" in the last
dot-separated segment of every identifier in such a list; for a node without
ancestors the node's own schema attribute is collected instead.
#}
{%- set lineage_by_relation = {} -%}
{%- set schema_names = [] -%}
{%- for node_id, node in graph.nodes.items() -%}
    {%- if node.refs
        and set(node.fqn).intersection(node_paths)
        and node.config.materialized in materializations
        and node.config.enabled
        and not node.sources
        and not node_id.endswith("_create_gold") -%}
        {%- set relation = (node.schema + "." + node.alias).upper() -%}
        {%- set ancestors = fromyaml("[" ~ fsc_utils.get_ancestors(node, exclude_source=true)[:-1] ~ "]") -%}
        {%- if not ancestors -%}
            {%- do lineage_by_relation.update({relation: [node_id]}) -%}
            {%- if node.schema not in schema_names -%}
                {%- do schema_names.append(node.schema) -%}
            {%- endif -%}
        {%- else -%}
            {%- set members = [node_id] + ancestors -%}
            {%- do lineage_by_relation.update({relation: members | reverse | list}) -%}
            {%- for member in members -%}
                {%- set schema_prefix = member.split(".")[-1].split("__")[0] -%}
                {%- if schema_prefix not in schema_names -%}
                    {%- do schema_names.append(schema_prefix) -%}
                {%- endif -%}
            {%- endfor -%}
        {%- endif -%}
    {%- endif -%}
{%- endfor -%}
{{- tojson({"dag": lineage_by_relation, "schema": schema_names}) -}}
{%- endmacro -%}
{% macro generate_table_views_ddl(tables, schema) %}
{#
Build the YAML list of statements that expose tables as pass-through views.

tables: names of the tables; each one yields a CREATE OR REPLACE VIEW under
        "__NEW__" that selects everything from the same name under "__SOURCE__"
schema: schema names; each one yields a CREATE SCHEMA IF NOT EXISTS statement

The schema statements are listed before the view statements.
#}
{%- set statements = [] -%}
{%- for schema_name in schema -%}
    {%- do statements.append("CREATE SCHEMA IF NOT EXISTS __NEW__." ~ schema_name ~ ";") -%}
{%- endfor -%}
{%- for relation in tables -%}
    {%- set create_clause = "CREATE OR REPLACE VIEW __NEW__." ~ relation -%}
    {%- set select_clause = " AS SELECT * FROM __SOURCE__." ~ relation ~ ";" -%}
    {%- do statements.append(create_clause ~ select_clause) -%}
{%- endfor -%}
{{- toyaml(statements) -}}
{%- endmacro -%}
{% macro generate_datashare_ddl() %}
{#
Assemble the datashare script and return it as a single BEGIN ... END block.

The block contains, one statement per line and in this order:
  1. CREATE DATABASE IF NOT EXISTS __NEW__;
  2. the output of generate_view_ddl for "gold" nodes materialized as view
  3. the output of generate_table_views_ddl for "gold" nodes materialized as
     incremental or table
#}
{%- set view_graph = fromjson(fsc_utils.generate_dag_and_schemas(["gold"], ["view"])) -%}
{%- set view_statements = fromyaml(fsc_utils.generate_view_ddl(view_graph["dag"], view_graph["schema"])) -%}
{%- set table_graph = fromjson(fsc_utils.generate_dag_and_schemas(["gold"], ["incremental", "table"])) -%}
{%- set table_statements = fromyaml(fsc_utils.generate_table_views_ddl(table_graph["dag"].keys(), table_graph["schema"])) -%}
{%- set script_lines = ["BEGIN", "CREATE DATABASE IF NOT EXISTS __NEW__;"] + view_statements + table_statements + ["END"] -%}
{{- script_lines | join("\n") -}}
{%- endmacro -%}
{% macro get_exclusion_schema() %}
{#
Return, as a JSON array, the schemas that must be left out of the data shares.

A schema is listed when it belongs to a graph node whose identifier starts
with "test." or when the schema name itself starts with "_". Each schema
appears once, in the order it is first met in graph.nodes.
#}
{% set excluded = [] %}
{% for node_id, node in graph.nodes.items() -%}
    {%- set is_excluded = node_id.startswith("test.") or node.schema.startswith("_") -%}
    {%- if is_excluded and node.schema not in excluded -%}
        {%- do excluded.append(node.schema) -%}
    {%- endif -%}
{%- endfor %}
{{- excluded | tojson -}}
{%- endmacro -%}