import itertools
import logging
import re
from pathlib import Path
from typing import Any, Iterator, Literal, Mapping, Optional, Sequence, Tuple, cast
from dagster import AssetKey
from dagster._annotations import experimental, public
from sqlglot import ParseError, exp, parse_one, to_table
from sqlglot.optimizer import Scope, build_scope, optimize
from dagster_looker.lkml.liquid_utils import best_effort_render_liquid_sql
from dagster_looker.lkml.sqlglot_utils import custom_bigquery_dialect_inst
LookMLStructureType = Literal["dashboard", "explore", "table", "view"]
logger = logging.getLogger("dagster_looker")
def build_deps_for_looker_dashboard(
dagster_looker_translator: "DagsterLookerLkmlTranslator",
lookml_structure: Tuple[Path, LookMLStructureType, Mapping[str, Any]],
) -> Sequence[AssetKey]:
lookml_view_path, _, lookml_dashboard_props = lookml_structure
return list(
{
dagster_looker_translator.get_asset_key(
lookml_structure=(
lookml_view_path,
"explore",
lookml_element_from_dashboard_props,
)
)
for lookml_element_from_dashboard_props in itertools.chain(
# https://cloud.google.com/looker/docs/reference/param-lookml-dashboard#elements_2
lookml_dashboard_props.get("elements", []),
# https://cloud.google.com/looker/docs/reference/param-lookml-dashboard#filters
lookml_dashboard_props.get("filters", []),
)
if lookml_element_from_dashboard_props.get("explore")
}
)
def build_deps_for_looker_explore(
dagster_looker_translator: "DagsterLookerLkmlTranslator",
lookml_structure: Tuple[Path, LookMLStructureType, Mapping[str, Any]],
) -> Sequence[AssetKey]:
lookml_explore_path, _, lookml_explore_props = lookml_structure
# https://cloud.google.com/looker/docs/reference/param-explore-from
explore_base_view = [{"name": lookml_explore_props.get("from") or lookml_explore_props["name"]}]
# https://cloud.google.com/looker/docs/reference/param-explore-join
explore_join_views: Sequence[Mapping[str, Any]] = lookml_explore_props.get("joins", [])
return list(
{
dagster_looker_translator.get_asset_key(
lookml_structure=(
lookml_explore_path,
"view",
lookml_view_from_explore_props,
)
)
for lookml_view_from_explore_props in itertools.chain(
explore_base_view, explore_join_views
)
}
)
def build_deps_for_looker_view(
dagster_looker_translator: "DagsterLookerLkmlTranslator",
lookml_structure: Tuple[Path, LookMLStructureType, Mapping[str, Any]],
) -> Sequence[AssetKey]:
lookml_view_path, _, lookml_view_props = lookml_structure
# https://cloud.google.com/looker/docs/derived-tables
derived_table_sql: Optional[str] = lookml_view_props.get("derived_table", {}).get("sql")
if not derived_table_sql:
# https://cloud.google.com/looker/docs/reference/param-view-sql-table-name
sql_table_name = lookml_view_props.get("sql_table_name") or lookml_view_props["name"]
sqlglot_table = to_table(
sql_table_name.replace("`", ""), dialect=custom_bigquery_dialect_inst
)
return [
dagster_looker_translator.get_asset_key(
lookml_structure=(
lookml_view_path,
"table",
{"table": sqlglot_table, "from_structure": lookml_view_props},
)
)
]
# We need to handle the Looker substitution operator ($) properly since the lkml
# compatible SQL may not be parsable yet by sqlglot.
#
# https://cloud.google.com/looker/docs/sql-and-referring-to-lookml#substitution_operator_
upstream_view_pattern = re.compile(r"\${(.*?)\.SQL_TABLE_NAME\}")
if upstream_looker_views_from_substitution := upstream_view_pattern.findall(derived_table_sql):
return [
dagster_looker_translator.get_asset_key(
lookml_structure=(
lookml_view_path,
"view",
{"name": upstream_looker_view_name},
)
)
for upstream_looker_view_name in set(upstream_looker_views_from_substitution)
]
upstream_sqlglot_tables: Sequence[exp.Table] = []
try:
rendered_liquid_sql = best_effort_render_liquid_sql(
lookml_view_props["name"], lookml_view_path.name, derived_table_sql
)
parsed_derived_table_ast = parse_one(
sql=rendered_liquid_sql, dialect=custom_bigquery_dialect_inst
)
ast_to_evaluate = parsed_derived_table_ast
try:
optimized_derived_table_ast = optimize(
parsed_derived_table_ast,
dialect=custom_bigquery_dialect_inst,
validate_qualify_columns=False,
)
ast_to_evaluate = optimized_derived_table_ast
except ParseError:
pass
root_scope = build_scope(ast_to_evaluate)
upstream_sqlglot_tables = [
source
for scope in cast(Iterator[Scope], root_scope.traverse() if root_scope else [])
for (_, source) in scope.selected_sources.values()
if isinstance(source, exp.Table)
]
except Exception as e:
logger.warn(
f"Failed to parse derived table SQL for view `{lookml_view_props['name']}`"
f" in file `{lookml_view_path.name}`."
" The upstream dependencies for the view will be omitted.\n\n"
f"Exception: {e}"
)
return list(
{
dagster_looker_translator.get_asset_key(
lookml_structure=(
lookml_view_path,
"table",
{"table": sqlglot_table, "from_structure": lookml_view_props},
)
)
for sqlglot_table in upstream_sqlglot_tables
}
)
[docs]
@experimental
class DagsterLookerLkmlTranslator:
"""Holds a set of methods that derive Dagster asset definition metadata given a representation
of a LookML structure (dashboards, explores, views).
This class is exposed so that methods can be overriden to customize how Dagster asset metadata
is derived.
"""
[docs]
@public
def get_asset_key(
self, lookml_structure: Tuple[Path, LookMLStructureType, Mapping[str, Any]]
) -> AssetKey:
"""A method that takes in a LookML structure (dashboards, explores, views) and
returns the Dagster asset key that represents the structure.
The LookML structure is parsed using ``lkml``. You can learn more about this here:
https://lkml.readthedocs.io/en/latest/simple.html.
You can learn more about LookML dashboards and the properties available in this
dictionary here: https://cloud.google.com/looker/docs/reference/param-lookml-dashboard.
You can learn more about LookML explores and views and the properties available in this
dictionary here: https://cloud.google.com/looker/docs/reference/lookml-quick-reference.
This method can be overriden to provide a custom asset key for a LookML structure.
Args:
lookml_structure (Tuple[Path, str, Mapping[str, Any]]): A tuple with the path to file
defining a LookML structure, the LookML structure type, and a dictionary
representing a LookML structure.
Returns:
AssetKey: The Dagster asset key that represents the LookML structure.
"""
lookml_structure_path, lookml_structure_type, lookml_structure_props = lookml_structure
if lookml_structure_type == "dashboard":
return AssetKey(["dashboard", lookml_structure_props["dashboard"]])
if lookml_structure_type == "view":
return AssetKey(["view", lookml_structure_props["name"]])
if lookml_structure_type == "table":
sqlglot_table = lookml_structure_props["table"]
return AssetKey([part.name.replace("*", "_star") for part in sqlglot_table.parts])
if lookml_structure_type == "explore":
explore_name = lookml_structure_props.get("explore") or lookml_structure_props.get(
"name"
)
if not explore_name:
raise ValueError(
f"Could not find `name` or `explore` property in LookML structure type `{lookml_structure_type}`"
f" at path `{lookml_structure_path}` with properties {lookml_structure_props}"
)
return AssetKey(["explore", explore_name])
raise ValueError(
f"Unsupported LookML structure type `{lookml_structure_type}` at path `{lookml_structure_path}`"
)
[docs]
@public
def get_deps(
self, lookml_structure: Tuple[Path, LookMLStructureType, Mapping[str, Any]]
) -> Sequence[AssetKey]:
"""A method that takes in a LookML structure (dashboards, explores, views) and
returns the Dagster dependencies of that the structure.
The LookML structure is parsed using ``lkml``. You can learn more about this here:
https://lkml.readthedocs.io/en/latest/simple.html.
You can learn more about LookML dashboards and the properties available in this
dictionary here: https://cloud.google.com/looker/docs/reference/param-lookml-dashboard.
You can learn more about LookML explores and views and the properties available in this
dictionary here: https://cloud.google.com/looker/docs/reference/lookml-quick-reference.
This method can be overriden to provide custom dependencies for a LookML structure.
Args:
lookml_structure (Tuple[Path, str, Mapping[str, Any]]): A tuple with the path to file
defining a LookML structure, the LookML structure type, and a dictionary
representing a LookML structure.
Returns:
AssetKey: The Dagster dependencies for the LookML structure.
"""
lookml_structure_path, lookml_structure_type, _ = lookml_structure
if lookml_structure_type == "dashboard":
return build_deps_for_looker_dashboard(
dagster_looker_translator=self, lookml_structure=lookml_structure
)
if lookml_structure_type == "explore":
return build_deps_for_looker_explore(
dagster_looker_translator=self, lookml_structure=lookml_structure
)
if lookml_structure_type == "view":
return build_deps_for_looker_view(
dagster_looker_translator=self, lookml_structure=lookml_structure
)
raise ValueError(
f"Unsupported LookML structure type `{lookml_structure_type}` at path `{lookml_structure_path}`"
)
[docs]
@public
def get_description(
self, lookml_structure: Tuple[Path, LookMLStructureType, Mapping[str, Any]]
) -> Optional[str]:
"""A method that takes in a LookML structure (dashboards, explores, views) and
returns the Dagster description of the structure.
The LookML structure is parsed using ``lkml``. You can learn more about this here:
https://lkml.readthedocs.io/en/latest/simple.html.
You can learn more about LookML dashboards and the properties available in this
dictionary here: https://cloud.google.com/looker/docs/reference/param-lookml-dashboard.
You can learn more about LookML explores and views and the properties available in this
dictionary here: https://cloud.google.com/looker/docs/reference/lookml-quick-reference.
This method can be overriden to provide a custom description for a LookML structure.
Args:
lookml_structure (Tuple[Path, str, Mapping[str, Any]]): A tuple with the path to file
defining a LookML structure, the LookML structure type, and a dictionary
representing a LookML structure.
Returns:
Optional[str]: The Dagster description for the LookML structure.
"""
_, _, lookml_structure_props = lookml_structure
return lookml_structure_props.get("description")
[docs]
@public
def get_group_name(
self, lookml_structure: Tuple[Path, LookMLStructureType, Mapping[str, Any]]
) -> Optional[str]:
"""A method that takes in a LookML structure (dashboards, explores, views) and
returns the Dagster group name of the structure.
The LookML structure is parsed using ``lkml``. You can learn more about this here:
https://lkml.readthedocs.io/en/latest/simple.html.
You can learn more about LookML dashboards and the properties available in this
dictionary here: https://cloud.google.com/looker/docs/reference/param-lookml-dashboard.
You can learn more about LookML explores and views and the properties available in this
dictionary here: https://cloud.google.com/looker/docs/reference/lookml-quick-reference.
This method can be overriden to provide a custom group name for a LookML structure.
Args:
lookml_structure (Tuple[Path, str, Mapping[str, Any]]): A tuple with the path to file
defining a LookML structure, the LookML structure type, and a dictionary
representing a LookML structure.
Returns:
Optional[str]: A Dagster group name for the LookML structure.
"""
return None
[docs]
@public
def get_owners(
self, lookml_structure: Tuple[Path, LookMLStructureType, Mapping[str, Any]]
) -> Optional[Sequence[str]]:
"""A method that takes in a LookML structure (dashboards, explores, views) and
returns the Dagster owners of the structure.
The LookML structure is parsed using ``lkml``. You can learn more about this here:
https://lkml.readthedocs.io/en/latest/simple.html.
You can learn more about LookML dashboards and the properties available in this
dictionary here: https://cloud.google.com/looker/docs/reference/param-lookml-dashboard.
You can learn more about LookML explores and views and the properties available in this
dictionary here: https://cloud.google.com/looker/docs/reference/lookml-quick-reference.
This method can be overriden to provide custom owners for a LookML structure.
Args:
lookml_structure (Tuple[Path, str, Mapping[str, Any]]): A tuple with the path to file
defining a LookML structure, the LookML structure type, and a dictionary
representing a LookML structure.
Returns:
Optional[Sequence[str]]: A sequence of Dagster owners for the LookML structure.
"""
return None