Skip to content

Commit

Permalink
Methods to look up agg_time_dimensions (#995)
Browse files Browse the repository at this point in the history
  • Loading branch information
courtneyholcomb authored Jan 25, 2024
1 parent cb5afa2 commit e628fb1
Show file tree
Hide file tree
Showing 6 changed files with 170 additions and 23 deletions.
12 changes: 4 additions & 8 deletions metricflow/model/semantics/linkable_spec_resolver.py
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,6 @@
from metricflow.mf_logging.pretty_print import mf_pformat
from metricflow.model.semantics.linkable_element_properties import LinkableElementProperties
from metricflow.model.semantics.semantic_model_join_evaluator import SemanticModelJoinEvaluator
from metricflow.model.semantics.semantic_model_lookup import SemanticModelLookup
from metricflow.protocols.semantics import SemanticModelAccessor
from metricflow.specs.specs import (
DEFAULT_TIME_GRANULARITY,
Expand Down Expand Up @@ -524,9 +523,7 @@ def __init__(
linkable_element_sets_to_merge: List[LinkableElementSet] = []

for semantic_model in semantic_manifest.semantic_models:
linkable_element_sets_to_merge.append(
ValidLinkableSpecResolver._get_elements_in_semantic_model(semantic_model)
)
linkable_element_sets_to_merge.append(self._get_elements_in_semantic_model(semantic_model))

metric_time_elements_for_no_metrics = self._get_metric_time_elements(measure_reference=None)
self._no_metric_linkable_element_set = LinkableElementSet.merge_by_path_key(
Expand All @@ -550,8 +547,7 @@ def _get_semantic_model_for_measure(self, measure_reference: MeasureReference) -
)
return semantic_models_where_measure_was_found[0]

@staticmethod
def _get_elements_in_semantic_model(semantic_model: SemanticModel) -> LinkableElementSet:
def _get_elements_in_semantic_model(self, semantic_model: SemanticModel) -> LinkableElementSet:
"""Gets the elements in the semantic model, without requiring any joins.
Elements related to metric_time are handled separately in _get_metric_time_elements().
Expand All @@ -568,7 +564,7 @@ def _get_elements_in_semantic_model(semantic_model: SemanticModel) -> LinkableEl
properties=frozenset({LinkableElementProperties.LOCAL, LinkableElementProperties.ENTITY}),
)
)
for entity_link in SemanticModelLookup.entity_links_for_local_elements(semantic_model):
for entity_link in self._semantic_model_lookup.entity_links_for_local_elements(semantic_model):
linkable_entities.append(
LinkableEntity(
semantic_model_origin=semantic_model.reference,
Expand All @@ -579,7 +575,7 @@ def _get_elements_in_semantic_model(semantic_model: SemanticModel) -> LinkableEl
)
)

for entity_link in SemanticModelLookup.entity_links_for_local_elements(semantic_model):
for entity_link in self._semantic_model_lookup.entity_links_for_local_elements(semantic_model):
dimension_properties = frozenset({LinkableElementProperties.LOCAL})
for dimension in semantic_model.dimensions:
dimension_type = dimension.type
Expand Down
39 changes: 36 additions & 3 deletions metricflow/model/semantics/metric_lookup.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,15 +6,19 @@
from dbt_semantic_interfaces.enum_extension import assert_values_exhausted
from dbt_semantic_interfaces.protocols.metric import Metric, MetricInputMeasure, MetricType
from dbt_semantic_interfaces.protocols.semantic_manifest import SemanticManifest
from dbt_semantic_interfaces.references import MeasureReference, MetricReference
from dbt_semantic_interfaces.references import MeasureReference, MetricReference, TimeDimensionReference

from metricflow.errors.errors import DuplicateMetricError, MetricNotFoundError, NonExistentMeasureError
from metricflow.model.semantics.linkable_element_properties import LinkableElementProperties
from metricflow.model.semantics.linkable_spec_resolver import LinkableElementSet, ValidLinkableSpecResolver
from metricflow.model.semantics.linkable_spec_resolver import (
ElementPathKey,
LinkableElementSet,
ValidLinkableSpecResolver,
)
from metricflow.model.semantics.semantic_model_join_evaluator import MAX_JOIN_HOPS
from metricflow.model.semantics.semantic_model_lookup import SemanticModelLookup
from metricflow.protocols.semantics import MetricAccessor
from metricflow.specs.specs import LinkableInstanceSpec
from metricflow.specs.specs import LinkableInstanceSpec, TimeDimensionSpec

logger = logging.getLogger(__name__)

Expand Down Expand Up @@ -157,3 +161,32 @@ def contains_cumulative_or_time_offset_metric(self, metric_references: Sequence[
if input_metric.offset_window or input_metric.offset_to_grain:
return True
return False

def _get_agg_time_dimension_path_keys_for_metric(
self, metric_reference: MetricReference
) -> Sequence[ElementPathKey]:
"""Retrieves the aggregate time dimensions associated with the metric's measures."""
metric = self.get_metric(metric_reference)
path_keys = set()
for input_measure in metric.input_measures:
path_key = self._semantic_model_lookup.get_agg_time_dimension_path_key_for_measure(
measure_reference=input_measure.measure_reference
)
path_keys.add(path_key)
return list(path_keys)

def get_valid_agg_time_dimensions_for_metric(
self, metric_reference: MetricReference
) -> Sequence[TimeDimensionSpec]:
"""Get the agg time dimension specs that can be used in place of metric time for this metric, if applicable."""
agg_time_dimension_element_path_keys = self._get_agg_time_dimension_path_keys_for_metric(metric_reference)
if len(agg_time_dimension_element_path_keys) != 1:
# If the metric's input measures have different agg_time_dimensions, user must use metric_time.
return []

path_key = agg_time_dimension_element_path_keys[0]
valid_agg_time_dimension_specs = TimeDimensionSpec.generate_possible_specs_for_time_dimension(
time_dimension_reference=TimeDimensionReference(element_name=path_key.element_name),
entity_links=path_key.entity_links,
)
return valid_agg_time_dimension_specs
44 changes: 39 additions & 5 deletions metricflow/model/semantics/semantic_model_lookup.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,6 +25,7 @@
from metricflow.errors.errors import InvalidSemanticModelError
from metricflow.mf_logging.pretty_print import mf_pformat
from metricflow.model.semantics.element_group import ElementGrouper
from metricflow.model.semantics.linkable_spec_resolver import ElementPathKey
from metricflow.model.spec_converters import MeasureConverter
from metricflow.protocols.semantics import SemanticModelAccessor
from metricflow.specs.specs import (
Expand Down Expand Up @@ -214,7 +215,7 @@ def _add_semantic_model(self, semantic_model: SemanticModel) -> None:
f"Aggregation time dimension does not have a time granularity set: {agg_time_dimension}"
)

primary_entity = SemanticModelLookup._resolved_primary_entity(semantic_model)
primary_entity = SemanticModelLookup.resolved_primary_entity(semantic_model)

if primary_entity is None:
raise RuntimeError(
Expand Down Expand Up @@ -291,7 +292,7 @@ def get_entity_from_semantic_model(
)

@staticmethod
def _resolved_primary_entity(semantic_model: SemanticModel) -> Optional[EntityReference]:
def resolved_primary_entity(semantic_model: SemanticModel) -> Optional[EntityReference]:
"""Return the primary entity for dimensions in the model."""
primary_entity_reference = semantic_model.primary_entity_reference

Expand All @@ -300,14 +301,12 @@ def _resolved_primary_entity(semantic_model: SemanticModel) -> Optional[EntityRe
)

# This should be caught by the validation, but adding a sanity check.
assert len(entities_with_type_primary) <= 1, f"Found >1 primary entity in {semantic_model}"
assert len(entities_with_type_primary) <= 1, f"Found > 1 primary entity in {semantic_model}"
if primary_entity_reference is not None:
assert len(entities_with_type_primary) == 0, (
f"The primary_entity field was set to {primary_entity_reference}, but there are non-zero entities with "
f"type {EntityType.PRIMARY} in {semantic_model}"
)

if primary_entity_reference is not None:
return primary_entity_reference

if len(entities_with_type_primary) > 0:
Expand Down Expand Up @@ -339,3 +338,38 @@ def get_element_spec_for_name(self, element_name: str) -> LinkableInstanceSpec:
return self._entity_ref_to_spec[EntityReference(element_name=element_name)]
else:
raise ValueError(f"Unable to find linkable element {element_name} in manifest")

def get_agg_time_dimension_path_key_for_measure(self, measure_reference: MeasureReference) -> ElementPathKey:
"""Get the agg time dimension associated with the measure."""
agg_time_dimension = self.get_agg_time_dimension_for_measure(measure_reference)

# A measure's agg_time_dimension is required to be in the same semantic model as the measure,
# so we can assume the same semantic model for both measure and dimension.
semantic_models = self.get_semantic_models_for_measure(measure_reference)
assert (
len(semantic_models) == 1
), f"Expected exactly one semantic model for measure {measure_reference}, but found semantic models {semantic_models}."
semantic_model = semantic_models[0]

entity_link = self.resolved_primary_entity(semantic_model)
assert entity_link is not None, (
f"Expected semantic model {semantic_model} to have a primary entity since it has a "
"measure requiring an agg_time_dimension, but found none.",
)

return ElementPathKey(
element_name=agg_time_dimension.element_name,
entity_links=(entity_link,),
time_granularity=None,
date_part=None,
)

def get_agg_time_dimension_specs_for_measure(
self, measure_reference: MeasureReference
) -> Sequence[TimeDimensionSpec]:
"""Get the agg time dimension specs that can be used in place of metric time for this measure."""
path_key = self.get_agg_time_dimension_path_key_for_measure(measure_reference)
return TimeDimensionSpec.generate_possible_specs_for_time_dimension(
time_dimension_reference=TimeDimensionReference(element_name=path_key.element_name),
entity_links=path_key.entity_links,
)
36 changes: 30 additions & 6 deletions metricflow/protocols/semantics.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@
from __future__ import annotations

from abc import ABC, abstractmethod
from typing import Dict, FrozenSet, Optional, Sequence, Set
from typing import TYPE_CHECKING, Dict, FrozenSet, Optional, Sequence, Set

from dbt_semantic_interfaces.protocols.dimension import Dimension
from dbt_semantic_interfaces.protocols.entity import Entity
Expand All @@ -28,11 +28,10 @@

from metricflow.model.semantics.element_group import ElementGrouper
from metricflow.model.semantics.linkable_element_properties import LinkableElementProperties
from metricflow.specs.specs import (
LinkableInstanceSpec,
MeasureSpec,
NonAdditiveDimensionSpec,
)
from metricflow.specs.specs import LinkableInstanceSpec, MeasureSpec, NonAdditiveDimensionSpec, TimeDimensionSpec

if TYPE_CHECKING:
from metricflow.model.semantics.linkable_spec_resolver import ElementPathKey


class SemanticModelAccessor(ABC):
Expand Down Expand Up @@ -92,12 +91,19 @@ def get_semantic_models_for_measure(self, measure_reference: MeasureReference) -
@abstractmethod
def get_agg_time_dimension_for_measure(self, measure_reference: MeasureReference) -> TimeDimensionReference:
"""Retrieves the aggregate time dimension that is associated with the measure reference."""
raise NotImplementedError

@abstractmethod
def get_entity_in_semantic_model(self, ref: SemanticModelElementReference) -> Optional[Entity]:
"""Retrieve the entity matching the element -> semantic model mapping, if any."""
raise NotImplementedError

@staticmethod
@abstractmethod
def resolved_primary_entity(semantic_model: SemanticModel) -> Optional[EntityReference]:
"""Return the primary entity for dimensions in the model."""
raise NotImplementedError

@abstractmethod
def get_by_reference(self, semantic_model_reference: SemanticModelReference) -> Optional[SemanticModel]:
"""Retrieve the semantic model object matching the input semantic model reference, if any."""
Expand Down Expand Up @@ -132,6 +138,17 @@ def get_element_spec_for_name(self, element_name: str) -> LinkableInstanceSpec:
"""Returns the spec for the given name of a linkable element (dimension or entity)."""
raise NotImplementedError

@abstractmethod
def get_agg_time_dimension_path_key_for_measure(self, measure_reference: MeasureReference) -> ElementPathKey:
"""Get the agg time dimension associated with the measure."""
raise NotImplementedError

def get_agg_time_dimension_specs_for_measure(
self, measure_reference: MeasureReference
) -> Sequence[TimeDimensionSpec]:
"""Get the agg time dimension specs that can be used in place of metric time for this measure."""
raise NotImplementedError


class MetricAccessor(ABC):
"""Interface for accessing semantic information about a set of metric objects.
Expand Down Expand Up @@ -201,3 +218,10 @@ def group_by_item_specs_for_no_metrics_query(
) -> Sequence[LinkableInstanceSpec]:
"""Return the possible group-by-items for a dimension values query with no metrics."""
raise NotImplementedError

@abstractmethod
def get_valid_agg_time_dimensions_for_metric(
self, metric_reference: MetricReference
) -> Sequence[TimeDimensionSpec]:
"""Get the agg time dimension specs that can be used in place of metric time for this metric, if applicable."""
raise NotImplementedError
33 changes: 32 additions & 1 deletion metricflow/specs/specs.py
Original file line number Diff line number Diff line change
Expand Up @@ -449,6 +449,37 @@ def comparison_key(self, exclude_fields: Sequence[TimeDimensionSpecField] = ())
exclude_fields=exclude_fields,
)

@staticmethod
def generate_possible_specs_for_time_dimension(
time_dimension_reference: TimeDimensionReference, entity_links: Tuple[EntityReference, ...]
) -> List[TimeDimensionSpec]:
"""Generate a list of time dimension specs with all combinations of granularity & date part."""
time_dimension_specs: List[TimeDimensionSpec] = []
for time_granularity in TimeGranularity:
time_dimension_specs.append(
TimeDimensionSpec(
element_name=time_dimension_reference.element_name,
entity_links=entity_links,
time_granularity=time_granularity,
date_part=None,
)
)
for date_part in DatePart:
for time_granularity in date_part.compatible_granularities:
time_dimension_specs.append(
TimeDimensionSpec(
element_name=time_dimension_reference.element_name,
entity_links=entity_links,
time_granularity=time_granularity,
date_part=date_part,
)
)
return time_dimension_specs

@property
def is_metric_time(self) -> bool: # noqa: D
return self.element_name == METRIC_TIME_ELEMENT_NAME


@dataclass(frozen=True)
class NonAdditiveDimensionSpec(SerializableDataclass):
Expand Down Expand Up @@ -635,7 +666,7 @@ def metric_time_specs(self) -> Sequence[TimeDimensionSpec]:
return tuple(
time_dimension_spec
for time_dimension_spec in self.time_dimension_specs
if time_dimension_spec.element_name == METRIC_TIME_ELEMENT_NAME
if time_dimension_spec.is_metric_time
)

@property
Expand Down
29 changes: 29 additions & 0 deletions metricflow/test/model/test_semantic_model_container.py
Original file line number Diff line number Diff line change
Expand Up @@ -157,3 +157,32 @@ def test_linkable_set_for_common_dimensions_in_different_models(
),
),
)


def test_get_valid_agg_time_dimensions_for_metric( # noqa: D
metric_lookup: MetricLookup, semantic_model_lookup: SemanticModelLookup
) -> None:
for metric_name in ["views", "listings", "bookings_per_view"]:
metric_reference = MetricReference(metric_name)
metric = metric_lookup.get_metric(metric_reference)
metric_agg_time_dims = metric_lookup.get_valid_agg_time_dimensions_for_metric(metric_reference)
measure_agg_time_dims = list(
{
semantic_model_lookup.get_agg_time_dimension_for_measure(measure.measure_reference)
for measure in metric.input_measures
}
)
if len(measure_agg_time_dims) == 1:
for metric_agg_time_dim in metric_agg_time_dims:
assert metric_agg_time_dim.reference == measure_agg_time_dims[0]
else:
assert len(metric_agg_time_dims) == 0


def test_get_agg_time_dimension_specs_for_measure(semantic_model_lookup: SemanticModelLookup) -> None: # noqa: D
for measure_name in ["bookings", "views", "listings"]:
measure_reference = MeasureReference(measure_name)
agg_time_dim_specs = semantic_model_lookup.get_agg_time_dimension_specs_for_measure(measure_reference)
agg_time_dim_reference = semantic_model_lookup.get_agg_time_dimension_for_measure(measure_reference)
for spec in agg_time_dim_specs:
assert spec.reference == agg_time_dim_reference

0 comments on commit e628fb1

Please sign in to comment.