Skip to content

Commit 0b1cd6a

Browse files
authored
Add DFS metric evaluation planner (#1985)
This PR adds a metric evaluation planner that creates the plan using a depth-first (DFS) traversal of each metric's definition and its input metrics. This mirrors the current approach used in the dataflow plan builder.
1 parent 3c19f87 commit 0b1cd6a

19 files changed

+1082
-19
lines changed
Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
kind: Under the Hood
2+
body: Add DFS metric evaluation planner
3+
time: 2026-03-10T08:51:19.497736-07:00
4+
custom:
5+
Author: plypaul
6+
Issue: "1985"

metricflow-semantics/metricflow_semantics/toolkit/string_helpers.py

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,7 @@
11
from __future__ import annotations
22

33
import textwrap
4+
from typing import Optional
45

56
MF_INDENT_2_SPACE = " "
67

@@ -36,3 +37,8 @@ def mf_dedent(text: str) -> str:
3637
)
3738
"""
3839
return textwrap.dedent(text.lstrip("\n")).rstrip("\n")
40+
41+
42+
def mf_wrap(text: str, width: Optional[int] = None) -> str:
    """Wrap `text` so each output line is at most `width` characters (default 80).

    Intended for user-facing messages. Whitespace is normalized by `textwrap.wrap`,
    so existing line breaks in `text` are not preserved.
    """
    effective_width = 80 if width is None else width
    wrapped_lines = textwrap.wrap(text=text, width=effective_width)
    return "\n".join(wrapped_lines)

metricflow/dataflow/nodes/compute_metrics.py

Lines changed: 18 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,7 @@
22

33
from collections.abc import Iterable
44
from dataclasses import dataclass
5+
from functools import cached_property
56
from typing import Sequence, Set, Tuple
67

78
from metricflow_semantics.dag.id_prefix import IdPrefix, StaticIdPrefix
@@ -67,11 +68,16 @@ def description(self) -> str: # noqa: D102
6768

6869
@property
def displayed_properties(self) -> Sequence[DisplayedProperty]:
    """Properties to display for this node.

    Extends the parent class's displayed properties with one `metric_spec` entry per computed metric
    spec and per passthrough metric spec, plus the output group-by metric instances when present.
    """
    displayed_properties = list(super().displayed_properties)
    # TODO: Use different key names for computed / passthrough metric specs.
    displayed_properties.extend(
        DisplayedProperty("metric_spec", metric_spec) for metric_spec in self.computed_metric_specs
    )
    displayed_properties.extend(
        DisplayedProperty("metric_spec", metric_spec) for metric_spec in self.passthrough_metric_specs
    )
    if self.output_group_by_metric_instances:
        # NOTE(review): all instances are grouped under a single displayed property (not one per
        # instance) — presumably intentional; confirm against how renderers consume this.
        displayed_properties.append(
            DisplayedProperty("output_group_by_metric_instances", self.output_group_by_metric_instances),
        )
    return displayed_properties
@@ -84,7 +90,10 @@ def functionally_identical(self, other_node: DataflowPlanNode) -> bool: # noqa:
8490
if not isinstance(other_node, self.__class__):
8591
return False
8692

87-
if other_node.computed_metric_specs != self.computed_metric_specs:
93+
if (
94+
other_node.computed_metric_specs != self.computed_metric_specs
95+
or other_node.passthrough_metric_specs != self.passthrough_metric_specs
96+
):
8897
return False
8998

9099
return (
@@ -105,8 +114,8 @@ def can_combine(self, other_node: ComputeMetricsNode) -> Tuple[bool, str]:
105114

106115
if other_node.output_group_by_metric_instances != self.output_group_by_metric_instances:
107116
return False, "one node is a group by metric source node"
108-
109-
alias_to_metric_spec = {spec.alias: spec for spec in self.computed_metric_specs if spec.alias is not None}
117+
metric_specs = self.computed_metric_specs + self.passthrough_metric_specs
118+
alias_to_metric_spec = {spec.alias: spec for spec in metric_specs if spec.alias is not None}
110119

111120
for spec in other_node.computed_metric_specs:
112121
if (
@@ -135,3 +144,7 @@ def with_new_parents(self, new_parent_nodes: Sequence[DataflowPlanNode]) -> Comp
135144
@override
136145
def aggregated_to_elements(self) -> Set[LinkableInstanceSpec]:
137146
return set(self._aggregated_to_elements)
147+
148+
@cached_property
def metric_specs(self) -> Sequence[MetricSpec]:
    """All metric specs handled by this node: the computed specs followed by the passthrough specs.

    Cached since the node is immutable (frozen dataclass fields) — assumes `computed_metric_specs`
    and `passthrough_metric_specs` support `+` concatenation (e.g. both tuples); TODO confirm.
    """
    return self.computed_metric_specs + self.passthrough_metric_specs

metricflow/dataflow/optimizer/source_scan/cm_branch_combiner.py

Lines changed: 12 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,11 @@
11
from __future__ import annotations
22

3+
import itertools
34
import logging
45
from dataclasses import dataclass
56
from typing import List, Optional, Sequence
67

7-
from metricflow_semantics.specs.metric_spec import MetricSpec
8+
from metricflow_semantics.toolkit.collections.ordered_set import FrozenOrderedSet
89
from metricflow_semantics.toolkit.mf_logging.lazy_formattable import LazyFormat
910

1011
from metricflow.dataflow.dataflow_plan import (
@@ -338,19 +339,18 @@ def visit_compute_metrics_node(self, node: ComputeMetricsNode) -> ComputeMetrics
338339
combined_parent_node = combined_parent_nodes[0]
339340
assert combined_parent_node is not None
340341

341-
# Dedupe (preserving order for output consistency) as it's possible for multiple derived metrics to use the same
342-
# metric.
343-
unique_metric_specs: List[MetricSpec] = []
344-
for metric_spec in tuple(self._current_left_node.computed_metric_specs) + tuple(
345-
current_right_node.computed_metric_specs
346-
):
347-
if metric_spec not in unique_metric_specs:
348-
unique_metric_specs.append(metric_spec)
349-
350342
combined_node = ComputeMetricsNode.create(
351343
parent_node=combined_parent_node,
352-
computed_metric_specs=unique_metric_specs,
353-
passthrough_metric_specs=(),
344+
# Dedupe (preserving order for output consistency) as it's possible for multiple derived metrics to use the same
345+
# metric.
346+
computed_metric_specs=FrozenOrderedSet(
347+
itertools.chain(self._current_left_node.computed_metric_specs, current_right_node.computed_metric_specs)
348+
),
349+
passthrough_metric_specs=FrozenOrderedSet(
350+
itertools.chain(
351+
self._current_left_node.passthrough_metric_specs, current_right_node.passthrough_metric_specs
352+
)
353+
),
354354
aggregated_to_elements=current_right_node.aggregated_to_elements,
355355
output_group_by_metric_instances=current_right_node.output_group_by_metric_instances,
356356
)

metricflow/dataflow/optimizer/source_scan/source_scan_optimizer.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -172,7 +172,7 @@ def visit_compute_metrics_node(self, node: ComputeMetricsNode) -> OptimizeBranch
172172
optimized_branch=ComputeMetricsNode.create(
173173
parent_node=optimized_parent_result.optimized_branch,
174174
computed_metric_specs=node.computed_metric_specs,
175-
passthrough_metric_specs=(),
175+
passthrough_metric_specs=node.passthrough_metric_specs,
176176
output_group_by_metric_instances=node.output_group_by_metric_instances,
177177
aggregated_to_elements=node.aggregated_to_elements,
178178
)
Lines changed: 250 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,250 @@
1+
from __future__ import annotations
2+
3+
import logging
4+
from collections.abc import Iterable, Sequence
5+
from typing import Optional
6+
7+
from dbt_semantic_interfaces.enum_extension import assert_values_exhausted
8+
from dbt_semantic_interfaces.protocols import Metric
9+
from dbt_semantic_interfaces.type_enums import MetricType
10+
from metricflow_semantics.semantic_graph.model_id import SemanticModelId
11+
from metricflow_semantics.specs.instance_spec import LinkableInstanceSpec
12+
from metricflow_semantics.specs.metric_spec import MetricSpec
13+
from metricflow_semantics.specs.where_filter.where_filter_spec_factory import WhereFilterSpecFactory
14+
from metricflow_semantics.toolkit.mf_logging.lazy_formattable import LazyFormat
15+
from typing_extensions import override
16+
17+
from metricflow.metric_evaluation.metric_query_planner import MetricEvaluationPlanner
18+
from metricflow.metric_evaluation.plan.me_edges import MetricQueryDependencyEdge
19+
from metricflow.metric_evaluation.plan.me_nodes import (
20+
ConversionMetricQueryNode,
21+
CumulativeMetricQueryNode,
22+
DerivedMetricsQueryNode,
23+
MetricQueryNode,
24+
SimpleMetricsQueryNode,
25+
TopLevelQueryNode,
26+
)
27+
from metricflow.metric_evaluation.plan.me_plan import (
28+
MetricEvaluationPlan,
29+
MutableMetricEvaluationPlan,
30+
)
31+
from metricflow.metric_evaluation.plan.query_element import MetricQueryElement, MetricQueryPropertySet
32+
from metricflow.plan_conversion.node_processor import PredicatePushdownState
33+
34+
logger = logging.getLogger(__name__)
35+
36+
37+
class DepthFirstSearchMetricEvaluationPlanner(MetricEvaluationPlanner):
    """Builds a metric evaluation plan using a depth-first traversal of the metric dependency graph.

    For example, the metric evaluation plan for the query [`bookings_per_listing`, `bookings`] results in a plan
    that has the following edges:

        MetricQuery([`bookings_per_listing`]) -> MetricQuery([`bookings`])
        MetricQuery([`bookings_per_listing`]) -> MetricQuery([`listings`])
        Top Level Query -> MetricQuery([`bookings_per_listing`])
        Top Level Query -> MetricQuery([`bookings`])

    This mirrors the original approach to compute metrics in the `DataflowPlanBuilder`.
    """

    @override
    def build_plan(
        self,
        metric_specs: Sequence[MetricSpec],
        group_by_item_specs: Sequence[LinkableInstanceSpec],
        predicate_pushdown_state: PredicatePushdownState,
        filter_spec_factory: WhereFilterSpecFactory,
    ) -> MetricEvaluationPlan:
        """Build a metric evaluation plan using iterative depth-first traversal.

        This resolves each requested metric into metric-query nodes and dependency edges, then attaches a top-level
        query node that references all requested metrics.

        Args:
            metric_specs: The metric specs requested in the query.
            group_by_item_specs: The group-by items requested in the query.
            predicate_pushdown_state: The predicate-pushdown state associated with the query.
            filter_spec_factory: Factory used to build filter specs for the inputs of derived metrics.

        Returns:
            The metric evaluation plan for the requested metrics.

        NOTE(review): assumes the metric dependency graph is acyclic — a cycle in metric definitions
        would make the traversal loop forever; confirm cycles are rejected upstream (e.g. at manifest
        validation).
        """
        # One query element per requested metric; these become the direct children of the top-level node.
        top_level_query_elements = tuple(
            MetricQueryElement.create(
                metric_spec=metric_spec,
                group_by_item_specs=group_by_item_specs,
                predicate_pushdown_state=predicate_pushdown_state,
            )
            for metric_spec in metric_specs
        )

        evaluation_plan = MutableMetricEvaluationPlan.create()

        # The query elements to process in the iterative DFS traversal loop. The next element is popped from the right
        # so elements are added in reverse to preserve order.
        query_elements_to_process: list[MetricQueryElement] = list(reversed(top_level_query_elements))
        # Keeps track of the query elements that have been processed into a node in the evaluation plan.
        # Also serves as the "visited" set that deduplicates shared inputs across derived metrics.
        query_element_to_node: dict[MetricQueryElement, MetricQueryNode] = {}

        while query_elements_to_process:
            current_query_element = query_elements_to_process.pop()
            logger.debug(LazyFormat("Handling query element", current_query_element=current_query_element))
            # Already resolved to a node (e.g. the same metric is an input to multiple derived metrics).
            if current_query_element in query_element_to_node:
                continue

            current_metric_spec = current_query_element.metric_spec
            current_query_properties = current_query_element.query_properties
            current_predicate_pushdown_state = current_query_element.predicate_pushdown_state

            metric_name = current_metric_spec.element_name
            metric = self._manifest_object_lookup.get_metric(metric_name)
            metric_type = metric.type

            # Handle non-derived metrics. `_create_base_metric_query_node` returns None for ratio /
            # derived metrics, which require expansion into their input metrics below.
            metric_query_node = self._create_base_metric_query_node(
                metric=metric,
                metric_type=metric_type,
                metric_spec=current_metric_spec,
                query_properties=current_query_properties,
            )
            if metric_query_node is not None:
                evaluation_plan.add_node(metric_query_node)
                query_element_to_node[current_query_element] = metric_query_node
                continue

            # Handle derived metrics.
            input_query_elements = self._get_input_metric_query_elements_for_derived_metric(
                metric_spec=current_metric_spec,
                group_by_item_specs=current_query_element.group_by_item_specs,
                predicate_pushdown_state=current_predicate_pushdown_state,
                filter_spec_factory=filter_spec_factory,
            )
            assert len(input_query_elements) > 0, LazyFormat(
                "Expected a ratio or derived metric to have input query elements",
                current_metric_spec=current_metric_spec,
                metric=metric,
            )

            inputs_that_need_processing = tuple(
                input_query_element
                for input_query_element in input_query_elements
                if input_query_element not in query_element_to_node
            )
            # To implement DFS traversal, check if the input nodes have been processed. If not, add the input nodes
            # for processing and then try to process the current node again.
            if len(inputs_that_need_processing) > 0:
                # Add the current node first as the loop pops the next current element from the end.
                query_elements_to_process.append(current_query_element)
                # Adding inputs in reverse order to match traversal order with definition order.
                query_elements_to_process.extend(reversed(inputs_that_need_processing))
                continue

            # All inputs of the derived metric have been processed, so add the node for the derived metric and the
            # edges.
            derived_metric_query_node = DerivedMetricsQueryNode.create(
                # NOTE(review): a list is passed here while tuples are used elsewhere in this file —
                # presumably `create` normalizes the sequence type; confirm.
                computed_metric_specs=[current_metric_spec],
                passthrough_metric_specs=(),
                query_properties=current_query_properties,
            )
            evaluation_plan.add_node(derived_metric_query_node)

            # One edge per input: the derived metric's node depends on each input metric's node.
            for input_query_element in input_query_elements:
                input_query_node = query_element_to_node[input_query_element]
                evaluation_plan.add_edge(
                    MetricQueryDependencyEdge.create(
                        target_node=derived_metric_query_node,
                        target_node_output_spec=current_metric_spec,
                        source_node=input_query_node,
                        source_node_output_spec=input_query_element.metric_spec,
                    )
                )

            query_element_to_node[current_query_element] = derived_metric_query_node

        # Once nodes for all metrics in the query have been generated, add a `TopLevelQueryNode` to provide a single
        # entry point.
        top_level_query_node = TopLevelQueryNode.create(
            passthrough_metric_specs=metric_specs,
            query_properties=MetricQueryPropertySet.create(group_by_item_specs, predicate_pushdown_state),
        )
        evaluation_plan.add_node(top_level_query_node)

        for top_level_query_element in top_level_query_elements:
            evaluation_plan.add_edge(
                MetricQueryDependencyEdge.create(
                    target_node=top_level_query_node,
                    target_node_output_spec=top_level_query_element.metric_spec,
                    source_node=query_element_to_node[top_level_query_element],
                    source_node_output_spec=top_level_query_element.metric_spec,
                )
            )

        # NOTE(review): the declared return type is `MetricEvaluationPlan` but a
        # `MutableMetricEvaluationPlan` is returned directly — presumably the mutable plan is a
        # subtype (or callers treat it as read-only from here); confirm.
        return evaluation_plan

    def _create_base_metric_query_node(
        self,
        metric: Metric,
        metric_type: MetricType,
        metric_spec: MetricSpec,
        query_properties: MetricQueryPropertySet,
    ) -> Optional[MetricQueryNode]:
        """Return a node for base metric types or `None` for metrics that require dependency expansion.

        Args:
            metric: The metric definition from the manifest.
            metric_type: The type of `metric` (passed separately so the caller resolves it once).
            metric_spec: The spec identifying the metric in the query.
            query_properties: The query properties to attach to the created node.

        Returns:
            A node for SIMPLE / CUMULATIVE / CONVERSION metrics; `None` for RATIO / DERIVED metrics,
            which are expanded into their input metrics by the caller.

        Raises:
            ValueError: If a simple metric is missing its aggregation parameters.
        """
        if metric_type is MetricType.SIMPLE:
            metric_aggregation_params = metric.type_params.metric_aggregation_params
            if metric_aggregation_params is None:
                raise ValueError(
                    LazyFormat(
                        "Simple metric is missing metric aggregation parameters",
                        metric_spec=metric_spec,
                        metric=metric,
                    )
                )
            return SimpleMetricsQueryNode.create(
                model_id=SemanticModelId.get_instance(metric_aggregation_params.semantic_model),
                metric_specs=(metric_spec,),
                query_properties=query_properties,
            )

        if metric_type is MetricType.CUMULATIVE:
            return CumulativeMetricQueryNode.create(metric_spec=metric_spec, query_properties=query_properties)
        elif metric_type is MetricType.CONVERSION:
            return ConversionMetricQueryNode.create(metric_spec=metric_spec, query_properties=query_properties)
        elif metric_type is MetricType.RATIO or metric_type is MetricType.DERIVED:
            # Ratio / derived metrics have no base node — the caller expands them into input metrics.
            return None
        else:
            # Static check: fails to type-check if a new MetricType is added without handling it here.
            assert_values_exhausted(metric_type)

    def _get_input_metric_query_elements_for_derived_metric(
        self,
        metric_spec: MetricSpec,
        group_by_item_specs: Iterable[LinkableInstanceSpec],
        predicate_pushdown_state: PredicatePushdownState,
        filter_spec_factory: WhereFilterSpecFactory,
    ) -> Sequence[MetricQueryElement]:
        """Return input query elements for a ratio / derived metric.

        Input query elements generally inherit group-by and predicate settings from the metric being expanded.
        Time-offset metrics are handled differently - see appropriate section in the `DataflowPlanBuilder`.

        Args:
            metric_spec: The ratio / derived metric spec to expand.
            group_by_item_specs: The group-by items requested for `metric_spec`.
            predicate_pushdown_state: The predicate-pushdown state for `metric_spec`.
            filter_spec_factory: Factory used to build filter specs for the input metrics.

        Returns:
            One query element per input metric of the derived metric.
        """
        additional_filter_specs = metric_spec.where_filter_specs
        group_by_item_specs_for_inputs = group_by_item_specs
        predicate_pushdown_state_for_inputs = predicate_pushdown_state

        if metric_spec.has_time_offset:
            group_by_item_specs_for_inputs = self._required_group_by_items_for_inputs_to_a_time_offset_metric(
                queried_group_by_specs=group_by_item_specs,
                filter_specs=metric_spec.where_filter_specs,
            )
            predicate_pushdown_state_for_inputs = PredicatePushdownState.with_pushdown_disabled()
            # If metric is offset, we'll apply where constraint after offset to avoid removing values
            # unexpectedly. Time constraint will be applied by INNER JOINing to time spine.
            # We may consider encapsulating this in pushdown state later, but as of this moment pushdown
            # is about post-join to pre-join for dimension access, and relies on the builder to collect
            # predicates from query and metric specs and make them available at simple-metric-input level.
            additional_filter_specs = ()

        input_metric_specs = self._build_input_metric_specs_for_derived_metric(
            metric_name=metric_spec.element_name,
            filter_spec_factory=filter_spec_factory,
            additional_filter_specs=additional_filter_specs,
        )
        return tuple(
            MetricQueryElement.create(
                metric_spec=input_metric_spec,
                group_by_item_specs=group_by_item_specs_for_inputs,
                predicate_pushdown_state=predicate_pushdown_state_for_inputs,
            )
            for input_metric_spec in input_metric_specs
        )

0 commit comments

Comments
 (0)