Cranelift: Do not track expression depth in egraph cost function (#12248)

fitzgen · web-flow · commit 50431b450123 · 2026-01-06T18:53:48.000Z
We don't have any rules that try to rebalance trees to make them shallower in
the mid-end (we determined it was the wrong place to do that kind of thing,
since we don't know register pressure at that point) so there is no need to
track expression depth in the cost function.
diff --git a/cranelift/codegen/src/egraph/cost.rs b/cranelift/codegen/src/egraph/cost.rs
@@ -30,52 +30,20 @@ use crate::ir::Opcode;
 /// `finite()` method.) An infinite cost is used to represent a value
 /// that cannot be computed, or otherwise serve as a sentinel when
 /// performing search for the lowest-cost representation of a value.
-#[derive(Clone, Copy, PartialEq, Eq)]
+#[derive(Clone, Copy, PartialEq, Eq, PartialOrd, Ord)]
 pub(crate) struct Cost(u32);
 
 impl core::fmt::Debug for Cost {
     fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
         if *self == Cost::infinity() {
             write!(f, "Cost::Infinite")
         } else {
-            f.debug_struct("Cost::Finite")
-                .field("op_cost", &self.op_cost())
-                .field("depth", &self.depth())
-                .finish()
+            f.debug_tuple("Cost::Finite").field(&self.cost()).finish()
         }
     }
 }
 
-impl Ord for Cost {
-    #[inline]
-    fn cmp(&self, other: &Self) -> core::cmp::Ordering {
-        // We make sure that the high bits are the op cost and the low bits are
-        // the depth. This means that we can use normal integer comparison to
-        // order by op cost and then depth.
-        //
-        // We want to break op cost ties with depth (rather than the other way
-        // around). When the op cost is the same, we prefer shallow and wide
-        // expressions to narrow and deep expressions and breaking ties with
-        // `depth` gives us that. For example, `(a + b) + (c + d)` is preferred
-        // to `((a + b) + c) + d`. This is beneficial because it exposes more
-        // instruction-level parallelism and shortens live ranges.
-        self.0.cmp(&other.0)
-    }
-}
-
-impl PartialOrd for Cost {
-    #[inline]
-    fn partial_cmp(&self, other: &Self) -> Option<core::cmp::Ordering> {
-        Some(self.cmp(other))
-    }
-}
-
 impl Cost {
-    const DEPTH_BITS: u8 = 8;
-    const DEPTH_MASK: u32 = (1 << Self::DEPTH_BITS) - 1;
-    const OP_COST_MASK: u32 = !Self::DEPTH_MASK;
-    const MAX_OP_COST: u32 = Self::OP_COST_MASK >> Self::DEPTH_BITS;
-
     pub(crate) fn infinity() -> Cost {
         // 2^32 - 1 is, uh, pretty close to infinite... (we use `Cost`
         // only for heuristics and always saturate so this suffices!)
@@ -86,39 +54,27 @@ impl Cost {
         Cost(0)
     }
 
-    /// Construct a new `Cost` from the given parts.
-    ///
-    /// If the opcode cost is greater than or equal to the maximum representable
-    /// opcode cost, then the resulting `Cost` saturates to infinity.
-    fn new(opcode_cost: u32, depth: u8) -> Cost {
-        if opcode_cost >= Self::MAX_OP_COST {
-            Self::infinity()
-        } else {
-            Cost(opcode_cost << Self::DEPTH_BITS | u32::from(depth))
-        }
-    }
-
-    fn depth(&self) -> u8 {
-        let depth = self.0 & Self::DEPTH_MASK;
-        u8::try_from(depth).unwrap()
+    /// Construct a new `Cost`.
+    fn new(cost: u32) -> Cost {
+        Cost(cost)
     }
 
-    fn op_cost(&self) -> u32 {
-        (self.0 & Self::OP_COST_MASK) >> Self::DEPTH_BITS
+    fn cost(&self) -> u32 {
+        self.0
     }
 
     /// Return the cost of an opcode.
     fn of_opcode(op: Opcode) -> Cost {
         match op {
             // Constants.
-            Opcode::Iconst | Opcode::F32const | Opcode::F64const => Cost::new(1, 0),
+            Opcode::Iconst | Opcode::F32const | Opcode::F64const => Cost::new(1),
 
             // Extends/reduces.
             Opcode::Uextend
             | Opcode::Sextend
             | Opcode::Ireduce
             | Opcode::Iconcat
-            | Opcode::Isplit => Cost::new(1, 0),
+            | Opcode::Isplit => Cost::new(1),
 
             // "Simple" arithmetic.
             Opcode::Iadd
@@ -129,27 +85,27 @@ impl Cost {
             | Opcode::Bnot
             | Opcode::Ishl
             | Opcode::Ushr
-            | Opcode::Sshr => Cost::new(3, 0),
+            | Opcode::Sshr => Cost::new(3),
 
             // "Expensive" arithmetic.
-            Opcode::Imul => Cost::new(10, 0),
+            Opcode::Imul => Cost::new(10),
 
             // Everything else.
             _ => {
                 // By default, be slightly more expensive than "simple"
                 // arithmetic.
-                let mut c = Cost::new(4, 0);
+                let mut c = Cost::new(4);
 
                 // And then get more expensive as the opcode does more side
                 // effects.
                 if op.can_trap() || op.other_side_effects() {
-                    c = c + Cost::new(10, 0);
+                    c = c + Cost::new(10);
                 }
                 if op.can_load() {
-                    c = c + Cost::new(20, 0);
+                    c = c + Cost::new(20);
                 }
                 if op.can_store() {
-                    c = c + Cost::new(50, 0);
+                    c = c + Cost::new(50);
                 }
 
                 c
@@ -163,12 +119,12 @@ impl Cost {
     /// that satisfies `inst_predicates::is_pure_for_egraph()`.
     pub(crate) fn of_pure_op(op: Opcode, operand_costs: impl IntoIterator<Item = Self>) -> Self {
         let c = Self::of_opcode(op) + operand_costs.into_iter().sum();
-        Cost::new(c.op_cost(), c.depth().saturating_add(1))
+        Cost::new(c.cost())
     }
 
     /// Compute the cost of an operation in the side-effectful skeleton.
     pub(crate) fn of_skeleton_op(op: Opcode, arity: usize) -> Self {
-        Cost::of_opcode(op) + Cost::new(u32::try_from(arity).unwrap(), (arity != 0) as _)
+        Cost::of_opcode(op) + Cost::new(u32::try_from(arity).unwrap())
     }
 }
 
@@ -188,9 +144,7 @@ impl core::ops::Add<Cost> for Cost {
     type Output = Cost;
 
     fn add(self, other: Cost) -> Cost {
-        let op_cost = self.op_cost().saturating_add(other.op_cost());
-        let depth = core::cmp::max(self.depth(), other.depth());
-        Cost::new(op_cost, depth)
+        Cost::new(self.cost().saturating_add(other.cost()))
     }
 }
 
@@ -200,39 +154,25 @@ mod tests {
 
     #[test]
     fn add_cost() {
-        let a = Cost::new(5, 2);
-        let b = Cost::new(37, 3);
-        assert_eq!(a + b, Cost::new(42, 3));
-        assert_eq!(b + a, Cost::new(42, 3));
+        let a = Cost::new(5);
+        let b = Cost::new(37);
+        assert_eq!(a + b, Cost::new(42));
+        assert_eq!(b + a, Cost::new(42));
     }
 
     #[test]
     fn add_infinity() {
-        let a = Cost::new(5, 2);
+        let a = Cost::new(5);
         let b = Cost::infinity();
         assert_eq!(a + b, Cost::infinity());
         assert_eq!(b + a, Cost::infinity());
     }
 
     #[test]
     fn op_cost_saturates_to_infinity() {
-        let a = Cost::new(Cost::MAX_OP_COST - 10, 2);
-        let b = Cost::new(11, 2);
+        let a = Cost::new(u32::MAX - 10);
+        let b = Cost::new(11);
         assert_eq!(a + b, Cost::infinity());
         assert_eq!(b + a, Cost::infinity());
     }
-
-    #[test]
-    fn depth_saturates_to_max_depth() {
-        let a = Cost::new(10, u8::MAX);
-        let b = Cost::new(10, 1);
-        assert_eq!(
-            Cost::of_pure_op(Opcode::Iconst, [a, b]),
-            Cost::new(21, u8::MAX)
-        );
-        assert_eq!(
-            Cost::of_pure_op(Opcode::Iconst, [b, a]),
-            Cost::new(21, u8::MAX)
-        );
-    }
 }