WebAssembly · kripken · Jul 16, 2025 · Jul 17, 2025 · tlively · Jul 17, 2025
diff --git a/src/ir/metadata.cpp b/src/ir/metadata.cpp
@@ -105,20 +105,25 @@ bool equal(Function* a, Function* b) {
     return false;
   }
 
+  return equal(a->body, b->body, a, b);
+}
+
+bool equal(Expression* a, Expression* b, Function* aFunc, Function* bFunc) {
+  assert(aFunc && bFunc);
+
   // TODO: We do not consider debug locations here. This is often what is
   //       desired in optimized builds (e.g. if we are trying to fold two
   //       pieces of code together, that benefit outweighs slightly inaccurate
   //       debug info). If we find that non-optimizer locations call this in
   //       ways that lead to degraded debug info, we could add an option to
   //       control it.
-
-  if (a->codeAnnotations.empty() && b->codeAnnotations.empty()) {
+  if (aFunc->codeAnnotations.empty() && bFunc->codeAnnotations.empty()) {
     // Nothing to compare; no differences.
     return true;
   }
 
-  Serializer aList(a->body);
-  Serializer bList(b->body);
+  Serializer aList(a);
+  Serializer bList(b);
 
   if (aList.list.size() != bList.list.size()) {
     return false;
@@ -128,8 +133,8 @@ bool equal(Function* a, Function* b) {
   for (Index i = 0; i < aList.list.size(); i++) {
     if (!compare(aList.list[i],
                  bList.list[i],
-                 a->codeAnnotations,
-                 b->codeAnnotations,
+                 aFunc->codeAnnotations,
+                 bFunc->codeAnnotations,
                  Function::CodeAnnotation())) {
       return false;
     }

diff --git a/src/ir/metadata.h b/src/ir/metadata.h
@@ -35,6 +35,10 @@ void copyBetweenFunctions(Expression* origin,
 // after all else is known equal).
 bool equal(Function* a, Function* b);
 
+// Check if two expressions are equal in metadata. They may or may not be from
+// the same function. Both aFunc and bFunc must be non-null.
+bool equal(Expression* a, Expression* b, Function* aFunc, Function* bFunc);
+
 } // namespace wasm::metadata
 
 #endif // wasm_ir_metadata_h
diff --git a/src/ir/utils.h b/src/ir/utils.h
@@ -18,6 +18,7 @@
 #define wasm_ir_utils_h
 
 #include "ir/branch-utils.h"
+#include "ir/metadata.h"
 #include "pass.h"
 #include "wasm-builder.h"
 #include "wasm-traversal.h"
@@ -69,6 +70,21 @@ struct ExpressionAnalyzer {
     return flexibleEqual(left, right, comparer);
   }
 
+  // Compare two expressions and their metadata as well. leftFunc must be
+  // non-null; if rightFunc is omitted, both are assumed to come from leftFunc.
+  static bool equalIncludingMetadata(Expression* left,
+                                     Expression* right,
+                                     Function* leftFunc = nullptr,
+                                     Function* rightFunc = nullptr) {
+    if (!equal(left, right)) {
+      return false;
+    }
+    if (!rightFunc) {
+      rightFunc = leftFunc;
+    }
+    return metadata::equal(left, right, leftFunc, rightFunc);
+  }
+
   // A shallow comparison, ignoring child nodes.
   static bool shallowEqual(Expression* left, Expression* right) {
     auto comparer = [left, right](Expression* currLeft, Expression* currRight) {

diff --git a/src/passes/CodeFolding.cpp b/src/passes/CodeFolding.cpp
@@ -249,8 +249,8 @@ struct CodeFolding
     // run the rest of the optimization mormally.
     auto maybeAddBlock = [this](Block* block, Expression*& other) -> Block* {
       // If other is a suffix of the block, wrap it in a block.
-      if (block->list.empty() ||
-          !ExpressionAnalyzer::equal(other, block->list.back())) {
+      if (block->list.empty() || !ExpressionAnalyzer::equalIncludingMetadata(
+                                   other, block->list.back(), getFunction())) {
         return nullptr;
       }
       // Do it, assign to the out param `other`, and return the block.
@@ -395,7 +395,8 @@ struct CodeFolding
       Index tail = 1;
       for (; tail < tails.size(); ++tail) {
         auto* other = getMergeable(tails[tail], num);
-        if (!other || !ExpressionAnalyzer::equal(item, other)) {
+        if (!other || !ExpressionAnalyzer::equalIncludingMetadata(
+                        item, other, getFunction())) {
           // Other tail too short or has a difference.
           break;
         }
@@ -673,7 +674,8 @@ struct CodeFolding
                            [&](Expression* item) {
                              if (item ==
                                    first || // don't bother comparing the first
-                                 ExpressionAnalyzer::equal(item, first)) {
+                                 ExpressionAnalyzer::equalIncludingMetadata(
+                                   item, first, getFunction())) {
                                // equal, keep it
                                return false;
                              } else {
@@ -691,8 +693,9 @@ struct CodeFolding
                                          explore.end(),
                                          [&](Tail& tail) {
                                            auto* item = getItem(tail, num);
-                                           return !ExpressionAnalyzer::equal(
-                                             item, correct);
+                                           return !ExpressionAnalyzer::
+                                             equalIncludingMetadata(
+                                               item, correct, getFunction());
                                          }),
                           explore.end());
             // try to optimize this deeper tail. if we succeed, then stop here,

diff --git a/src/passes/LocalCSE.cpp b/src/passes/LocalCSE.cpp
@@ -157,6 +157,11 @@ struct HEComparer {
     if (a.digest != b.digest) {
       return false;
     }
+    // Note that we do not consider metadata here. That means we may replace two
+    // identical expressions with different metadata, say, different branch
+    // hints, but that is ok: we are only removing things from executing (by
+    // reusing the first computed value), so this will not cause new invalid
+    // branch hints to execute.
     return ExpressionAnalyzer::equal(a.expr, b.expr);
   }
 };

diff --git a/src/passes/OptimizeInstructions.cpp b/src/passes/OptimizeInstructions.cpp
@@ -1168,16 +1168,18 @@ struct OptimizeInstructions
   void visitIf(If* curr) {
     curr->condition = optimizeBoolean(curr->condition);
     if (curr->ifFalse) {
+      auto* func = getFunction();
       if (auto* unary = curr->condition->dynCast<Unary>()) {
         if (unary->op == EqZInt32) {
           // flip if-else arms to get rid of an eqz
           curr->condition = unary->value;
           std::swap(curr->ifTrue, curr->ifFalse);
-          BranchHints::flip(curr, getFunction());
+          BranchHints::flip(curr, func);
         }
       }
       if (curr->condition->type != Type::unreachable &&
-          ExpressionAnalyzer::equal(curr->ifTrue, curr->ifFalse)) {
+          ExpressionAnalyzer::equalIncludingMetadata(
+            curr->ifTrue, curr->ifFalse, func)) {
         // The sides are identical, so fold. If we can replace the If with one
         // arm and there are no side effects in the condition, replace it. But
         // make sure not to change a concrete expression to an unreachable
@@ -3235,8 +3237,12 @@ struct OptimizeInstructions
       }
     }
     {
-      // Sides are identical, fold
+      // If sides are identical, fold.
       Expression *ifTrue, *ifFalse, *c;
+      // Note we do not compare metadata here: This is a select, so both arms
+      // execute anyhow, and things like branch hints were already being run.
+      // After optimization, we will only run fewer things, and run no risk of
+      // running new bad things.
       if (matches(curr, select(any(&ifTrue), any(&ifFalse), any(&c))) &&
           ExpressionAnalyzer::equal(ifTrue, ifFalse)) {
         auto value = effects(ifTrue);

diff --git a/test/lit/passes/code-folding_branch-hints.wast b/test/lit/passes/code-folding_branch-hints.wast
@@ -0,0 +1,107 @@
+;; NOTE: Assertions have been generated by update_lit_checks.py --all-items and should not be edited.
+;; NOTE: This test was ported using port_passes_tests_to_lit.py and could be cleaned up.
+
+;; RUN: wasm-opt %s -all --code-folding -S -o - | filecheck %s
+
+(module
+ ;; CHECK:      (type $0 (func (param i32 i32) (result f32)))
+
+ ;; CHECK:      (func $different (type $0) (param $x i32) (param $y i32) (result f32)
+ ;; CHECK-NEXT:  (if
+ ;; CHECK-NEXT:   (local.get $x)
+ ;; CHECK-NEXT:   (then
+ ;; CHECK-NEXT:    (@metadata.code.branch_hint "\00")
+ ;; CHECK-NEXT:    (if
+ ;; CHECK-NEXT:     (local.get $y)
+ ;; CHECK-NEXT:     (then
+ ;; CHECK-NEXT:      (nop)
+ ;; CHECK-NEXT:     )
+ ;; CHECK-NEXT:    )
+ ;; CHECK-NEXT:   )
+ ;; CHECK-NEXT:   (else
+ ;; CHECK-NEXT:    (@metadata.code.branch_hint "\01")
+ ;; CHECK-NEXT:    (if
+ ;; CHECK-NEXT:     (local.get $y)
+ ;; CHECK-NEXT:     (then
+ ;; CHECK-NEXT:      (nop)
+ ;; CHECK-NEXT:     )
+ ;; CHECK-NEXT:    )
+ ;; CHECK-NEXT:   )
+ ;; CHECK-NEXT:  )
+ ;; CHECK-NEXT:  (f32.const 0)
+ ;; CHECK-NEXT: )
+ (func $different (param $x i32) (param $y i32) (result f32)
+  ;; The branch hints differ, so only the trailing f32.const is folded out.
+  (if (result f32)
+   (local.get $x)
+   (then
+    (block (result f32)
+     (@metadata.code.branch_hint "\00")
+     (if
+      (local.get $y)
+      (then
+       (nop)
+      )
+     )
+     (f32.const 0)
+    )
+   )
+   (else
+    (block (result f32)
+     (@metadata.code.branch_hint "\01")
+     (if
+      (local.get $y)
+      (then
+       (nop)
+      )
+     )
+     (f32.const 0)
+    )
+   )
+  )
+ )
+
+ ;; CHECK:      (func $same (type $0) (param $x i32) (param $y i32) (result f32)
+ ;; CHECK-NEXT:  (drop
+ ;; CHECK-NEXT:   (local.get $x)
+ ;; CHECK-NEXT:  )
+ ;; CHECK-NEXT:  (@metadata.code.branch_hint "\00")
+ ;; CHECK-NEXT:  (if
+ ;; CHECK-NEXT:   (local.get $y)
+ ;; CHECK-NEXT:   (then
+ ;; CHECK-NEXT:    (nop)
+ ;; CHECK-NEXT:   )
+ ;; CHECK-NEXT:  )
+ ;; CHECK-NEXT:  (f32.const 0)
+ ;; CHECK-NEXT: )
+ (func $same (param $x i32) (param $y i32) (result f32)
+  ;; The branch hints are the same, so the arms fold into a single hinted if.
+  (if (result f32)
+   (local.get $x)
+   (then
+    (block (result f32)
+     (@metadata.code.branch_hint "\00")
+     (if
+      (local.get $y)
+      (then
+       (nop)
+      )
+     )
+     (f32.const 0)
+    )
+   )
+   (else
+    (block (result f32)
+     (@metadata.code.branch_hint "\00")
+     (if
+      (local.get $y)
+      (then
+       (nop)
+      )
+     )
+     (f32.const 0)
+    )
+   )
+  )
+ )
+)