vllm-project · jikunshang · Apr 8, 2026 · Apr 8, 2026 · Copilot · Apr 8, 2026
diff --git a/tests/fused_moe/test_remap_hidden_states.py b/tests/fused_moe/test_remap_hidden_states.py
@@ -211,10 +211,19 @@ def test_remap_hidden_states(num_rows, hidden_size, total_experts_num, topk,
         if unpermuted_scales.dtype is torch.float8_e8m0fnu:
             unpermuted_scales = unpermuted_scales.view(torch.uint8)
             ref_unpermuted_scales = ref_unpermuted_scales.view(torch.uint8)
-        torch.testing.assert_close(unpermuted_scales,
-                                   ref_unpermuted_scales,
-                                   rtol=0,
-                                   atol=0)
+        try:
+            torch.testing.assert_close(unpermuted_scales,
+                                       ref_unpermuted_scales,
+                                       rtol=0,
+                                       atol=0,
+                                       equal_nan=True)
+        except AssertionError:
+            # Fp8block may fails on g31 CI
-            # Fp8block may fails on g31 CI
+            # fp8block may fail on g31 CI
-            # Fp8block may fails on g31 CI
+            # fp8block may fail on g31 CI
+            mismatched_indices = torch.nonzero(
+                unpermuted_scales != ref_unpermuted_scales)
+            print("Mismatched scales at indices:", mismatched_indices)
+            print("Mismatched scales:", unpermuted_scales[mismatched_indices])
+            print("Mismatched ref:", ref_unpermuted_scales[mismatched_indices])
-        except AssertionError:
-            # Fp8block may fails on g31 CI
-            mismatched_indices = torch.nonzero(
-                unpermuted_scales != ref_unpermuted_scales)
-            print("Mismatched scales at indices:", mismatched_indices)
-            print("Mismatched scales:", unpermuted_scales[mismatched_indices])
-            print("Mismatched ref:", ref_unpermuted_scales[mismatched_indices])
+        except AssertionError as exc:
+            # Log mismatch details for debugging, but do not hide failures.
+            mismatched_indices = torch.nonzero(
+                unpermuted_scales != ref_unpermuted_scales)
+            print("Mismatched scales at indices:", mismatched_indices)
+            print("Mismatched scales:", unpermuted_scales[mismatched_indices])
+            print("Mismatched ref:", ref_unpermuted_scales[mismatched_indices])
+            raise exc
-            mismatched_indices = torch.nonzero(
-                unpermuted_scales != ref_unpermuted_scales)
-            print("Mismatched scales at indices:", mismatched_indices)
-            print("Mismatched scales:", unpermuted_scales[mismatched_indices])
-            print("Mismatched ref:", ref_unpermuted_scales[mismatched_indices])
+            mismatch_mask = unpermuted_scales != ref_unpermuted_scales
+            mismatched_indices = torch.nonzero(mismatch_mask, as_tuple=False)
+            max_mismatches_to_print = 20
+            mismatched_indices = mismatched_indices[:max_mismatches_to_print]
+            print("Mismatched scales at indices:", mismatched_indices)
+            if mismatched_indices.numel() > 0:
+                mismatch_index_tuple = tuple(mismatched_indices[:, dim]
+                                             for dim in range(
+                                                 mismatched_indices.shape[1]))
+                print("Mismatched scales:",
+                      unpermuted_scales[mismatch_index_tuple])
+                print("Mismatched ref:",
+                      ref_unpermuted_scales[mismatch_index_tuple])
-        except AssertionError:
-            # Fp8block may fails on g31 CI
-            mismatched_indices = torch.nonzero(
-                unpermuted_scales != ref_unpermuted_scales)
-            print("Mismatched scales at indices:", mismatched_indices)
-            print("Mismatched scales:", unpermuted_scales[mismatched_indices])
-            print("Mismatched ref:", ref_unpermuted_scales[mismatched_indices])
+        except AssertionError as exc:
+            # Log mismatch details for debugging, but do not hide failures.
+            mismatched_indices = torch.nonzero(
+                unpermuted_scales != ref_unpermuted_scales)
+            print("Mismatched scales at indices:", mismatched_indices)
+            print("Mismatched scales:", unpermuted_scales[mismatched_indices])
+            print("Mismatched ref:", ref_unpermuted_scales[mismatched_indices])
+            raise exc
-            mismatched_indices = torch.nonzero(
-                unpermuted_scales != ref_unpermuted_scales)
-            print("Mismatched scales at indices:", mismatched_indices)
-            print("Mismatched scales:", unpermuted_scales[mismatched_indices])
-            print("Mismatched ref:", ref_unpermuted_scales[mismatched_indices])
+            mismatch_mask = unpermuted_scales != ref_unpermuted_scales
+            mismatched_indices = torch.nonzero(mismatch_mask, as_tuple=False)
+            max_mismatches_to_print = 20
+            mismatched_indices = mismatched_indices[:max_mismatches_to_print]
+            print("Mismatched scales at indices:", mismatched_indices)
+            if mismatched_indices.numel() > 0:
+                mismatch_index_tuple = tuple(mismatched_indices[:, dim]
+                                             for dim in range(
+                                                 mismatched_indices.shape[1]))
+                print("Mismatched scales:",
+                      unpermuted_scales[mismatch_index_tuple])
+                print("Mismatched ref:",
+                      ref_unpermuted_scales[mismatch_index_tuple])
 
 
 def ref_init_expert_map(expert_map, local_experts_num, ep_rank, ep_size):