1 change: 1 addition & 0 deletions vllm/model_executor/layers/fused_moe/fused_moe.py
@@ -1217,6 +1217,7 @@ def should_moe_wna16_use_cuda(
 ):
     return (
         current_platform.is_cuda()
+        and not current_platform.is_rocm()
Comment on lines 1219 to +1220
Contributor
Severity: high

To make the platform check more direct and robust against potential inconsistencies in is_cuda() behavior across environments, consider using current_platform.device_name == 'cuda'. This directly checks for the CUDA platform and is less prone to misinterpretation.

Suggested change:
-        current_platform.is_cuda()
-        and not current_platform.is_rocm()
+        current_platform.device_name == "cuda"

and bit == 4
and group_size in [32, 64, 128]
and num_valid_tokens / num_experts <= 6
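Taken together, the guard after this change can be sketched as a standalone function. This is a minimal sketch for illustration only: `PlatformStub` stands in for `vllm.platforms.current_platform`, and the parameter order shown is illustrative rather than vLLM's exact signature.

```python
class PlatformStub:
    """Stand-in for vllm.platforms.current_platform (assumption for this sketch)."""

    def __init__(self, cuda: bool, rocm: bool):
        self._cuda = cuda
        self._rocm = rocm

    def is_cuda(self) -> bool:
        # The PR guards against environments where is_cuda() may report True
        # on a ROCm build, which is why the explicit is_rocm() check is added.
        return self._cuda

    def is_rocm(self) -> bool:
        return self._rocm


def should_moe_wna16_use_cuda(current_platform, bit, group_size,
                              num_valid_tokens, num_experts):
    # Mirrors the condition in the diff: CUDA but not ROCm, 4-bit weights,
    # a supported group size, and a low tokens-per-expert ratio.
    return (
        current_platform.is_cuda()
        and not current_platform.is_rocm()
        and bit == 4
        and group_size in [32, 64, 128]
        and num_valid_tokens / num_experts <= 6
    )
```

With this guard, a ROCm platform is excluded even if its `is_cuda()` were to report True, which is exactly the inconsistency the review comment above is concerned with.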
1 change: 1 addition & 0 deletions vllm/platforms/rocm.py
@@ -336,6 +336,7 @@ class RocmPlatform(Platform):
"petit_nvfp4",
"torchao",
"bitsandbytes",
+    "moe_wna16",
]

@classmethod
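The second hunk adds `"moe_wna16"` to `RocmPlatform`'s allowlist of quantization methods. A hedged sketch of how such an allowlist might be consulted is below; the names `SUPPORTED_QUANTIZATION` and `verify_quantization` are illustrative, not vLLM's exact API.

```python
# Illustrative allowlist mirroring the diff in vllm/platforms/rocm.py.
SUPPORTED_QUANTIZATION = [
    "petit_nvfp4",
    "torchao",
    "bitsandbytes",
    "moe_wna16",  # newly allowed on ROCm by this PR
]


def verify_quantization(method: str) -> None:
    # Fail fast if a model config requests a method this platform can't run.
    if method not in SUPPORTED_QUANTIZATION:
        raise ValueError(
            f"Quantization method {method!r} is not supported on ROCm.")
```

Without this hunk, a ROCm deployment requesting `moe_wna16` quantization would be rejected at startup even though the kernel-dispatch change in `fused_moe.py` already routes ROCm away from the CUDA-only path.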