# Review notes. These lines sit ahead of the first `diff --git` header, so
# patch tools that skip leading text should ignore them (confirm with your tool).
#
# What the hunk changes in vllm/_aiter_ops.py:
#   * is_fp4bmm_enabled: previously returned
#       cls._AITER_ENABLED and cls._FP4BMM_ENABLED
#     and now additionally requires on_gfx950() as the last `and` operand.
#   * is_asm_fp4_gemm_dynamic_quant_enabled: previously returned
#       cls._AITER_ENABLED and cls._FP4_GEMM_DYNAMIC_QUANT_ASM
#     and now additionally requires on_gfx950() as the last `and` operand.
#
# Evaluation order: `and` short-circuits, so on_gfx950() is only called when
# both class-level flags are truthy. The function-local import statement,
# however, executes on every call that reaches the method body.
#
# NOTE(review): on_gfx950 is imported inside each method rather than at module
# top level - presumably to avoid an import cycle or an eager import of
# vllm.platforms.rocm; confirm against the rest of the file.
# NOTE(review): on_gfx950 presumably reports whether the current device is a
# gfx950 part; its definition is not visible here - verify in
# vllm/platforms/rocm.py.
# NOTE(review): the effect of the @if_aiter_supported decorator is not visible
# in this hunk; it is unchanged context.
diff --git a/vllm/_aiter_ops.py b/vllm/_aiter_ops.py
index 3414443e52cb..8ef34bfd6dce 100644
--- a/vllm/_aiter_ops.py
+++ b/vllm/_aiter_ops.py
@@ -1052,12 +1052,16 @@ def is_fp8bmm_enabled(cls) -> bool:
     @classmethod
     @if_aiter_supported
     def is_fp4bmm_enabled(cls) -> bool:
-        return cls._AITER_ENABLED and cls._FP4BMM_ENABLED
+        from vllm.platforms.rocm import on_gfx950
+
+        return cls._AITER_ENABLED and cls._FP4BMM_ENABLED and on_gfx950()
 
     @classmethod
     @if_aiter_supported
     def is_asm_fp4_gemm_dynamic_quant_enabled(cls) -> bool:
-        return cls._AITER_ENABLED and cls._FP4_GEMM_DYNAMIC_QUANT_ASM
+        from vllm.platforms.rocm import on_gfx950
+
+        return cls._AITER_ENABLED and cls._FP4_GEMM_DYNAMIC_QUANT_ASM and on_gfx950()
 
     @classmethod
     @if_aiter_supported