diff --git a/vllm/model_executor/layers/fused_moe/oracle/fp8.py b/vllm/model_executor/layers/fused_moe/oracle/fp8.py index c7b012677331..85997468af9e 100644 --- a/vllm/model_executor/layers/fused_moe/oracle/fp8.py +++ b/vllm/model_executor/layers/fused_moe/oracle/fp8.py @@ -567,7 +567,7 @@ def make_fp8_moe_kernel( experts, shared_experts=( shared_experts - if moe_config.moe_parallel_config.use_all2all_kernels + if moe_config.moe_parallel_config.use_deepep_ll_kernels else None ), moe_parallel_config=moe_config.moe_parallel_config, diff --git a/vllm/model_executor/layers/fused_moe/oracle/nvfp4.py b/vllm/model_executor/layers/fused_moe/oracle/nvfp4.py index dd1a24d863de..b06cf49cfd81 100644 --- a/vllm/model_executor/layers/fused_moe/oracle/nvfp4.py +++ b/vllm/model_executor/layers/fused_moe/oracle/nvfp4.py @@ -433,7 +433,7 @@ def make_nvfp4_moe_kernel( experts, shared_experts=( shared_experts - if moe_config.moe_parallel_config.use_all2all_kernels + if moe_config.moe_parallel_config.use_deepep_ll_kernels else None ), moe_parallel_config=moe_config.moe_parallel_config,