Fix missing args: pass apply_router_weight_on_input through in fused_marlin_moe apply()

luccafong · luccafong · commit 60c880bcf77e · 2025-11-12T10:35:13.000-08:00
Signed-off-by: Lu Fang <fanglu@fb.com>
diff --git a/vllm/model_executor/layers/fused_moe/fused_marlin_moe.py b/vllm/model_executor/layers/fused_moe/fused_marlin_moe.py
@@ -731,6 +731,7 @@ def apply(
                 if self.quant_config.use_int4_w4a16
                 else scalar_types.float4_e2m1f.id
             ),  # works only for w4a16
+            apply_router_weight_on_input=apply_router_weight_on_input,
             global_num_experts=global_num_experts,
             activation=activation,
             expert_map=expert_map,