diff --git a/vllm/model_executor/layers/quantization/gguf.py b/vllm/model_executor/layers/quantization/gguf.py index bcdfafb50fc5..a3c74e3b30d5 100644 --- a/vllm/model_executor/layers/quantization/gguf.py +++ b/vllm/model_executor/layers/quantization/gguf.py @@ -624,8 +624,8 @@ def apply( layer: FusedMoE, x: torch.Tensor, router_logits: torch.Tensor, - top_k: int, - renormalize: bool, + top_k: int = 0, + renormalize: bool = False, use_grouped_topk: bool = False, topk_group: int | None = None, num_expert_group: int | None = None,