Skip to content

Commit 95225ce

Browse files
committed
fix lint
Signed-off-by: Lu Fang <[email protected]>
1 parent 5a73a86 commit 95225ce

File tree

1 file changed

+3
-1
lines changed

1 file changed

+3
-1
lines changed

vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors_moe.py

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1606,8 +1606,10 @@ def select_gemm_impl(
1606 1606      prepare_finalize.activation_format
1607 1607      == mk.FusedMoEActivationFormat.BatchedExperts
1608 1608  ):
     1609 +    max_num_tokens_per_rank = prepare_finalize.max_num_tokens_per_rank()
     1610 +    assert max_num_tokens_per_rank is not None
1609 1611      return BatchedMarlinExperts(
1610      -        max_num_tokens=prepare_finalize.max_num_tokens_per_rank(),
     1612 +        max_num_tokens=max_num_tokens_per_rank,
1611 1613          num_dispatchers=prepare_finalize.num_dispatchers(),
1612 1614          quant_config=self.moe_quant_config,
1613 1615          w13_g_idx=layer.w13_weight_g_idx,

0 commit comments

Comments
 (0)