File tree: 1 file changed, +2 -2 lines changed
vllm/v1/attention/backends: 1 file changed, +2 -2 lines changed
Original file line number | Diff line number | Diff line change
@@ -729,7 +729,7 @@ def forward(
729729 cu_seqlens_k = attn_metadata .prefill_metadata .query_start_loc ,
730730 max_seqlen_q = attn_metadata .prefill_metadata .max_query_len ,
731731 max_seqlen_k = attn_metadata .prefill_metadata .max_seq_len ,
732- min_seqlen_q = 1 ,
732+ min_seqlen_q = attn_metadata . prefill_metadata . min_query_len ,
733733 dropout_p = 0.0 ,
734734 softmax_scale = self .scale ,
735735 causal = True ,
@@ -759,7 +759,7 @@ def forward(
759759 cu_seqlens_q = attn_metadata .extend_metadata .query_start_loc ,
760760 max_seqlen_q = attn_metadata .extend_metadata .max_query_len ,
761761 max_seqlen_k = attn_metadata .extend_metadata .max_seq_len ,
762- min_seqlen_q = 1 ,
762+ min_seqlen_q = attn_metadata . extend_metadata . min_query_len ,
763763 block_table = attn_metadata .block_table [
764764 num_decodes : num_decodes + num_extends
765765 ],
You can’t perform that action at this time.
0 commit comments