We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent fd4d6b4, commit ccbfb6e (Copy full SHA for ccbfb6e)
examples/python/run_llama_batched_vllm.py
@@ -277,7 +277,7 @@ def _prepare_eval_queries(
277
if sliding_window:
278
seq_lens.append(min(num_past_tokens + num_queries, sliding_window))
279
num_past = min(num_past_tokens, sliding_window)
280
- past_slot_mapping += all_slot_mappings[request_id][num_past:]
+ past_slot_mapping += all_slot_mappings[request_id][:num_past]
281
slot_mapping += all_slot_mappings[request_id][num_past: num_past + num_queries]
282
else:
283
seq_lens.append(num_past_tokens + num_queries)
0 commit comments