We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 69279d2 · commit 94df2f1 · Copy full SHA for 94df2f1
vllm/v1/worker/gpu_model_runner.py
@@ -1447,7 +1447,7 @@ def execute_model(
1447
if envs.VLLM_COMPUTE_PADDED_LOGITS_INDICES:
1448
assert self.logits_indices is not None
1449
num_logits = logits_indices.shape[0]
1450
- assert num_logits > 0
+ assert num_logits > 0
1451
self.logits_indices[:num_logits].copy_(logits_indices)
1452
# Ensure we keep duplicates instead of zeros
1453
self.logits_indices[num_logits:].fill_(logits_indices[-1].item())
0 commit comments