diff --git a/vllm/model_executor/models/granite4_vision.py b/vllm/model_executor/models/granite4_vision.py index 147f02eced97..710fc94ee5f8 100644 --- a/vllm/model_executor/models/granite4_vision.py +++ b/vllm/model_executor/models/granite4_vision.py @@ -887,9 +887,10 @@ def forward( and get_pp_group().is_first_rank and self._ds_layer_indices ): + n = inputs_embeds.size(0) ds: IntermediateTensors | None = IntermediateTensors( { - f"ds_{llm_layer}": self._ds_buffers[lvl] + f"ds_{llm_layer}": self._ds_buffers[lvl][:n] for lvl, llm_layer in enumerate(self._ds_layer_indices) } )