diff --git a/vllm/model_executor/models/hunyuan_vision.py b/vllm/model_executor/models/hunyuan_vision.py index 6fc56094af65..cb3e2654cb31 100644 --- a/vllm/model_executor/models/hunyuan_vision.py +++ b/vllm/model_executor/models/hunyuan_vision.py @@ -247,6 +247,12 @@ def forward( qkv, _ = self.qkv(x) q, k, v = qkv.chunk(3, dim=-1) out = self.attn(q, k, v) + out = out.view( + x.size(0), + -1, + self.num_attention_heads_per_partition + * self.hidden_size_per_attention_head, + ) output, _ = self.o_proj(out) return output