diff --git a/vllm/model_executor/models/minicpm.py b/vllm/model_executor/models/minicpm.py index a05be794a29c..8f7b8b21b561 100644 --- a/vllm/model_executor/models/minicpm.py +++ b/vllm/model_executor/models/minicpm.py @@ -300,10 +300,7 @@ def forward( ) -> torch.Tensor: qkv, _ = self.qkv_proj(hidden_states) q, k, v = qkv.split([self.q_size, self.kv_size, self.kv_size], dim=-1) - orig_dtype = q.dtype - q, k = q.float(), k.float() q, k = self.rotary_emb(positions, q, k) - q, k = q.to(orig_dtype), k.to(orig_dtype) attn_output = self.attn(q, k, v) output, _ = self.o_proj(attn_output) return output