diff --git a/optimum/habana/transformers/models/deepseek_v3/modeling_deepseek_v3.py b/optimum/habana/transformers/models/deepseek_v3/modeling_deepseek_v3.py index fb7751545a..4c9314f810 100644 --- a/optimum/habana/transformers/models/deepseek_v3/modeling_deepseek_v3.py +++ b/optimum/habana/transformers/models/deepseek_v3/modeling_deepseek_v3.py @@ -1692,7 +1692,6 @@ def forward( hidden_states = outputs[0] logits = self.lm_head(hidden_states) - logits = logits.float() loss = None if labels is not None: