def apply_customized_rope(q, k, cos, sin, position_ids):
    """Apply rotary position embeddings to ``q`` and ``k``.

    The fused kernel is used only when ``q`` lives on an ``"hpu"`` device and
    ``FusedRoPE`` is truthy; in every other case the call is delegated
    to ``apply_rotary_pos_emb``.

    Args:
        q: Query input; its ``device.type`` selects the code path.
        k: Key input, processed with the same ``cos``/``sin``/``position_ids``.
        cos: Cosine table forwarded to the rotary implementation.
        sin: Sine table forwarded to the rotary implementation.
        position_ids: Position indices forwarded to the rotary implementation.

    Returns:
        On the fused path, a 2-tuple ``(result_for_q, result_for_k)``.
        Otherwise, whatever ``apply_rotary_pos_emb`` returns (presumably the
        same kind of pair -- confirm against its definition).
    """
    # Fallback first: not on HPU, or the fused kernel is not available.
    if q.device.type != "hpu" or not FusedRoPE:
        return apply_rotary_pos_emb(q, k, cos, sin, position_ids)

    # TODO: remove `.clone()` when SynapseAI v1.15 is released
    # Each fused call gets its own fresh copies of cos/sin (temporary workaround).
    rotated_q = FusedRoPE.apply(q, cos.clone(), sin.clone(), position_ids)
    rotated_k = FusedRoPE.apply(k, cos.clone(), sin.clone(), position_ids)
    return rotated_q, rotated_k