From ad7f5abfab99c60bc999a80eeb1ecab1a2e32a45 Mon Sep 17 00:00:00 2001
From: Joao Gante
Date: Mon, 13 May 2024 12:47:29 +0000
Subject: [PATCH] qwen does not support the new cache classes

---
 src/transformers/models/qwen2/modeling_qwen2.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/src/transformers/models/qwen2/modeling_qwen2.py b/src/transformers/models/qwen2/modeling_qwen2.py
index b5a1370ae1fc..709504aba715 100644
--- a/src/transformers/models/qwen2/modeling_qwen2.py
+++ b/src/transformers/models/qwen2/modeling_qwen2.py
@@ -821,7 +821,6 @@ class Qwen2PreTrainedModel(PreTrainedModel):
     _skip_keys_device_placement = "past_key_values"
     _supports_flash_attn_2 = True
     _supports_sdpa = True
-    _supports_cache_class = True
 
     def _init_weights(self, module):
         std = self.config.initializer_range