Skip to content

Commit

Permalink
chore: support quantized loading
Browse files Browse the repository at this point in the history
  • Loading branch information
stillmatic committed Mar 5, 2024
1 parent 7600d8e commit 6e24ea3
Show file tree
Hide file tree
Showing 2 changed files with 4 additions and 4 deletions.
4 changes: 2 additions & 2 deletions gazelle/modeling_gazelle.py
Original file line number Diff line number Diff line change
Expand Up @@ -278,9 +278,9 @@ def forward(self, audio_features: torch.Tensor) -> torch.Tensor:
)
class GazellePreTrainedModel(PreTrainedModel):
config_class = GazelleConfig
- base_model_prefix = "model"
+ base_model_prefix = "gazelle"
supports_gradient_checkpointing = True
- _no_split_modules = ["GazelleAudioAttention"]
+ _no_split_modules = ["GazelleAudioAttention", "Wav2Vec2Model"]
_skip_keys_device_placement = "past_key_values"
_supports_flash_attn_2 = True

Expand Down
4 changes: 2 additions & 2 deletions pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -11,8 +11,8 @@ classifiers = ["License :: OSI Approved :: Apache Software License"]
dynamic = ["version", "description"]
dependencies = [
"transformers>=4.37.0",
- "torch>=2.2",
- "torchaudio>=2.2",
+ "torch>=2.1",
+ "torchaudio>=2.1",
"sentencepiece",
]

Expand Down

0 comments on commit 6e24ea3

Please sign in to comment.