# Patch summary (commentary only; this text sits before the first
# `diff --git` header and is not part of any hunk):
#   * mteb/custom_validators.py: adds the string "gemma" to the list that
#     already contains "msr-la-nc", "multiple" and "openrail".
#   * mteb/models/google_models.py: appends a new module-level
#     `embedding_gemma_300m = ModelMeta(...)` entry for
#     "google/embeddinggemma-300m"; it passes license="gemma", the same
#     string the first hunk adds.
# NOTE(review): the new ModelMeta(...) call passes no `loader=` argument;
#   confirm that whatever ModelMeta does without one is intended here.
# NOTE(review): training_datasets reuses GECKO_TRAINING_DATA, the same
#   constant used by the preceding entry in the file; confirm that it
#   describes this model's training data.
# NOTE(review): the leading whitespace of the hunk lines below was
#   reconstructed from conventional formatting; verify it against the
#   target files before applying the patch.
diff --git a/mteb/custom_validators.py b/mteb/custom_validators.py
index 6708c83577..7e72051047 100644
--- a/mteb/custom_validators.py
+++ b/mteb/custom_validators.py
@@ -47,6 +47,7 @@
         "msr-la-nc",
         "multiple",
         "openrail",
+        "gemma",
     ]
 )
 
diff --git a/mteb/models/google_models.py b/mteb/models/google_models.py
index 9636d1ded2..e69d2aa27d 100644
--- a/mteb/models/google_models.py
+++ b/mteb/models/google_models.py
@@ -237,3 +237,23 @@ def encode(
     public_training_data=None,
     training_datasets=GECKO_TRAINING_DATA,
 )
+
+embedding_gemma_300m = ModelMeta(
+    name="google/embeddinggemma-300m",
+    languages=MULTILINGUAL_EVALUATED_LANGUAGES,
+    open_weights=True,
+    revision="64614b0b8b64f0c6c1e52b07e4e9a4e8fe4d2da2",
+    release_date="2025-09-04",
+    n_parameters=307_581_696,
+    embed_dim=768,
+    max_tokens=2048,
+    license="gemma",
+    reference="https://ai.google.dev/gemma/docs/embeddinggemma/model_card",
+    framework=["Sentence Transformers", "PyTorch"],
+    use_instructions=True,
+    public_training_code=None,
+    public_training_data=None,
+    training_datasets=GECKO_TRAINING_DATA,
+    similarity_fn_name="cosine",
+    memory_usage_mb=578,
+)