# Patch summary (text before the first "diff --git" header is not part of any hunk).
#
# mteb/models/overview.py
#   Adds the name `ua_sentence_models` to two comma-separated name lists.
#   Presumably these are the package import list and the model-module
#   registry; the enclosing statements are outside the hunks -- TODO confirm.
#   NOTE(review): the first hunk inserts the name between `text2vec_models`
#   and `uae_models`; the second inserts it between `ru_sentence_models` and
#   `salesforce_models`, whose visible neighbours are otherwise alphabetical.
#   If that list is meant to stay sorted, the entry belongs next to
#   `uae_models` instead -- verify against the full file.
#
# mteb/models/ua_sentence_models.py (new file, 31 lines)
#   Defines `xlm_roberta_ua_distilled`, a `ModelMeta` record for
#   "panalexeu/xlm-roberta-ua-distilled" (languages eng-Latn and ukr-Cyrl,
#   adapted from "FacebookAI/xlm-roberta-base"). `training_datasets` is an
#   empty dict; the three parallel-sentences datasets are listed only as
#   commented-out entries.
#
# NOTE(review): leading indentation of context/added lines was reconstructed
# (4 spaces for list entries and keyword arguments, 8 for the commented dict
# entries) -- confirm against the target files before applying.
diff --git a/mteb/models/overview.py b/mteb/models/overview.py
index 3e4ce485ad..223aff87f4 100644
--- a/mteb/models/overview.py
+++ b/mteb/models/overview.py
@@ -76,6 +76,7 @@
     sonar_models,
     stella_models,
     text2vec_models,
+    ua_sentence_models,
     uae_models,
     vdr_models,
     vista_models,
@@ -140,6 +141,7 @@
     rerankers_monot5_based,
     richinfoai_models,
     ru_sentence_models,
+    ua_sentence_models,
     salesforce_models,
     searchmap_models,
     sentence_transformers_models,
diff --git a/mteb/models/ua_sentence_models.py b/mteb/models/ua_sentence_models.py
new file mode 100644
index 0000000000..dd23160f77
--- /dev/null
+++ b/mteb/models/ua_sentence_models.py
@@ -0,0 +1,31 @@
+"""Sentence models for evaluation on the Ukrainian part of MTEB"""
+
+from __future__ import annotations
+
+from mteb.model_meta import ModelMeta
+
+xlm_roberta_ua_distilled = ModelMeta(
+    name="panalexeu/xlm-roberta-ua-distilled",
+    n_parameters=278_000_000,
+    memory_usage_mb=1061,
+    max_tokens=512,
+    embed_dim=768,
+    revision="9216f50d76b032350ca312246fa2f5dcaa6ca971",
+    release_date="2025-04-15",
+    license="mit",
+    open_weights=True,
+    public_training_code="https://github.com/panalexeu/xlm-roberta-ua-distilled/blob/main/researches/research_final.ipynb",
+    similarity_fn_name="cosine",
+    framework=["Sentence Transformers"],
+    reference="https://github.com/panalexeu/xlm-roberta-ua-distilled/tree/main",
+    languages=["eng-Latn", "ukr-Cyrl"],
+    training_datasets={
+        # "sentence-transformers/parallel-sentences-talks": ["train"],
+        # "sentence-transformers/parallel-sentences-wikimatrix": ["train"],
+        # "sentence-transformers/parallel-sentences-tatoeba": ["train"],
+    },
+    adapted_from="FacebookAI/xlm-roberta-base",
+    modalities=["text"],
+    public_training_data=None,
+    use_instructions=False,
+)