# Patch summary (free text preceding the first `diff --git` header).
#
# Target file: mteb/models/ru_sentence_models.py
#
# Hunk 1 adds the `rubert_mini_frida` ModelMeta entry
#   (name "sergeyzh/rubert-mini-frida", adapted_from "sergeyzh/rubert-mini-sts"),
#   inserted immediately before the existing `labse_ru_turbo` entry.
# Hunk 2 adds the `berta` ModelMeta entry
#   (name "sergeyzh/BERTA", adapted_from "sergeyzh/LaBSE-ru-turbo"),
#   inserted immediately before the existing `rosberta_prompts` dict.
#
# In both entries `training_datasets` is an empty dict literal; the dataset
# URLs inside the braces are Python comments only, so they carry no runtime value.
#
# NOTE(review): line breaks and indentation were reconstructed from a
#   whitespace-collapsed copy of this patch. The layout matches both hunk
#   headers (6 old lines / 32 new lines each), but verify against the upstream
#   commit before applying.
# NOTE(review): both entries set use_instructions=True, yet no loader or prompt
#   configuration is visible in these hunks -- confirm whether the rest of the
#   file or ModelMeta's defaults supply it.
# NOTE(review): keyword order differs between the two entries (`berta` places
#   training_datasets before public_training_code and adapted_from before
#   public_training_data); this looks cosmetic only, since all arguments are
#   passed by keyword.
diff --git a/mteb/models/ru_sentence_models.py b/mteb/models/ru_sentence_models.py
index 905fb6550a..c3c63d5461 100644
--- a/mteb/models/ru_sentence_models.py
+++ b/mteb/models/ru_sentence_models.py
@@ -357,6 +357,32 @@
     adapted_from="cointegrated/rubert-tiny2",
 )
 
+rubert_mini_frida = ModelMeta(
+    name="sergeyzh/rubert-mini-frida",
+    languages=["rus_Cyrl"],
+    open_weights=True,
+    revision="19b279b78afd945b5ccae78f63e284909814adc2",
+    release_date="2025-03-02",
+    n_parameters=32_300_000,
+    memory_usage_mb=123,
+    embed_dim=312,
+    license="mit",
+    max_tokens=2048,
+    reference="https://huggingface.co/sergeyzh/rubert-mini-frida",
+    similarity_fn_name="cosine",
+    framework=["Sentence Transformers", "PyTorch"],
+    use_instructions=True,
+    public_training_code=None,
+    public_training_data=None,
+    training_datasets={
+        # https://huggingface.co/datasets/IlyaGusev/gazeta
+        # https://huggingface.co/datasets/zloelias/lenta-ru
+        # https://huggingface.co/datasets/HuggingFaceFW/fineweb-2
+        # https://huggingface.co/datasets/HuggingFaceFW/fineweb
+    },
+    adapted_from="sergeyzh/rubert-mini-sts",
+)
+
 labse_ru_turbo = ModelMeta(
     name="sergeyzh/LaBSE-ru-turbo",
     languages=["rus_Cyrl"],
@@ -378,6 +404,32 @@
     public_training_data=None,
 )
 
+berta = ModelMeta(
+    name="sergeyzh/BERTA",
+    languages=["rus_Cyrl"],
+    open_weights=True,
+    revision="914c8c8aed14042ed890fc2c662d5e9e66b2faa7",
+    release_date="2025-03-10",
+    n_parameters=128_000_000,
+    memory_usage_mb=489,
+    embed_dim=768,
+    license="mit",
+    max_tokens=512,
+    reference="https://huggingface.co/sergeyzh/BERTA",
+    similarity_fn_name="cosine",
+    framework=["Sentence Transformers", "PyTorch"],
+    use_instructions=True,
+    training_datasets={
+        # https://huggingface.co/datasets/IlyaGusev/gazeta
+        # https://huggingface.co/datasets/zloelias/lenta-ru
+        # https://huggingface.co/datasets/HuggingFaceFW/fineweb-2
+        # https://huggingface.co/datasets/HuggingFaceFW/fineweb
+    },
+    public_training_code=None,
+    adapted_from="sergeyzh/LaBSE-ru-turbo",
+    public_training_data=None,
+)
+
 rosberta_prompts = {
     # Default
     "Classification": "classification: ",