diff --git a/mteb/models/model_implementations/align_models.py b/mteb/models/model_implementations/align_models.py index 0dfdfe500c..3115d56bbc 100644 --- a/mteb/models/model_implementations/align_models.py +++ b/mteb/models/model_implementations/align_models.py @@ -116,6 +116,7 @@ def encode( release_date="2023-02-24", modalities=["image", "text"], n_parameters=176_000_000, + n_embedding_parameters=None, memory_usage_mb=671, max_tokens=64, embed_dim=768, diff --git a/mteb/models/model_implementations/amazon_models.py b/mteb/models/model_implementations/amazon_models.py index 4513655967..cd0e1af761 100644 --- a/mteb/models/model_implementations/amazon_models.py +++ b/mteb/models/model_implementations/amazon_models.py @@ -8,6 +8,7 @@ release_date="2024-04-30", languages=["eng-Latn"], n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=None, embed_dim=None, diff --git a/mteb/models/model_implementations/andersborges.py b/mteb/models/model_implementations/andersborges.py index 7fcbfce4d1..01d03d120f 100644 --- a/mteb/models/model_implementations/andersborges.py +++ b/mteb/models/model_implementations/andersborges.py @@ -12,6 +12,7 @@ revision="cb576c78dcc1b729e4612645f61db59929d69e61", release_date="2025-11-21", n_parameters=48042496, + n_embedding_parameters=None, memory_usage_mb=183, max_tokens=np.inf, embed_dim=256, @@ -43,6 +44,7 @@ revision="cb576c78dcc1b729e4612645f61db59929d69e61", release_date="2025-11-21", n_parameters=48578560, + n_embedding_parameters=None, memory_usage_mb=185, max_tokens=np.inf, embed_dim=256, diff --git a/mteb/models/model_implementations/ara_models.py b/mteb/models/model_implementations/ara_models.py index 7c39ab9801..3f001ce10a 100644 --- a/mteb/models/model_implementations/ara_models.py +++ b/mteb/models/model_implementations/ara_models.py @@ -10,6 +10,7 @@ revision="ed357f222f0b6ea6670d2c9b5a1cb93950d34200", release_date="2024-07-28", n_parameters=135_000_000, + n_embedding_parameters=49_152_000, 
memory_usage_mb=516, embed_dim=768, license="apache-2.0", diff --git a/mteb/models/model_implementations/arctic_models.py b/mteb/models/model_implementations/arctic_models.py index e9a96c22ee..0423e84818 100644 --- a/mteb/models/model_implementations/arctic_models.py +++ b/mteb/models/model_implementations/arctic_models.py @@ -147,6 +147,7 @@ open_weights=True, framework=["Sentence Transformers", "PyTorch", "ONNX", "safetensors"], n_parameters=22_600_000, + n_embedding_parameters=11_720_448, memory_usage_mb=86, max_tokens=512, embed_dim=384, @@ -173,6 +174,7 @@ open_weights=True, framework=["Sentence Transformers", "PyTorch", "ONNX", "safetensors"], n_parameters=32_200_000, + n_embedding_parameters=11_720_448, memory_usage_mb=127, max_tokens=512, embed_dim=384, @@ -199,6 +201,7 @@ open_weights=True, framework=["Sentence Transformers", "PyTorch", "ONNX", "safetensors"], n_parameters=109_000_000, + n_embedding_parameters=23_440_896, memory_usage_mb=415, max_tokens=512, embed_dim=768, @@ -225,6 +228,7 @@ open_weights=True, framework=["Sentence Transformers", "PyTorch", "ONNX", "safetensors"], n_parameters=137_000_000, + n_embedding_parameters=None, memory_usage_mb=522, max_tokens=2048, embed_dim=768, @@ -250,6 +254,7 @@ open_weights=True, framework=["Sentence Transformers", "PyTorch", "ONNX", "safetensors"], n_parameters=335_000_000, + n_embedding_parameters=31_254_528, memory_usage_mb=1274, max_tokens=512, embed_dim=1024, @@ -280,6 +285,7 @@ open_weights=True, framework=["Sentence Transformers", "PyTorch", "ONNX", "safetensors", "GGUF"], n_parameters=109_000_000, + n_embedding_parameters=23_440_896, memory_usage_mb=415, max_tokens=512, embed_dim=768, @@ -306,6 +312,7 @@ open_weights=True, framework=["Sentence Transformers", "PyTorch", "ONNX", "safetensors"], n_parameters=305_000_000, + n_embedding_parameters=None, memory_usage_mb=1165, max_tokens=8192, embed_dim=768, @@ -331,6 +338,7 @@ open_weights=True, framework=["Sentence Transformers", "PyTorch", "ONNX", 
"safetensors"], n_parameters=568_000_000, + n_embedding_parameters=256_002_048, memory_usage_mb=2166, max_tokens=8192, embed_dim=1024, diff --git a/mteb/models/model_implementations/b1ade_models.py b/mteb/models/model_implementations/b1ade_models.py index 621a109a08..3ff7d55e86 100644 --- a/mteb/models/model_implementations/b1ade_models.py +++ b/mteb/models/model_implementations/b1ade_models.py @@ -16,6 +16,7 @@ open_weights=True, release_date="2025-03-10", n_parameters=335_000_000, + n_embedding_parameters=31_254_528, memory_usage_mb=1278, embed_dim=1024, license="mit", diff --git a/mteb/models/model_implementations/bedrock_models.py b/mteb/models/model_implementations/bedrock_models.py index fd0022ec7a..064097a6d0 100644 --- a/mteb/models/model_implementations/bedrock_models.py +++ b/mteb/models/model_implementations/bedrock_models.py @@ -179,6 +179,7 @@ def _to_numpy(self, embedding_response) -> np.ndarray: embed_dim=1536, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, public_training_code=None, public_training_data=None, # assumed @@ -206,6 +207,7 @@ def _to_numpy(self, embedding_response) -> np.ndarray: embed_dim=1024, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, public_training_code=None, public_training_data=None, # assumed @@ -235,6 +237,7 @@ def _to_numpy(self, embedding_response) -> np.ndarray: revision="1", release_date="2023-11-02", n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, public_training_code=None, public_training_data=None, # assumed @@ -263,6 +266,7 @@ def _to_numpy(self, embedding_response) -> np.ndarray: revision="1", release_date="2023-11-02", n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, public_training_code=None, public_training_data=None, # assumed diff --git a/mteb/models/model_implementations/bge_models.py b/mteb/models/model_implementations/bge_models.py index e16fb537ff..8bcb2b1b8b 100644 --- 
a/mteb/models/model_implementations/bge_models.py +++ b/mteb/models/model_implementations/bge_models.py @@ -325,6 +325,7 @@ revision="5c38ec7c405ec4b44b94cc5a9bb96e735b38267a", release_date="2023-09-12", # initial commit of hf model. n_parameters=33_400_000, + n_embedding_parameters=11_720_448, memory_usage_mb=127, embed_dim=512, license="mit", @@ -357,6 +358,7 @@ revision="a5beb1e3e68b9ab74eb54cfd186867f64f240e1a", release_date="2023-09-11", # initial commit of hf model. n_parameters=109_000_000, + n_embedding_parameters=23_440_896, memory_usage_mb=390, embed_dim=768, license="mit", @@ -389,6 +391,7 @@ revision="d4aa6901d3a41ba39fb536a557fa166f842b0e09", release_date="2023-09-12", # initial commit of hf model. n_parameters=335_000_000, + n_embedding_parameters=31_254_528, memory_usage_mb=1242, embed_dim=1024, license="mit", @@ -421,6 +424,7 @@ revision="1d2363c5de6ce9ba9c890c8e23a4c72dce540ca8", release_date="2023-08-05", # initial commit of hf model. n_parameters=33_400_000, + n_embedding_parameters=10_817_536, memory_usage_mb=127, embed_dim=512, license="mit", @@ -448,6 +452,7 @@ revision="0e5f83d4895db7955e4cb9ed37ab73f7ded339b6", release_date="2023-08-05", # initial commit of hf model. n_parameters=109_000_000, + n_embedding_parameters=16_226_304, memory_usage_mb=390, embed_dim=768, license="mit", @@ -475,6 +480,7 @@ revision="b5d9f5c027e87b6f0b6fa4b614f8f9cdc45ce0e8", release_date="2023-08-02", # initial commit of hf model. n_parameters=335_000_000, + n_embedding_parameters=21_635_072, memory_usage_mb=1242, embed_dim=1024, license="mit", @@ -502,6 +508,7 @@ revision="4778d71a06863076696b03fd2777eb118712cad8", release_date="2023-08-05", # initial commit of hf model. n_parameters=33_400_000, + n_embedding_parameters=11_720_448, memory_usage_mb=127, embed_dim=512, license="mit", @@ -529,6 +536,7 @@ revision="b737bf5dcc6ee8bdc530531266b4804a5d77b5d8", release_date="2023-08-05", # initial commit of hf model. 
n_parameters=109_000_000, + n_embedding_parameters=23_440_896, memory_usage_mb=390, embed_dim=768, license="mit", @@ -562,6 +570,7 @@ revision="abe7d9d814b775ca171121fb03f394dc42974275", release_date="2023-08-05", # initial commit of hf model. n_parameters=335_000_000, + n_embedding_parameters=31_254_528, memory_usage_mb=1242, embed_dim=1024, license="mit", @@ -590,6 +599,7 @@ revision="7999e1d3359715c523056ef9478215996d62a620", release_date="2023-09-12", # initial commit of hf model. n_parameters=33_400_000, + n_embedding_parameters=10_817_536, memory_usage_mb=91, embed_dim=512, license="mit", @@ -616,6 +626,7 @@ revision="f03589ceff5aac7111bd60cfc7d497ca17ecac65", release_date="2023-09-11", # initial commit of hf model. n_parameters=109_000_000, + n_embedding_parameters=16_226_304, memory_usage_mb=416, embed_dim=768, license="mit", @@ -642,6 +653,7 @@ revision="79e7739b6ab944e86d6171e44d24c997fc1e0116", release_date="2023-09-12", # initial commit of hf model. n_parameters=335_000_000, + n_embedding_parameters=21_635_072, memory_usage_mb=1278, embed_dim=1024, license="mit", @@ -665,6 +677,7 @@ revision="5617a9f61b028005a4858fdac845db406aefb181", release_date="2024-06-28", n_parameters=568_000_000, + n_embedding_parameters=256_002_048, memory_usage_mb=2167, embed_dim=1024, license="mit", @@ -761,6 +774,7 @@ revision="992e13d8984fde2c31ef8a3cb2c038aeec513b8a", release_date="2024-07-25", # initial commit of hf model. n_parameters=int(9.24 * 1e9), + n_embedding_parameters=917_511_168, memory_usage_mb=35254, embed_dim=3584, # from old C-MTEB leaderboard license="https://ai.google.dev/gemma/terms", @@ -808,6 +822,7 @@ revision="971c7e1445cc86656ca0bd85ed770b8675a40bb5", release_date="2024-07-25", # initial commit of hf model. 
n_parameters=int(7.11 * 1e9), + n_embedding_parameters=131_084_288, memory_usage_mb=27125, embed_dim=4096, license="apache-2.0", @@ -842,6 +857,7 @@ revision="46f03bc86361cf88102b0b517b36c8259f2946b1", release_date="2024-01-30", # January 30, 2024 - BGE-M3 release date n_parameters=568_000_000, + n_embedding_parameters=256_002_048, memory_usage_mb=2167, embed_dim=1024, license="mit", @@ -871,6 +887,7 @@ languages=None, loader=sentence_transformers_loader, n_parameters=567754752, + n_embedding_parameters=256_002_048, memory_usage_mb=2166, max_tokens=8194.0, embed_dim=1024, diff --git a/mteb/models/model_implementations/bica_model.py b/mteb/models/model_implementations/bica_model.py index e44d9240d0..a05cd33fa5 100644 --- a/mteb/models/model_implementations/bica_model.py +++ b/mteb/models/model_implementations/bica_model.py @@ -9,6 +9,7 @@ revision="31237a836e5ae908c308a256573e5f0986498574", release_date="2025-11-14", n_parameters=110_000_000, + n_embedding_parameters=23_440_896, memory_usage_mb=418, embed_dim=768, license="mit", diff --git a/mteb/models/model_implementations/blip2_models.py b/mteb/models/model_implementations/blip2_models.py index d4e1a91e64..777f55a2d3 100644 --- a/mteb/models/model_implementations/blip2_models.py +++ b/mteb/models/model_implementations/blip2_models.py @@ -177,6 +177,7 @@ def encode( release_date="2024-03-22", modalities=["image", "text"], n_parameters=3_740_000_000, + n_embedding_parameters=None, memory_usage_mb=14285, max_tokens=None, embed_dim=768, @@ -201,6 +202,7 @@ def encode( release_date="2024-03-31", modalities=["image", "text"], n_parameters=7_750_000_000, + n_embedding_parameters=None, memory_usage_mb=29577, max_tokens=None, embed_dim=768, diff --git a/mteb/models/model_implementations/blip_models.py b/mteb/models/model_implementations/blip_models.py index b1214e12a7..2df5037f50 100644 --- a/mteb/models/model_implementations/blip_models.py +++ b/mteb/models/model_implementations/blip_models.py @@ -141,6 +141,7 @@ def 
encode( release_date="2023-12-07", modalities=["image", "text"], n_parameters=470_000_000, + n_embedding_parameters=23_442_432, memory_usage_mb=1792, max_tokens=512, embed_dim=768, @@ -169,6 +170,7 @@ def encode( release_date="2023-08-01", modalities=["image", "text"], n_parameters=247_000_000, + n_embedding_parameters=23_442_432, memory_usage_mb=942, max_tokens=512, embed_dim=768, @@ -198,6 +200,7 @@ def encode( release_date="2023-12-07", modalities=["image", "text"], n_parameters=247_000_000, + n_embedding_parameters=23_442_432, memory_usage_mb=1467, max_tokens=512, embed_dim=768, @@ -225,6 +228,7 @@ def encode( release_date="2023-01-22", modalities=["image", "text"], n_parameters=247_000_000, + n_embedding_parameters=23_442_432, memory_usage_mb=942, max_tokens=512, embed_dim=768, @@ -252,6 +256,7 @@ def encode( release_date="2023-08-01", modalities=["image", "text"], n_parameters=247_000_000, + n_embedding_parameters=23_442_432, memory_usage_mb=942, max_tokens=512, embed_dim=768, @@ -279,6 +284,7 @@ def encode( release_date="2023-08-01", modalities=["image", "text"], n_parameters=470_000_000, + n_embedding_parameters=23_442_432, memory_usage_mb=1793, max_tokens=512, embed_dim=768, @@ -307,6 +313,7 @@ def encode( release_date="2023-08-01", modalities=["image", "text"], n_parameters=247_000_000, + n_embedding_parameters=23_442_432, memory_usage_mb=942, max_tokens=512, embed_dim=768, @@ -335,6 +342,7 @@ def encode( release_date="2023-08-01", modalities=["image", "text"], n_parameters=470_000_000, + n_embedding_parameters=23_442_432, memory_usage_mb=1793, max_tokens=512, embed_dim=768, diff --git a/mteb/models/model_implementations/bm25.py b/mteb/models/model_implementations/bm25.py index dec2b6d698..1d5186e0e8 100644 --- a/mteb/models/model_implementations/bm25.py +++ b/mteb/models/model_implementations/bm25.py @@ -132,6 +132,7 @@ def encode(self, texts: list[str]): revision="0_1_10", release_date="2024-07-10", # release of version 0.1.10 n_parameters=None, + 
n_embedding_parameters=None, memory_usage_mb=None, embed_dim=None, license=None, diff --git a/mteb/models/model_implementations/bmretriever_models.py b/mteb/models/model_implementations/bmretriever_models.py index b1cd20f90c..de28b872c1 100644 --- a/mteb/models/model_implementations/bmretriever_models.py +++ b/mteb/models/model_implementations/bmretriever_models.py @@ -103,6 +103,7 @@ def __init__( release_date="2024-04-29", embed_dim=1024, n_parameters=353_822_720, + n_embedding_parameters=51_511_296, memory_usage_mb=1349, max_tokens=2048, license="mit", @@ -133,6 +134,7 @@ def __init__( release_date="2024-04-29", embed_dim=2048, n_parameters=908_759_040, + n_embedding_parameters=103_022_592, memory_usage_mb=3466, max_tokens=2048, license="mit", @@ -163,6 +165,7 @@ def __init__( release_date="2024-04-29", embed_dim=2048, n_parameters=2_506_172_416, + n_embedding_parameters=524_288_000, memory_usage_mb=9560, max_tokens=8192, license="mit", @@ -193,6 +196,7 @@ def __init__( release_date="2024-04-29", embed_dim=4096, n_parameters=7_110_660_096, + n_embedding_parameters=131_072_000, memory_usage_mb=27124, max_tokens=32768, license="mit", diff --git a/mteb/models/model_implementations/cadet_models.py b/mteb/models/model_implementations/cadet_models.py index 41ba75b79e..8abda25241 100644 --- a/mteb/models/model_implementations/cadet_models.py +++ b/mteb/models/model_implementations/cadet_models.py @@ -41,6 +41,7 @@ open_weights=True, release_date="2025-05-11", n_parameters=109_000_000, + n_embedding_parameters=23_440_896, memory_usage_mb=418, embed_dim=768, license="apache-2.0", diff --git a/mteb/models/model_implementations/cde_models.py b/mteb/models/model_implementations/cde_models.py index c0119397c6..5851548302 100644 --- a/mteb/models/model_implementations/cde_models.py +++ b/mteb/models/model_implementations/cde_models.py @@ -226,6 +226,7 @@ def _load_task_sample( revision="e151df18af0d7f1d1c37b074fee58406ececf19f", release_date="2024-09-24", n_parameters=int(281 
* 1e6), + n_embedding_parameters=None, memory_usage_mb=1072, # Though the second-stage model is only 140M max_tokens=512, embed_dim=768, @@ -255,6 +256,7 @@ def _load_task_sample( revision="4e1d021a6c3fd7ce8aa0a7204057eee5ae61d390", release_date="2025-01-13", n_parameters=int(306 * 1e6), + n_embedding_parameters=None, memory_usage_mb=1166, # Though the second-stage model is only 140M max_tokens=512, embed_dim=768, diff --git a/mteb/models/model_implementations/clip_models.py b/mteb/models/model_implementations/clip_models.py index 03f3af9a1b..5d6cc7cef7 100644 --- a/mteb/models/model_implementations/clip_models.py +++ b/mteb/models/model_implementations/clip_models.py @@ -128,6 +128,7 @@ def encode( release_date="2021-02-26", modalities=["image", "text"], n_parameters=428_000_000, + n_embedding_parameters=None, memory_usage_mb=1631, max_tokens=77, embed_dim=768, @@ -152,6 +153,7 @@ def encode( release_date="2021-02-26", modalities=["image", "text"], n_parameters=151_000_000, + n_embedding_parameters=None, memory_usage_mb=576, max_tokens=77, embed_dim=512, @@ -176,6 +178,7 @@ def encode( release_date="2021-02-26", modalities=["image", "text"], n_parameters=151_000_000, + n_embedding_parameters=None, memory_usage_mb=576, max_tokens=77, embed_dim=512, diff --git a/mteb/models/model_implementations/clips_models.py b/mteb/models/model_implementations/clips_models.py index 220bb202f8..28fdba2640 100644 --- a/mteb/models/model_implementations/clips_models.py +++ b/mteb/models/model_implementations/clips_models.py @@ -30,6 +30,7 @@ revision="0243664a6c5e12eef854b091eb283e51833c3e9f", release_date="2025-09-23", n_parameters=40_800_000, + n_embedding_parameters=19_200_768, memory_usage_mb=78, embed_dim=384, license="mit", @@ -57,6 +58,7 @@ revision="6bd5722f236da48b4b8bcb28cc1fc478f7089956", release_date="2025-09-23", n_parameters=124_400_000, + n_embedding_parameters=38_401_536, memory_usage_mb=237, embed_dim=768, license="mit", @@ -84,6 +86,7 @@ 
revision="683333f86ed9eb3699b5567f0fdabeb958d412b0", release_date="2025-09-23", n_parameters=355_000_000, + n_embedding_parameters=51_202_048, memory_usage_mb=1355, embed_dim=1024, license="mit", diff --git a/mteb/models/model_implementations/codefuse_models.py b/mteb/models/model_implementations/codefuse_models.py index b242cbc402..3b1ae34c61 100644 --- a/mteb/models/model_implementations/codefuse_models.py +++ b/mteb/models/model_implementations/codefuse_models.py @@ -236,6 +236,7 @@ def instruction_template( revision="36416618b83d4bd84a8ca30c2ee01ed518f9f2e7", release_date="2025-09-18", n_parameters=595_776_512, + n_embedding_parameters=None, memory_usage_mb=1137, embed_dim=1024, license="apache-2.0", @@ -266,6 +267,7 @@ def instruction_template( revision="fdce0e09655f42cea26f7f66f5a70cd4507ea45c", release_date="2025-09-18", n_parameters=1_720_574_976, + n_embedding_parameters=None, memory_usage_mb=3282, embed_dim=2560, license="apache-2.0", @@ -296,6 +298,7 @@ def instruction_template( revision="9fe95901ed2b6b59dd7673d6e93c9d76766a1e25", release_date="2025-09-18", n_parameters=4_021_774_336, + n_embedding_parameters=None, memory_usage_mb=7672, embed_dim=2560, license="apache-2.0", @@ -318,6 +321,7 @@ def instruction_template( release_date="2025-12-22", languages=c2llm_languages, n_parameters=497252096, + n_embedding_parameters=None, memory_usage_mb=948.0, max_tokens=32768, embed_dim=896, @@ -346,6 +350,7 @@ def instruction_template( release_date="2025-12-22", languages=c2llm_languages, n_parameters=7667028992, + n_embedding_parameters=None, memory_usage_mb=14624.0, max_tokens=32768, embed_dim=3584, diff --git a/mteb/models/model_implementations/codesage_models.py b/mteb/models/model_implementations/codesage_models.py index 83646e278f..3734091823 100644 --- a/mteb/models/model_implementations/codesage_models.py +++ b/mteb/models/model_implementations/codesage_models.py @@ -28,6 +28,7 @@ release_date="2024-02-03", modalities=["text"], n_parameters=1_300_000_000, 
+ n_embedding_parameters=100_667_392, memory_usage_mb=4959, max_tokens=2048, embed_dim=2048, @@ -55,6 +56,7 @@ release_date="2024-02-03", modalities=["text"], n_parameters=356_000_000, + n_embedding_parameters=50_333_696, memory_usage_mb=1358, max_tokens=2048, embed_dim=1024, @@ -82,6 +84,7 @@ release_date="2024-02-03", modalities=["text"], n_parameters=130_000_000, + n_embedding_parameters=50_333_696, memory_usage_mb=496, max_tokens=2048, embed_dim=1024, diff --git a/mteb/models/model_implementations/cohere_models.py b/mteb/models/model_implementations/cohere_models.py index 5822fb3c03..a208f2dda2 100644 --- a/mteb/models/model_implementations/cohere_models.py +++ b/mteb/models/model_implementations/cohere_models.py @@ -392,6 +392,7 @@ def encode( revision="1", release_date="2023-11-02", n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=None, embed_dim=512, @@ -418,6 +419,7 @@ def encode( revision="1", release_date="2023-11-02", n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=512, embed_dim=1024, @@ -443,6 +445,7 @@ def encode( reference="https://cohere.com/blog/introducing-embed-v3", release_date="2023-11-02", n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=512, embed_dim=384, @@ -468,6 +471,7 @@ def encode( revision="1", release_date="2023-11-02", n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=512, embed_dim=384, diff --git a/mteb/models/model_implementations/cohere_v.py b/mteb/models/model_implementations/cohere_v.py index b6c89bf754..dbebc3f8aa 100644 --- a/mteb/models/model_implementations/cohere_v.py +++ b/mteb/models/model_implementations/cohere_v.py @@ -391,6 +391,7 @@ def encode( revision="1", release_date="2024-10-24", n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=None, embed_dim=1024, @@ -415,6 +416,7 @@ def encode( revision="1", release_date="2024-10-24", n_parameters=None, + 
n_embedding_parameters=None, memory_usage_mb=None, max_tokens=None, embed_dim=1024, @@ -439,6 +441,7 @@ def encode( revision="1", release_date="2024-12-01", n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=128000, embed_dim=1536, @@ -463,6 +466,7 @@ def encode( revision="1", release_date="2024-12-01", n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=128000, embed_dim=1536, @@ -488,6 +492,7 @@ def encode( revision="1", release_date="2024-12-01", n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=128000, embed_dim=1536, diff --git a/mteb/models/model_implementations/colpali_models.py b/mteb/models/model_implementations/colpali_models.py index 329615eb9f..e2f03b767b 100644 --- a/mteb/models/model_implementations/colpali_models.py +++ b/mteb/models/model_implementations/colpali_models.py @@ -220,6 +220,7 @@ def __init__( release_date="2024-08-21", modalities=["image", "text"], n_parameters=2_920_000_000, + n_embedding_parameters=None, memory_usage_mb=4700, max_tokens=16384, embed_dim=128, @@ -247,6 +248,7 @@ def __init__( release_date="2024-08-26", modalities=["image", "text"], n_parameters=2_920_000_000, + n_embedding_parameters=None, memory_usage_mb=4700, max_tokens=16384, embed_dim=128, @@ -274,6 +276,7 @@ def __init__( release_date="2024-11-01", modalities=["image", "text"], n_parameters=2_920_000_000, + n_embedding_parameters=None, memory_usage_mb=4700, max_tokens=16384, embed_dim=128, diff --git a/mteb/models/model_implementations/colqwen_models.py b/mteb/models/model_implementations/colqwen_models.py index 6c0831adc7..511dc0846d 100644 --- a/mteb/models/model_implementations/colqwen_models.py +++ b/mteb/models/model_implementations/colqwen_models.py @@ -224,6 +224,7 @@ def similarity(self, a, b): release_date="2025-11-03", modalities=["image", "text"], n_parameters=2_210_000_000, + n_embedding_parameters=None, memory_usage_mb=7200, max_tokens=32768, embed_dim=128, 
@@ -251,6 +252,7 @@ def similarity(self, a, b): release_date="2025-01-31", modalities=["image", "text"], n_parameters=3_000_000_000, + n_embedding_parameters=None, memory_usage_mb=7200, max_tokens=128000, embed_dim=128, @@ -295,6 +297,7 @@ def similarity(self, a, b): release_date="2025-11-26", modalities=["image", "text"], n_parameters=8_000_000_000, + n_embedding_parameters=None, memory_usage_mb=16724, max_tokens=262144, embed_dim=320, @@ -319,6 +322,7 @@ def similarity(self, a, b): release_date="2025-11-26", modalities=["image", "text"], n_parameters=4_000_000_000, + n_embedding_parameters=None, memory_usage_mb=8466, max_tokens=262144, embed_dim=320, @@ -365,6 +369,7 @@ def similarity(self, a, b): release_date="2025-03-31", modalities=["image", "text"], n_parameters=3_000_000_000, + n_embedding_parameters=None, memory_usage_mb=7200, max_tokens=128000, embed_dim=128, @@ -430,6 +435,7 @@ def similarity(self, a, b): release_date="2025-11-04", modalities=["image", "text"], n_parameters=3_000_000_000, + n_embedding_parameters=None, memory_usage_mb=7200, max_tokens=128000, embed_dim=128, @@ -456,6 +462,7 @@ def similarity(self, a, b): release_date="2025-11-04", modalities=["image", "text"], n_parameters=7_000_000_000, + n_embedding_parameters=None, memory_usage_mb=14400, max_tokens=128000, embed_dim=128, diff --git a/mteb/models/model_implementations/colsmol_models.py b/mteb/models/model_implementations/colsmol_models.py index c55ecf180d..0795db9ed0 100644 --- a/mteb/models/model_implementations/colsmol_models.py +++ b/mteb/models/model_implementations/colsmol_models.py @@ -60,6 +60,7 @@ def __init__( release_date="2025-01-22", modalities=["image", "text"], n_parameters=256_000_000, + n_embedding_parameters=None, memory_usage_mb=800, max_tokens=8192, embed_dim=128, @@ -87,6 +88,7 @@ def __init__( release_date="2025-01-22", modalities=["image", "text"], n_parameters=500_000_000, + n_embedding_parameters=None, memory_usage_mb=1200, max_tokens=8192, embed_dim=128, diff 
--git a/mteb/models/model_implementations/conan_models.py b/mteb/models/model_implementations/conan_models.py index fc70397ea6..ad2df9e62b 100644 --- a/mteb/models/model_implementations/conan_models.py +++ b/mteb/models/model_implementations/conan_models.py @@ -211,6 +211,7 @@ def encode( embed_dim=3584, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license="apache-2.0", reference="https://huggingface.co/TencentBAC/Conan-embedding-v2", diff --git a/mteb/models/model_implementations/dino_models.py b/mteb/models/model_implementations/dino_models.py index 00c9092fee..a6be50e157 100644 --- a/mteb/models/model_implementations/dino_models.py +++ b/mteb/models/model_implementations/dino_models.py @@ -117,6 +117,7 @@ def encode( release_date="2023-07-18", modalities=["image"], n_parameters=22_100_000, + n_embedding_parameters=None, memory_usage_mb=84, max_tokens=None, embed_dim=384, @@ -148,6 +149,7 @@ def encode( release_date="2023-07-18", modalities=["image"], n_parameters=86_600_000, + n_embedding_parameters=None, memory_usage_mb=330, max_tokens=None, embed_dim=768, @@ -179,6 +181,7 @@ def encode( release_date="2023-07-18", modalities=["image"], n_parameters=304_000_000, + n_embedding_parameters=None, memory_usage_mb=1161, max_tokens=None, embed_dim=1024, @@ -210,6 +213,7 @@ def encode( release_date="2023-07-18", modalities=["image"], n_parameters=1_140_000_000, + n_embedding_parameters=None, memory_usage_mb=4335, max_tokens=None, embed_dim=1536, @@ -245,6 +249,7 @@ def encode( release_date="2025-04-24", modalities=["image"], n_parameters=304_000_000, + n_embedding_parameters=None, memory_usage_mb=1158, max_tokens=None, embed_dim=1024, @@ -276,6 +281,7 @@ def encode( release_date="2025-04-24", modalities=["image"], n_parameters=1_130_000_000, + n_embedding_parameters=None, memory_usage_mb=4329, max_tokens=None, embed_dim=1536, @@ -307,6 +313,7 @@ def encode( release_date="2025-04-24", modalities=["image"], 
n_parameters=2_080_000_000, + n_embedding_parameters=None, memory_usage_mb=7951, max_tokens=None, embed_dim=2688, @@ -338,6 +345,7 @@ def encode( release_date="2025-04-24", modalities=["image"], n_parameters=3_000_000_000, + n_embedding_parameters=None, memory_usage_mb=11247, max_tokens=None, embed_dim=3072, @@ -369,6 +377,7 @@ def encode( release_date="2025-04-24", modalities=["image"], n_parameters=5_000_000_000, + n_embedding_parameters=None, memory_usage_mb=18838, max_tokens=None, embed_dim=3584, @@ -400,6 +409,7 @@ def encode( release_date="2025-04-24", modalities=["image"], n_parameters=7_000_000_000, + n_embedding_parameters=None, memory_usage_mb=24605, max_tokens=None, embed_dim=4096, @@ -431,6 +441,7 @@ def encode( release_date="2025-04-24", modalities=["image"], n_parameters=7_000_000_000, + n_embedding_parameters=None, memory_usage_mb=24613, max_tokens=None, embed_dim=4096, @@ -462,6 +473,7 @@ def encode( release_date="2025-04-24", modalities=["image"], n_parameters=7_000_000_000, + n_embedding_parameters=None, memory_usage_mb=24623, max_tokens=None, embed_dim=4096, @@ -494,6 +506,7 @@ def encode( release_date="2025-04-24", modalities=["image"], n_parameters=2_000_000_000, + n_embedding_parameters=None, memory_usage_mb=7951, max_tokens=None, embed_dim=2688, @@ -525,6 +538,7 @@ def encode( release_date="2025-04-24", modalities=["image"], n_parameters=2_000_000_000, + n_embedding_parameters=None, memory_usage_mb=7951, max_tokens=None, embed_dim=2688, @@ -556,6 +570,7 @@ def encode( release_date="2025-04-24", modalities=["image"], n_parameters=3_000_000_000, + n_embedding_parameters=None, memory_usage_mb=11247, max_tokens=None, embed_dim=3072, @@ -587,6 +602,7 @@ def encode( release_date="2025-04-24", modalities=["image"], n_parameters=3_000_000_000, + n_embedding_parameters=None, memory_usage_mb=11247, max_tokens=None, embed_dim=3072, @@ -618,6 +634,7 @@ def encode( release_date="2025-04-24", modalities=["image"], n_parameters=304_000_000, + 
n_embedding_parameters=None, memory_usage_mb=1161, max_tokens=None, embed_dim=1024, @@ -649,6 +666,7 @@ def encode( release_date="2025-04-24", modalities=["image"], n_parameters=700_000_000, + n_embedding_parameters=None, memory_usage_mb=2412, max_tokens=None, embed_dim=1280, @@ -680,6 +698,7 @@ def encode( release_date="2025-04-24", modalities=["image"], n_parameters=1_000_000_000, + n_embedding_parameters=None, memory_usage_mb=4337, max_tokens=None, embed_dim=1536, diff --git a/mteb/models/model_implementations/e5_instruct.py b/mteb/models/model_implementations/e5_instruct.py index 1f5c312048..0f817b40a4 100644 --- a/mteb/models/model_implementations/e5_instruct.py +++ b/mteb/models/model_implementations/e5_instruct.py @@ -57,6 +57,7 @@ use_instructions=True, reference="https://huggingface.co/intfloat/multilingual-e5-large-instruct", n_parameters=560_000_000, + n_embedding_parameters=256_002_048, memory_usage_mb=1068, embed_dim=1024, license="mit", @@ -102,6 +103,7 @@ use_instructions=True, reference="https://huggingface.co/intfloat/e5-mistral-7b-instruct", n_parameters=7_111_000_000, + n_embedding_parameters=131_072_000, memory_usage_mb=13563, embed_dim=4096, license="mit", @@ -145,6 +147,7 @@ release_date="2024-08-30", languages=["eng-Latn"], n_parameters=7110660096, + n_embedding_parameters=None, memory_usage_mb=13563, max_tokens=32768.0, embed_dim=4096, @@ -228,6 +231,7 @@ release_date="2024-06-28", languages=["eng-Latn"], n_parameters=7241732096, + n_embedding_parameters=131_072_000, memory_usage_mb=27625, max_tokens=32768.0, embed_dim=4096, diff --git a/mteb/models/model_implementations/e5_models.py b/mteb/models/model_implementations/e5_models.py index 042f3fd10f..228f04ea53 100644 --- a/mteb/models/model_implementations/e5_models.py +++ b/mteb/models/model_implementations/e5_models.py @@ -76,6 +76,7 @@ revision="fd1525a9fd15316a2d503bf26ab031a61d056e98", release_date=E5_PAPER_RELEASE_DATE, n_parameters=118_000_000, + n_embedding_parameters=96_014_208, 
memory_usage_mb=449, embed_dim=384, license="mit", @@ -103,6 +104,7 @@ revision="d13f1b27baf31030b7fd040960d60d909913633f", release_date=E5_PAPER_RELEASE_DATE, n_parameters=278_000_000, + n_embedding_parameters=192_001_536, memory_usage_mb=1061, embed_dim=768, license="mit", @@ -130,6 +132,7 @@ revision="ab10c1a7f42e74530fe7ae5be82e6d4f11a719eb", release_date=E5_PAPER_RELEASE_DATE, n_parameters=560_000_000, + n_embedding_parameters=256_002_048, memory_usage_mb=2136, embed_dim=1024, license="mit", @@ -157,6 +160,7 @@ revision="dca8b1a9dae0d4575df2bf423a5edb485a431236", release_date=E5_PAPER_RELEASE_DATE, n_parameters=33_000_000, + n_embedding_parameters=11_720_448, memory_usage_mb=127, embed_dim=384, license="mit", @@ -184,6 +188,7 @@ revision="e272f3049e853b47cb5ca3952268c6662abda68f", release_date=E5_PAPER_RELEASE_DATE, n_parameters=33_000_000, + n_embedding_parameters=11_720_448, memory_usage_mb=127, embed_dim=384, license="mit", @@ -211,6 +216,7 @@ revision="1c644c92ad3ba1efdad3f1451a637716616a20e8", release_date=E5_PAPER_RELEASE_DATE, n_parameters=109_000_000, + n_embedding_parameters=23_440_896, memory_usage_mb=418, embed_dim=768, license="mit", @@ -239,6 +245,7 @@ revision="b322e09026e4ea05f42beadf4d661fb4e101d311", release_date=E5_PAPER_RELEASE_DATE, n_parameters=335_000_000, + n_embedding_parameters=31_254_528, memory_usage_mb=1278, embed_dim=1024, license="mit", @@ -267,6 +274,7 @@ revision="4dc6d853a804b9c8886ede6dda8a073b7dc08a81", release_date="2022-12-26", n_parameters=335_000_000, + n_embedding_parameters=31_254_528, memory_usage_mb=1278, embed_dim=1024, license="apache-2.0", @@ -295,6 +303,7 @@ revision="b533fe4636f4a2507c08ddab40644d20b0006d6a", release_date="2022-12-26", n_parameters=109_000_000, + n_embedding_parameters=23_440_896, memory_usage_mb=418, embed_dim=768, license="apache-2.0", diff --git a/mteb/models/model_implementations/e5_v.py b/mteb/models/model_implementations/e5_v.py index a09e9a5ba1..baf3174433 100644 --- 
a/mteb/models/model_implementations/e5_v.py +++ b/mteb/models/model_implementations/e5_v.py @@ -171,6 +171,7 @@ def encode( release_date="2024-07-17", modalities=["image", "text"], n_parameters=8_360_000_000, + n_embedding_parameters=None, memory_usage_mb=15936, max_tokens=8192, embed_dim=4096, diff --git a/mteb/models/model_implementations/eagerworks_models.py b/mteb/models/model_implementations/eagerworks_models.py index ae6470d471..0153e8c742 100644 --- a/mteb/models/model_implementations/eagerworks_models.py +++ b/mteb/models/model_implementations/eagerworks_models.py @@ -153,6 +153,7 @@ def encode( release_date="2025-11-20", modalities=["image", "text"], n_parameters=4_000_000_000, + n_embedding_parameters=None, memory_usage_mb=16929, max_tokens=262144, embed_dim=2560, diff --git a/mteb/models/model_implementations/emillykkejensen_models.py b/mteb/models/model_implementations/emillykkejensen_models.py index f4619c91a2..a91921aa95 100644 --- a/mteb/models/model_implementations/emillykkejensen_models.py +++ b/mteb/models/model_implementations/emillykkejensen_models.py @@ -10,6 +10,7 @@ revision="9f3307b9f601db564a9190cb475324d128dcfe86", release_date="2025-10-17", n_parameters=307_581_696, + n_embedding_parameters=None, embed_dim=768, max_tokens=2048, license="apache-2.0", @@ -43,6 +44,7 @@ revision="cf1e7ba36ebd3d605549d8f02930a18e17b54513", release_date="2025-10-17", n_parameters=595776512, + n_embedding_parameters=None, memory_usage_mb=2272, embed_dim=1024, max_tokens=32768, @@ -67,6 +69,7 @@ revision="82d74c7a5d8e1ddf31b132865df2d16b2b0294ee", release_date="2025-10-17", n_parameters=306939648, + n_embedding_parameters=None, memory_usage_mb=1171, embed_dim=768, max_tokens=8192, diff --git a/mteb/models/model_implementations/en_code_retriever.py b/mteb/models/model_implementations/en_code_retriever.py index 3f682f19a7..8c654ef5ed 100644 --- a/mteb/models/model_implementations/en_code_retriever.py +++ b/mteb/models/model_implementations/en_code_retriever.py @@ 
-18,6 +18,7 @@ revision="be653fab7d27a7348a0c2c3d16b9f92a7f10cb0c", release_date="2025-07-10", n_parameters=149_000_000, + n_embedding_parameters=None, memory_usage_mb=568, embed_dim=768, license="mit", diff --git a/mteb/models/model_implementations/euler_models.py b/mteb/models/model_implementations/euler_models.py index ed1da1c863..cb21d144f5 100644 --- a/mteb/models/model_implementations/euler_models.py +++ b/mteb/models/model_implementations/euler_models.py @@ -9,6 +9,7 @@ release_date="2025-11-06", languages=["eng-Latn"], n_parameters=8000000000, + n_embedding_parameters=None, memory_usage_mb=15618, max_tokens=1536, embed_dim=4096, diff --git a/mteb/models/model_implementations/evaclip_models.py b/mteb/models/model_implementations/evaclip_models.py index 0cc04c0951..4f7e571391 100644 --- a/mteb/models/model_implementations/evaclip_models.py +++ b/mteb/models/model_implementations/evaclip_models.py @@ -149,6 +149,7 @@ def encode( release_date="2023-04-26", modalities=["image", "text"], n_parameters=149_000_000, + n_embedding_parameters=None, memory_usage_mb=568, max_tokens=77, embed_dim=512, @@ -173,6 +174,7 @@ def encode( release_date="2023-04-26", modalities=["image", "text"], n_parameters=428_000_000, + n_embedding_parameters=None, memory_usage_mb=1633, max_tokens=77, embed_dim=768, @@ -197,6 +199,7 @@ def encode( release_date="2023-04-26", modalities=["image", "text"], n_parameters=4_700_000_000, + n_embedding_parameters=None, memory_usage_mb=17929, max_tokens=77, embed_dim=1024, @@ -222,6 +225,7 @@ def encode( release_date="2023-04-26", modalities=["image", "text"], n_parameters=5_000_000_000, + n_embedding_parameters=None, memory_usage_mb=19073, max_tokens=77, embed_dim=1024, diff --git a/mteb/models/model_implementations/fa_models.py b/mteb/models/model_implementations/fa_models.py index 0bce68d8b2..b72c28dfcd 100644 --- a/mteb/models/model_implementations/fa_models.py +++ b/mteb/models/model_implementations/fa_models.py @@ -12,6 +12,7 @@ 
revision="d73a0e2c7492c33bd5819bcdb23eba207404dd19", release_date="2021-05-19", n_parameters=162_841_344, + n_embedding_parameters=76_800_000, memory_usage_mb=621, embed_dim=768, license="not specified", @@ -48,6 +49,7 @@ revision="b9506ddc579ac8c398ae6dae680401ae0a1a5b23", release_date="2021-06-28", n_parameters=118_297_344, + n_embedding_parameters=32_256_000, memory_usage_mb=451, embed_dim=768, license="not specified", @@ -74,6 +76,7 @@ revision="36f912ac44e22250aee16ea533a4ff8cd848c1a1", release_date="2021-06-28", n_parameters=118_298_112, + n_embedding_parameters=32_256_000, memory_usage_mb=451, embed_dim=768, license="not specified", @@ -99,6 +102,7 @@ revision="72bd0a3557622f0ae08a092f4643609e0b950cdd", release_date="2024-12-10", n_parameters=162_841_344, + n_embedding_parameters=76_800_000, memory_usage_mb=621, embed_dim=768, license="apache-2.0", @@ -123,6 +127,7 @@ revision="fa5ca89df5670700d9325b8872ac65c17cb24582", release_date="2024-12-08", n_parameters=122_905_344, + n_embedding_parameters=36_864_000, memory_usage_mb=469, embed_dim=768, license="apache-2.0", @@ -150,6 +155,7 @@ revision="5d07f0c543aca654373b931ae07cd197769110fd", release_date="2024-12-07", n_parameters=353_039_360, + n_embedding_parameters=49_152_000, memory_usage_mb=1347, embed_dim=1024, license="apache-2.0", @@ -181,6 +187,7 @@ revision="a0e3973064c97768e121b9b95f21adc94e0ca3fb", release_date="2024-10-07", n_parameters=124_441_344, + n_embedding_parameters=38_400_000, memory_usage_mb=475, embed_dim=768, license="not specified", @@ -229,6 +236,7 @@ revision="8bbed87e36669387f71437c061430ba56d1b496f", release_date="2025-05-01", n_parameters=122_905_344, + n_embedding_parameters=36_864_000, memory_usage_mb=496, embed_dim=768, license="not specified", @@ -260,6 +268,7 @@ revision="b59682efa961122cc0e4408296d5852870c82eae", release_date="2025-05-01", n_parameters=353_039_360, + n_embedding_parameters=49_152_000, memory_usage_mb=1347, embed_dim=1024, license="not specified", diff --git 
a/mteb/models/model_implementations/facebookai.py b/mteb/models/model_implementations/facebookai.py index 416c592844..82b7588e24 100644 --- a/mteb/models/model_implementations/facebookai.py +++ b/mteb/models/model_implementations/facebookai.py @@ -113,6 +113,7 @@ revision="e73636d4f797dec63c3081bb6ed5c7b0bb3f2089", release_date="2019-11-05", # arxiv paper release n_parameters=278043648, + n_embedding_parameters=192_001_536, memory_usage_mb=1064, embed_dim=768, license="mit", @@ -163,6 +164,7 @@ revision="c23d21b0620b635a76227c604d44e43a9f0ee389", release_date="2019-11-05", # arxiv paper release n_parameters=559890432, + n_embedding_parameters=256_002_048, memory_usage_mb=2141, embed_dim=1024, license="mit", diff --git a/mteb/models/model_implementations/geogpt_models.py b/mteb/models/model_implementations/geogpt_models.py index e9ee5c508e..716d24b21a 100644 --- a/mteb/models/model_implementations/geogpt_models.py +++ b/mteb/models/model_implementations/geogpt_models.py @@ -20,6 +20,7 @@ ), release_date="2025-04-22", n_parameters=7241732096, + n_embedding_parameters=131_072_000, memory_usage_mb=27625, embed_dim=4096, license="apache-2.0", diff --git a/mteb/models/model_implementations/gme_v_models.py b/mteb/models/model_implementations/gme_v_models.py index d54c005dc3..571789c6f4 100644 --- a/mteb/models/model_implementations/gme_v_models.py +++ b/mteb/models/model_implementations/gme_v_models.py @@ -356,6 +356,7 @@ def fetch_image(image: Image.Image, size_factor: int = IMAGE_FACTOR) -> Image.Im release_date="2024-12-24", modalities=["image", "text"], n_parameters=2_210_000_000, + n_embedding_parameters=233_373_696, memory_usage_mb=8427, embed_dim=1536, license="apache-2.0", @@ -380,6 +381,7 @@ def fetch_image(image: Image.Image, size_factor: int = IMAGE_FACTOR) -> Image.Im release_date="2024-12-24", modalities=["image", "text"], n_parameters=8_290_000_000, + n_embedding_parameters=544_997_376, memory_usage_mb=31629, embed_dim=3584, license="apache-2.0", diff --git 
a/mteb/models/model_implementations/google_models.py b/mteb/models/model_implementations/google_models.py index ee98344ab1..4ecfba39c7 100644 --- a/mteb/models/model_implementations/google_models.py +++ b/mteb/models/model_implementations/google_models.py @@ -162,6 +162,7 @@ def encode( revision="1", # revision is intended for implementation release_date="2024-05-14", n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=2048, embed_dim=768, @@ -187,6 +188,7 @@ def encode( revision="1", # revision is intended for implementation release_date="2024-11-18", n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=2048, embed_dim=768, @@ -212,6 +214,7 @@ def encode( revision="1", release_date="2024-05-14", n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=2048, embed_dim=768, @@ -237,6 +240,7 @@ def encode( revision="1", release_date="2025-03-07", n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=2048, embed_dim=3072, @@ -272,6 +276,7 @@ def gemma_embedding_loader(model_name: str, revision: str, **kwargs): revision="64614b0b8b64f0c6c1e52b07e4e9a4e8fe4d2da2", release_date="2025-09-04", n_parameters=307_581_696, + n_embedding_parameters=201_326_592, embed_dim=768, max_tokens=2048, license="gemma", diff --git a/mteb/models/model_implementations/granite_vision_embedding_models.py b/mteb/models/model_implementations/granite_vision_embedding_models.py index facb0ac3d7..4e9672be1c 100644 --- a/mteb/models/model_implementations/granite_vision_embedding_models.py +++ b/mteb/models/model_implementations/granite_vision_embedding_models.py @@ -173,6 +173,7 @@ def similarity(self, a, b): release_date="2025-06-11", modalities=["image", "text"], n_parameters=2_980_000_000, + n_embedding_parameters=None, memory_usage_mb=11351, max_tokens=128000, embed_dim=128, diff --git a/mteb/models/model_implementations/gritlm_models.py 
b/mteb/models/model_implementations/gritlm_models.py index 68af6440fb..7fcf394071 100644 --- a/mteb/models/model_implementations/gritlm_models.py +++ b/mteb/models/model_implementations/gritlm_models.py @@ -44,6 +44,7 @@ def gritlm_instruction(instruction: str = "", prompt_type=None) -> str: revision="13f00a0e36500c80ce12870ea513846a066004af", release_date="2024-02-15", n_parameters=7_240_000_000, + n_embedding_parameters=131_072_000, memory_usage_mb=13813, embed_dim=4096, license="apache-2.0", @@ -73,6 +74,7 @@ def gritlm_instruction(instruction: str = "", prompt_type=None) -> str: revision="7f089b13e3345510281733ca1e6ff871b5b4bc76", release_date="2024-02-15", n_parameters=57_920_000_000, + n_embedding_parameters=None, memory_usage_mb=89079, embed_dim=32768, license="apache-2.0", diff --git a/mteb/models/model_implementations/gte_models.py b/mteb/models/model_implementations/gte_models.py index 104e221bda..9393a6fa49 100644 --- a/mteb/models/model_implementations/gte_models.py +++ b/mteb/models/model_implementations/gte_models.py @@ -48,6 +48,7 @@ def instruction_template( revision="e26182b2122f4435e8b3ebecbf363990f409b45b", release_date="2024-06-15", # initial commit of hf model. n_parameters=7_613_000_000, + n_embedding_parameters=543_499_264, memory_usage_mb=29040, embed_dim=3584, license="apache-2.0", @@ -80,6 +81,7 @@ def instruction_template( revision="07d27e5226328010336563bc1b564a5e3436a298", release_date="2024-04-20", # initial commit of hf model. n_parameters=7_720_000_000, + n_embedding_parameters=None, memory_usage_mb=29449, embed_dim=4096, license="apache-2.0", @@ -117,6 +119,7 @@ def instruction_template( revision="c6c1b92f4a3e1b92b326ad29dd3c8433457df8dd", release_date="2024-07-29", # initial commit of hf model. 
n_parameters=1_780_000_000, + n_embedding_parameters=232_928_256, memory_usage_mb=6776, embed_dim=8960, license="apache-2.0", @@ -145,6 +148,7 @@ def instruction_template( revision="af7bd46fbb00b3a6963c8dd7f1786ddfbfbe973a", release_date="2023-11-08", # initial commit of hf model. n_parameters=int(30.3 * 1e6), + n_embedding_parameters=10_817_536, memory_usage_mb=58, embed_dim=1024, license="mit", @@ -173,6 +177,7 @@ def instruction_template( revision="71ab7947d6fac5b64aa299e6e40e6c2b2e85976c", release_date="2023-11-08", # initial commit of hf model. n_parameters=int(102 * 1e6), + n_embedding_parameters=16_226_304, memory_usage_mb=195, embed_dim=1024, license="mit", @@ -201,6 +206,7 @@ def instruction_template( revision="64c364e579de308104a9b2c170ca009502f4f545", release_date="2023-11-08", # initial commit of hf model. n_parameters=int(326 * 1e6), + n_embedding_parameters=21_635_072, memory_usage_mb=621, embed_dim=1024, license="mit", @@ -330,6 +336,7 @@ def instruction_template( revision="ca1791e0bcc104f6db161f27de1340241b13c5a4", release_date="2024-07-20", # initial commit of hf model. n_parameters=int(305 * 1e6), + n_embedding_parameters=192_036_864, memory_usage_mb=582, embed_dim=768, license="apache-2.0", @@ -359,6 +366,7 @@ def instruction_template( revision="7ca8b4ca700621b67618669f5378fe5f5820b8e4", release_date="2025-01-21", # initial commit of hf model. 
n_parameters=int(149 * 1e6), + n_embedding_parameters=None, memory_usage_mb=284, embed_dim=768, license="apache-2.0", @@ -402,6 +410,7 @@ def instruction_template( revision="a829fd0e060bb84554da0dfd354d0de0f7712b7f", # can be any release_date="2024-06-20", # initial commit of hf model n_parameters=137_000_000, + n_embedding_parameters=23_445_504, memory_usage_mb=None, embed_dim=768, license="apache-2.0", diff --git a/mteb/models/model_implementations/hinvec_models.py b/mteb/models/model_implementations/hinvec_models.py index f891495a01..15cbc1ac77 100644 --- a/mteb/models/model_implementations/hinvec_models.py +++ b/mteb/models/model_implementations/hinvec_models.py @@ -47,6 +47,7 @@ def instruction_template( revision="d4fc678720cc1b8c5d18599ce2d9a4d6090c8b6b", release_date="2025-06-19", n_parameters=939_591_680, + n_embedding_parameters=None, memory_usage_mb=3715, embed_dim=2048, license="cc-by-nc-4.0", diff --git a/mteb/models/model_implementations/human.py b/mteb/models/model_implementations/human.py index 8848acfde7..90227d5131 100644 --- a/mteb/models/model_implementations/human.py +++ b/mteb/models/model_implementations/human.py @@ -9,6 +9,7 @@ revision="2025_09_25", release_date=None, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, embed_dim=None, license=None, diff --git a/mteb/models/model_implementations/ibm_granite_models.py b/mteb/models/model_implementations/ibm_granite_models.py index 5ae7be2c0f..51f82fb7cc 100644 --- a/mteb/models/model_implementations/ibm_granite_models.py +++ b/mteb/models/model_implementations/ibm_granite_models.py @@ -100,6 +100,7 @@ revision="47db56afe692f731540413c67dd818ff492277e7", release_date="2024-12-18", n_parameters=107_000_000, + n_embedding_parameters=96_000_768, memory_usage_mb=204, embed_dim=384, license="apache-2.0", @@ -131,6 +132,7 @@ revision="84e3546b88b0cb69f8078608a1df558020bcbf1f", release_date="2024-12-18", n_parameters=278_000_000, + n_embedding_parameters=192_001_536, 
memory_usage_mb=530, embed_dim=768, license="apache-2.0", @@ -162,6 +164,7 @@ revision="eddbb57470f896b5f8e2bfcb823d8f0e2d2024a5", release_date="2024-12-18", n_parameters=30_000_000, + n_embedding_parameters=19_301_760, memory_usage_mb=58, embed_dim=384, license="apache-2.0", @@ -193,6 +196,7 @@ revision="e48d3a5b47eaa18e3fe07d4676e187fd80f32730", release_date="2024-12-18", n_parameters=125_000_000, + n_embedding_parameters=38_603_520, memory_usage_mb=238, embed_dim=768, license="apache-2.0", @@ -225,6 +229,7 @@ revision="6e7b8ce0e76270394ac4669ba4bbd7133b60b7f9", release_date="2025-08-15", n_parameters=149_000_000, + n_embedding_parameters=None, memory_usage_mb=284, embed_dim=768, license="apache-2.0", @@ -250,6 +255,7 @@ revision="54a8d2616a0844355a5164432d3f6dafb37b17a3", release_date="2025-08-15", n_parameters=47_000_000, + n_embedding_parameters=None, memory_usage_mb=91, embed_dim=384, license="apache-2.0", diff --git a/mteb/models/model_implementations/inf_models.py b/mteb/models/model_implementations/inf_models.py index 48bbfe09aa..0124ae056a 100644 --- a/mteb/models/model_implementations/inf_models.py +++ b/mteb/models/model_implementations/inf_models.py @@ -56,6 +56,7 @@ revision="cb70ca7c31dfa866b2eff2dad229c144d8ddfd91", release_date="2024-12-24", # initial commit of hf model. n_parameters=7_069_121_024, + n_embedding_parameters=None, memory_usage_mb=13483, embed_dim=3584, license="apache-2.0", @@ -83,6 +84,7 @@ revision="c9c05c2dd50707a486966ba81703021ae2094a06", release_date="2025-02-08", # initial commit of hf model. 
n_parameters=1_543_268_864, + n_embedding_parameters=232_928_256, memory_usage_mb=2944, embed_dim=1536, license="apache-2.0", diff --git a/mteb/models/model_implementations/jasper_models.py b/mteb/models/model_implementations/jasper_models.py index 03dd820d29..885259daa8 100644 --- a/mteb/models/model_implementations/jasper_models.py +++ b/mteb/models/model_implementations/jasper_models.py @@ -299,6 +299,7 @@ def encode( revision="d6330ce98f8a0d741e781df845904c9484f00efa", release_date="2024-12-11", # first commit n_parameters=1_999_000_000, + n_embedding_parameters=232_932_864, memory_usage_mb=3802, max_tokens=131072, embed_dim=8960, @@ -346,6 +347,7 @@ def encode( revision="06a100f753a5a96d9e583b3af79c6fcdfacc4719", release_date="2025-11-14", n_parameters=595776512, + n_embedding_parameters=None, memory_usage_mb=2272, embed_dim=2048, license="mit", diff --git a/mteb/models/model_implementations/jina_clip.py b/mteb/models/model_implementations/jina_clip.py index 4c86ebddbc..4c521d7d49 100644 --- a/mteb/models/model_implementations/jina_clip.py +++ b/mteb/models/model_implementations/jina_clip.py @@ -144,6 +144,7 @@ def encode( release_date="2024-05-30", modalities=["image", "text"], n_parameters=223_000_000, + n_embedding_parameters=None, memory_usage_mb=849, max_tokens=8192, embed_dim=768, diff --git a/mteb/models/model_implementations/jina_models.py b/mteb/models/model_implementations/jina_models.py index b016d1691d..a7abeb55e1 100644 --- a/mteb/models/model_implementations/jina_models.py +++ b/mteb/models/model_implementations/jina_models.py @@ -733,6 +733,7 @@ def get_programming_task_override( release_date="2025-09-18", # official release date modalities=["text"], n_parameters=int(0.6 * 1e9), + n_embedding_parameters=None, memory_usage_mb=1138, max_tokens=131072, embed_dim=None, @@ -776,6 +777,7 @@ def get_programming_task_override( release_date="2025-06-24", # official release date modalities=["image", "text"], n_parameters=int(3.8 * 1e9), + 
n_embedding_parameters=None, memory_usage_mb=7500, max_tokens=32768, embed_dim=2048, @@ -824,6 +826,7 @@ def get_programming_task_override( revision="215a6e121fa0183376388ac6b1ae230326bfeaed", release_date="2024-09-18", # official release date n_parameters=int(572 * 1e6), + n_embedding_parameters=None, memory_usage_mb=1092, max_tokens=8194, embed_dim=1024, @@ -884,6 +887,7 @@ def get_programming_task_override( revision="6e85f575bc273f1fd840a658067d0157933c83f0", release_date="2023-09-27", n_parameters=137_000_000, + n_embedding_parameters=23_445_504, memory_usage_mb=262, embed_dim=768, license="apache-2.0", @@ -948,6 +952,7 @@ def get_programming_task_override( revision="44e7d1d6caec8c883c2d4b207588504d519788d0", release_date="2023-09-27", n_parameters=32_700_000, + n_embedding_parameters=15_630_336, memory_usage_mb=62, embed_dim=512, license="apache-2.0", @@ -1009,6 +1014,7 @@ def get_programming_task_override( revision="32aa658e5ceb90793454d22a57d8e3a14e699516", release_date="2023-07-07", n_parameters=110_000_000, + n_embedding_parameters=24_674_304, memory_usage_mb=420, embed_dim=768, license="apache-2.0", @@ -1066,6 +1072,7 @@ def get_programming_task_override( revision="5ac6cd473e2324c6d5f9e558a6a9f65abb57143e", release_date="2023-07-07", n_parameters=35_000_000, + n_embedding_parameters=16_449_536, memory_usage_mb=134, embed_dim=512, license="apache-2.0", diff --git a/mteb/models/model_implementations/kalm_models.py b/mteb/models/model_implementations/kalm_models.py index 1613d53efc..053217ceda 100644 --- a/mteb/models/model_implementations/kalm_models.py +++ b/mteb/models/model_implementations/kalm_models.py @@ -780,6 +780,7 @@ def encode( release_date="2024-10-23", languages=["eng-Latn", "zho-Hans"], n_parameters=494032768, + n_embedding_parameters=136_134_656, memory_usage_mb=1885, max_tokens=512, embed_dim=896, @@ -805,6 +806,7 @@ def encode( release_date="2024-08-27", languages=["eng-Latn", "zho-Hans"], n_parameters=494032768, + 
n_embedding_parameters=136_134_656, memory_usage_mb=1885, max_tokens=512, embed_dim=896, @@ -836,6 +838,7 @@ def encode( release_date="2024-12-26", languages=["eng-Latn", "zho-Hans"], n_parameters=494032768, + n_embedding_parameters=136_134_656, memory_usage_mb=1885, max_tokens=512, embed_dim=896, @@ -867,6 +870,7 @@ def encode( release_date="2025-06-25", languages=["eng-Latn", "zho-Hans"], n_parameters=494032768, + n_embedding_parameters=136_134_656, memory_usage_mb=942, max_tokens=512, embed_dim=896, @@ -898,6 +902,7 @@ def encode( release_date="2025-09-30", languages=["eng-Latn", "zho-Hans"], n_parameters=494032768, + n_embedding_parameters=136_134_656, memory_usage_mb=1885, max_tokens=512, embed_dim=896, @@ -948,6 +953,7 @@ def encode( open_weights=True, release_date="2025-11-06", n_parameters=11.76 * 1e9, + n_embedding_parameters=None, memory_usage_mb=44884, max_tokens=32768, embed_dim=3840, diff --git a/mteb/models/model_implementations/kblab.py b/mteb/models/model_implementations/kblab.py index 5859b796b2..8bc828eab4 100644 --- a/mteb/models/model_implementations/kblab.py +++ b/mteb/models/model_implementations/kblab.py @@ -10,6 +10,7 @@ revision="6b5e83cd29c03729cfdc33d13b1423399b0efb5c", release_date="2023-01-11", n_parameters=124690944, + n_embedding_parameters=38_649_600, memory_usage_mb=476, embed_dim=768, license="apache-2.0", diff --git a/mteb/models/model_implementations/kennethenevoldsen_models.py b/mteb/models/model_implementations/kennethenevoldsen_models.py index 388507afbe..f424f1bb68 100644 --- a/mteb/models/model_implementations/kennethenevoldsen_models.py +++ b/mteb/models/model_implementations/kennethenevoldsen_models.py @@ -12,6 +12,7 @@ revision="132c53391e7a780dc6a2f9a03724d0158fe7122c", release_date="2023-07-12", n_parameters=355087360, + n_embedding_parameters=51_200_000, memory_usage_mb=1554, embed_dim=1024, license="mit", @@ -47,6 +48,7 @@ revision="701bce95d499fa97610d57e8823c54fd1fb79930", release_date="2023-07-12", 
n_parameters=124445952, + n_embedding_parameters=38_403_840, memory_usage_mb=475, embed_dim=768, license="mit", diff --git a/mteb/models/model_implementations/kfst.py b/mteb/models/model_implementations/kfst.py index e1220638ea..c907ac4d6c 100644 --- a/mteb/models/model_implementations/kfst.py +++ b/mteb/models/model_implementations/kfst.py @@ -10,6 +10,7 @@ revision="d40c10ca7b1e68b5a8372f2d112dac9eb3279df1", release_date="2022-02-22", n_parameters=278043648, + n_embedding_parameters=192_001_536, memory_usage_mb=1061, embed_dim=768, license="not specified", diff --git a/mteb/models/model_implementations/kowshik24_models.py b/mteb/models/model_implementations/kowshik24_models.py index 086fea9901..f83b83ccae 100644 --- a/mteb/models/model_implementations/kowshik24_models.py +++ b/mteb/models/model_implementations/kowshik24_models.py @@ -9,6 +9,7 @@ revision="6689c21e69be5950596bad084457cbaa138728d8", release_date="2025-11-10", n_parameters=278_000_000, + n_embedding_parameters=192_001_536, memory_usage_mb=1061, embed_dim=768, license="apache-2.0", diff --git a/mteb/models/model_implementations/lens_models.py b/mteb/models/model_implementations/lens_models.py index 613f39aaf3..e12e21cde0 100644 --- a/mteb/models/model_implementations/lens_models.py +++ b/mteb/models/model_implementations/lens_models.py @@ -18,6 +18,7 @@ revision="e473b33364e6c48a324796fd1411d3b93670c6fe", release_date="2025-01-17", n_parameters=int(7.11 * 1e9), + n_embedding_parameters=131_084_288, memory_usage_mb=27125, embed_dim=4000, license="apache-2.0", @@ -41,6 +42,7 @@ revision="a0b87bd91cb27b6f2f0b0fe22c28026da1d464ef", release_date="2025-01-17", n_parameters=int(7.11 * 1e9), + n_embedding_parameters=131_084_288, memory_usage_mb=27125, embed_dim=8000, license="apache-2.0", diff --git a/mteb/models/model_implementations/lgai_embedding_models.py b/mteb/models/model_implementations/lgai_embedding_models.py index 4bf7bbc413..d9d2fcacd3 100644 --- 
a/mteb/models/model_implementations/lgai_embedding_models.py +++ b/mteb/models/model_implementations/lgai_embedding_models.py @@ -52,6 +52,7 @@ revision="5e0b2316acc8c2e2941ded6b9cb200b1cb313e65", release_date="2025-06-11", n_parameters=7_110_000_000, + n_embedding_parameters=131_084_288, memory_usage_mb=27125, embed_dim=4096, license="apache-2.0", diff --git a/mteb/models/model_implementations/linq_models.py b/mteb/models/model_implementations/linq_models.py index 237eba5ee5..b6dac1cdc0 100644 --- a/mteb/models/model_implementations/linq_models.py +++ b/mteb/models/model_implementations/linq_models.py @@ -43,6 +43,7 @@ def instruction_template( revision="0c1a0b0589177079acc552433cad51d7c9132379", release_date="2024-05-29", # initial commit of hf model. n_parameters=7_110_000_000, + n_embedding_parameters=None, memory_usage_mb=13563, embed_dim=4096, license="cc-by-nc-4.0", diff --git a/mteb/models/model_implementations/listconranker.py b/mteb/models/model_implementations/listconranker.py index 76df6f2239..f80c6406df 100644 --- a/mteb/models/model_implementations/listconranker.py +++ b/mteb/models/model_implementations/listconranker.py @@ -123,6 +123,7 @@ def predict( revision="95ae6a5f422a916bc36520f0f3e198e7d91520a0", release_date="2024-12-11", n_parameters=401_000_000, + n_embedding_parameters=None, memory_usage_mb=1242, similarity_fn_name="cosine", training_datasets=listconranker_training_datasets, diff --git a/mteb/models/model_implementations/llm2clip_models.py b/mteb/models/model_implementations/llm2clip_models.py index 6398b650a5..dfaedc8e5d 100644 --- a/mteb/models/model_implementations/llm2clip_models.py +++ b/mteb/models/model_implementations/llm2clip_models.py @@ -194,6 +194,7 @@ def encode( release_date="2024-11-07", modalities=["image", "text"], n_parameters=579_000_000, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=None, embed_dim=1280, @@ -219,6 +220,7 @@ def encode( release_date="2024-11-07", modalities=["image", "text"], 
n_parameters=578_000_000, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=None, embed_dim=1280, @@ -243,6 +245,7 @@ def encode( release_date="2024-11-07", modalities=["image", "text"], n_parameters=361_000_000, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=None, embed_dim=1280, diff --git a/mteb/models/model_implementations/llm2vec_models.py b/mteb/models/model_implementations/llm2vec_models.py index 4699016597..2bc4c0ea50 100644 --- a/mteb/models/model_implementations/llm2vec_models.py +++ b/mteb/models/model_implementations/llm2vec_models.py @@ -145,6 +145,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol: # TODO: Not sure what to put here as a model is made of two peft repos, each with a different revision release_date="2024-04-09", n_parameters=7_505_000_000, + n_embedding_parameters=None, memory_usage_mb=28629, max_tokens=8192, embed_dim=4096, @@ -174,6 +175,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol: revision="1cb7b735326d13a8541db8f57f35da5373f5e9c6", release_date="2024-04-09", n_parameters=7_505_000_000, + n_embedding_parameters=None, memory_usage_mb=28629, max_tokens=8192, embed_dim=4096, @@ -203,6 +205,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol: revision="0ae69bdd5816105778b971c3138e8f8a18eaa3ae", release_date="2024-04-09", n_parameters=7_111_000_000, + n_embedding_parameters=131_072_000, memory_usage_mb=27126, max_tokens=32768, embed_dim=4096, @@ -232,6 +235,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol: revision="2c055a5d77126c0d3dc6cd8ffa30e2908f4f45f8", release_date="2024-04-09", n_parameters=7_111_000_000, + n_embedding_parameters=131_072_000, memory_usage_mb=27126, max_tokens=32768, embed_dim=4096, @@ -261,6 +265,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol: revision="2c055a5d77126c0d3dc6cd8ffa30e2908f4f45f8", release_date="2024-04-09", n_parameters=7_111_000_000, + n_embedding_parameters=None, memory_usage_mb=27126, max_tokens=32768, embed_dim=4096, @@ -290,6 
+295,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol: revision="a76944871d169ebe7c97eb921764cd063afed785", release_date="2024-04-09", n_parameters=7_111_000_000, + n_embedding_parameters=None, memory_usage_mb=27126, max_tokens=32768, embed_dim=4096, @@ -319,6 +325,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol: revision="a5943d406c6b016fef3f07906aac183cf1a0b47d", release_date="2024-04-09", n_parameters=7_111_000_000, + n_embedding_parameters=65_536_000, memory_usage_mb=27126, max_tokens=32768, embed_dim=4096, @@ -348,6 +355,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol: revision="a5943d406c6b016fef3f07906aac183cf1a0b47d", release_date="2024-04-09", n_parameters=7_111_000_000, + n_embedding_parameters=65_536_000, memory_usage_mb=27126, max_tokens=32768, embed_dim=4096, diff --git a/mteb/models/model_implementations/mcinext_models.py b/mteb/models/model_implementations/mcinext_models.py index 9c3ebc7f78..4740754e08 100644 --- a/mteb/models/model_implementations/mcinext_models.py +++ b/mteb/models/model_implementations/mcinext_models.py @@ -358,6 +358,7 @@ def encode( revision="1", release_date="2025-05-10", n_parameters=124_441_344, + n_embedding_parameters=None, memory_usage_mb=475, embed_dim=768, license="not specified", @@ -426,6 +427,7 @@ def encode( revision="1", release_date="2025-05-10", n_parameters=38_736_384, + n_embedding_parameters=None, memory_usage_mb=148, embed_dim=512, license="not specified", @@ -493,6 +495,7 @@ def encode( revision="1", release_date="2025-05-10", n_parameters=124_441_344, + n_embedding_parameters=None, memory_usage_mb=475, embed_dim=768, license="not specified", diff --git a/mteb/models/model_implementations/mdbr_models.py b/mteb/models/model_implementations/mdbr_models.py index e52c66f540..eee86be59c 100644 --- a/mteb/models/model_implementations/mdbr_models.py +++ b/mteb/models/model_implementations/mdbr_models.py @@ -45,6 +45,7 @@ "Transformers", ], n_parameters=22_861_056, + 
n_embedding_parameters=11_720_448, memory_usage_mb=86, max_tokens=512, embed_dim=768, @@ -79,6 +80,7 @@ "Transformers", ], n_parameters=22_958_592, + n_embedding_parameters=11_720_448, memory_usage_mb=86, max_tokens=512, embed_dim=1024, diff --git a/mteb/models/model_implementations/misc_models.py b/mteb/models/model_implementations/misc_models.py index 12925d8f58..52b8e66e77 100644 --- a/mteb/models/model_implementations/misc_models.py +++ b/mteb/models/model_implementations/misc_models.py @@ -18,6 +18,7 @@ release_date="2024-10-31", languages=["eng-Latn"], n_parameters=7110660096, + n_embedding_parameters=None, memory_usage_mb=13563, max_tokens=32768.0, embed_dim=None, @@ -47,6 +48,7 @@ languages=[], loader=sentence_transformers_loader, n_parameters=278043648, + n_embedding_parameters=192_001_536, memory_usage_mb=1061, max_tokens=514.0, embed_dim=768, @@ -148,6 +150,7 @@ languages=["eng-Latn"], loader=sentence_transformers_loader, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=None, embed_dim=768, @@ -215,6 +218,7 @@ languages=[], loader=sentence_transformers_loader, n_parameters=2506172416, + n_embedding_parameters=None, memory_usage_mb=9560, max_tokens=8192.0, embed_dim=2048, @@ -250,6 +254,7 @@ trust_remote_code=True, ), n_parameters=278043648, + n_embedding_parameters=192_001_536, memory_usage_mb=1061, max_tokens=514.0, embed_dim=768, @@ -299,6 +304,7 @@ trust_remote_code=True, ), n_parameters=559890432, + n_embedding_parameters=256_002_048, memory_usage_mb=2136, max_tokens=514.0, embed_dim=1024, @@ -348,6 +354,7 @@ trust_remote_code=True, ), n_parameters=117653760, + n_embedding_parameters=96_014_208, memory_usage_mb=449, max_tokens=512.0, embed_dim=384, @@ -394,6 +401,7 @@ languages=None, loader=sentence_transformers_loader, n_parameters=17389824, + n_embedding_parameters=11_720_448, memory_usage_mb=66, max_tokens=512.0, embed_dim=384, @@ -418,6 +426,7 @@ languages=None, loader=sentence_transformers_loader, 
n_parameters=22713216, + n_embedding_parameters=11_720_448, memory_usage_mb=87, max_tokens=512.0, embed_dim=384, @@ -442,6 +451,7 @@ languages=None, loader=sentence_transformers_loader, n_parameters=15615360, + n_embedding_parameters=11_720_448, memory_usage_mb=60, max_tokens=512.0, embed_dim=384, @@ -466,6 +476,7 @@ languages=None, loader=sentence_transformers_loader, n_parameters=15615360, + n_embedding_parameters=11_720_448, memory_usage_mb=60, max_tokens=512.0, embed_dim=384, @@ -490,6 +501,7 @@ languages=None, loader=sentence_transformers_loader, n_parameters=17389824, + n_embedding_parameters=11_720_448, memory_usage_mb=66, max_tokens=512.0, embed_dim=384, @@ -514,6 +526,7 @@ languages=None, loader=sentence_transformers_loader, n_parameters=17389824, + n_embedding_parameters=11_720_448, memory_usage_mb=66, max_tokens=512.0, embed_dim=384, @@ -537,6 +550,7 @@ languages=None, loader=sentence_transformers_loader, n_parameters=19164288, + n_embedding_parameters=11_720_448, memory_usage_mb=73, max_tokens=512.0, embed_dim=384, @@ -560,6 +574,7 @@ languages=["fra-Latn"], loader=sentence_transformers_loader, n_parameters=559890432, + n_embedding_parameters=256_002_048, memory_usage_mb=2136, max_tokens=514.0, embed_dim=1024, @@ -583,6 +598,7 @@ languages=["ara-Arab"], loader=sentence_transformers_loader, n_parameters=135193344, + n_embedding_parameters=49_152_000, memory_usage_mb=516, max_tokens=512.0, embed_dim=768, @@ -615,6 +631,7 @@ languages=["ara-Arab"], loader=sentence_transformers_loader, n_parameters=117653760, + n_embedding_parameters=96_014_208, memory_usage_mb=449, max_tokens=512.0, embed_dim=384, @@ -640,6 +657,7 @@ languages=["ara-Arab"], loader=sentence_transformers_loader, n_parameters=278043648, + n_embedding_parameters=192_001_536, memory_usage_mb=1061, max_tokens=514.0, embed_dim=768, @@ -674,6 +692,7 @@ languages=["ara-Arab"], loader=sentence_transformers_loader, n_parameters=470926848, + n_embedding_parameters=384_885_504, memory_usage_mb=1796, 
max_tokens=512.0, embed_dim=768, @@ -708,6 +727,7 @@ languages=["ara-Arab"], loader=sentence_transformers_loader, n_parameters=109486464, + n_embedding_parameters=23_444_736, memory_usage_mb=418, max_tokens=514.0, embed_dim=768, @@ -742,6 +762,7 @@ languages=["ara-Arab"], loader=sentence_transformers_loader, n_parameters=162841344, + n_embedding_parameters=76_800_000, memory_usage_mb=621, max_tokens=512.0, embed_dim=768, @@ -774,6 +795,7 @@ languages=None, loader=sentence_transformers_loader, n_parameters=None, + n_embedding_parameters=31_254_528, memory_usage_mb=None, max_tokens=512.0, embed_dim=1024, @@ -797,6 +819,7 @@ languages=None, loader=sentence_transformers_loader, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=514.0, embed_dim=768, @@ -829,6 +852,7 @@ languages=None, loader=sentence_transformers_loader, n_parameters=1279887360, + n_embedding_parameters=65_536_000, memory_usage_mb=2441, max_tokens=2048.0, embed_dim=2048, @@ -852,6 +876,7 @@ languages=None, loader=sentence_transformers_loader, n_parameters=1279887360, + n_embedding_parameters=65_536_000, memory_usage_mb=2441, max_tokens=2048.0, embed_dim=2048, @@ -875,6 +900,7 @@ languages=["fra-Latn", "eng-Latn"], loader=sentence_transformers_loader, n_parameters=1279887360, + n_embedding_parameters=65_536_000, memory_usage_mb=2441, max_tokens=2048.0, embed_dim=2048, @@ -899,6 +925,7 @@ languages=["eng-Latn"], loader=sentence_transformers_loader, n_parameters=109482752, + n_embedding_parameters=23_440_896, memory_usage_mb=209, max_tokens=512.0, embed_dim=768, @@ -928,6 +955,7 @@ languages=["eng-Latn"], loader=sentence_transformers_loader, n_parameters=335142400, + n_embedding_parameters=31_254_528, memory_usage_mb=639, max_tokens=512.0, embed_dim=1024, @@ -957,6 +985,7 @@ languages=["eng-Latn"], loader=sentence_transformers_loader, n_parameters=33360512, + n_embedding_parameters=11_720_448, memory_usage_mb=64, max_tokens=512.0, embed_dim=384, @@ -986,6 +1015,7 @@ 
languages=["pol-Latn"], loader=sentence_transformers_loader, n_parameters=103705344, + n_embedding_parameters=None, memory_usage_mb=396, max_tokens=512.0, embed_dim=768, @@ -1009,6 +1039,7 @@ languages=["pol-Latn"], loader=sentence_transformers_loader, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=514.0, embed_dim=768, @@ -1032,6 +1063,7 @@ languages=["pol-Latn"], loader=sentence_transformers_loader, n_parameters=278043648, + n_embedding_parameters=192_001_536, memory_usage_mb=1061, max_tokens=514.0, embed_dim=768, @@ -1063,6 +1095,7 @@ languages=["eng-Latn"], loader=sentence_transformers_loader, n_parameters=None, + n_embedding_parameters=23_440_896, memory_usage_mb=None, max_tokens=4096.0, embed_dim=None, @@ -1092,6 +1125,7 @@ languages=["pol-Latn"], loader=sentence_transformers_loader, n_parameters=559890432, + n_embedding_parameters=256_002_048, memory_usage_mb=2136, max_tokens=514.0, embed_dim=1024, @@ -1123,6 +1157,7 @@ languages=["pol-Latn"], loader=sentence_transformers_loader, n_parameters=117653760, + n_embedding_parameters=96_014_208, memory_usage_mb=449, max_tokens=512.0, embed_dim=384, @@ -1154,6 +1189,7 @@ languages=["pol-Latn"], loader=sentence_transformers_loader, n_parameters=124442880, + n_embedding_parameters=38_400_768, memory_usage_mb=475, max_tokens=514.0, embed_dim=768, @@ -1185,6 +1221,7 @@ languages=["pol-Latn"], loader=sentence_transformers_loader, n_parameters=434961408, + n_embedding_parameters=131_073_024, memory_usage_mb=1659, max_tokens=514.0, embed_dim=1024, @@ -1271,6 +1308,7 @@ languages=udever_languages, loader=sentence_transformers_loader, n_parameters=None, + n_embedding_parameters=385_351_680, memory_usage_mb=None, max_tokens=None, embed_dim=None, @@ -1300,6 +1338,7 @@ languages=udever_languages, loader=sentence_transformers_loader, n_parameters=None, + n_embedding_parameters=642_252_800, memory_usage_mb=None, max_tokens=None, embed_dim=None, @@ -1329,6 +1368,7 @@ languages=udever_languages, 
loader=sentence_transformers_loader, n_parameters=None, + n_embedding_parameters=256_901_120, memory_usage_mb=None, max_tokens=None, embed_dim=None, @@ -1358,6 +1398,7 @@ languages=udever_languages, loader=sentence_transformers_loader, n_parameters=None, + n_embedding_parameters=1_027_604_480, memory_usage_mb=None, max_tokens=None, embed_dim=None, @@ -1387,6 +1428,7 @@ languages=["eng-Latn"], loader=sentence_transformers_loader, n_parameters=109482240, + n_embedding_parameters=23_440_896, memory_usage_mb=418, max_tokens=512.0, embed_dim=768, @@ -1437,6 +1479,7 @@ languages=["eng-Latn"], loader=sentence_transformers_loader, n_parameters=22713216, + n_embedding_parameters=11_720_448, memory_usage_mb=87, max_tokens=512.0, embed_dim=384, @@ -1487,6 +1530,7 @@ languages=["eng-Latn"], loader=sentence_transformers_loader, n_parameters=335141888, + n_embedding_parameters=31_254_528, memory_usage_mb=1278, max_tokens=512.0, embed_dim=1024, @@ -1537,6 +1581,7 @@ languages=["eng-Latn"], loader=sentence_transformers_loader, n_parameters=33360000, + n_embedding_parameters=11_720_448, memory_usage_mb=127, max_tokens=512.0, embed_dim=384, @@ -1587,6 +1632,7 @@ languages=None, loader=sentence_transformers_loader, n_parameters=None, + n_embedding_parameters=1_026_793_472, memory_usage_mb=None, max_tokens=None, embed_dim=4096, @@ -1616,6 +1662,7 @@ languages=["deu-Latn"], loader=sentence_transformers_loader, n_parameters=335736320, + n_embedding_parameters=31_848_448, memory_usage_mb=1281, max_tokens=512.0, embed_dim=1024, @@ -1640,6 +1687,7 @@ languages=["eng-Latn"], loader=sentence_transformers_loader, n_parameters=33360000, + n_embedding_parameters=11_720_448, memory_usage_mb=127, max_tokens=512.0, embed_dim=384, @@ -1678,6 +1726,7 @@ languages=["eng-Latn"], loader=sentence_transformers_loader, n_parameters=33360000, + n_embedding_parameters=11720448, memory_usage_mb=127, max_tokens=512.0, embed_dim=384, @@ -1701,6 +1750,7 @@ languages=["eng-Latn"], 
loader=sentence_transformers_loader, n_parameters=22713216, + n_embedding_parameters=11_720_448, memory_usage_mb=87, max_tokens=512.0, embed_dim=384, @@ -1724,6 +1774,7 @@ languages=None, loader=sentence_transformers_loader, n_parameters=None, + n_embedding_parameters=192_001_536, memory_usage_mb=1061, max_tokens=514.0, embed_dim=768, @@ -1747,6 +1798,7 @@ languages=["eng-Latn"], loader=sentence_transformers_loader, n_parameters=None, + n_embedding_parameters=23_440_896, memory_usage_mb=None, max_tokens=512.0, embed_dim=None, @@ -1770,6 +1822,7 @@ languages=None, loader=sentence_transformers_loader, n_parameters=98688000, + n_embedding_parameters=None, memory_usage_mb=158, max_tokens=512.0, embed_dim=1024, @@ -1793,6 +1846,7 @@ languages=["ara-Arab", "eng-Latn"], loader=sentence_transformers_loader, n_parameters=559890432, + n_embedding_parameters=256_002_048, memory_usage_mb=2136, max_tokens=514.0, embed_dim=1024, @@ -1833,6 +1887,7 @@ release_date="2024-09-04", languages=["zho-Hans", "eng-Latn"], n_parameters=2724880896, + n_embedding_parameters=282_822_912, memory_usage_mb=5197, max_tokens=512.0, embed_dim=2304, @@ -1857,6 +1912,7 @@ languages=["ara-Arab", "eng-Latn"], loader=sentence_transformers_loader, n_parameters=135193344, + n_embedding_parameters=49_152_000, memory_usage_mb=516, max_tokens=512.0, embed_dim=768, @@ -1888,6 +1944,7 @@ languages=["zho-Hans"], loader=sentence_transformers_loader, n_parameters=None, + n_embedding_parameters=16_226_304, memory_usage_mb=None, # Not visible on repo max_tokens=512, embed_dim=128, @@ -1916,6 +1973,7 @@ languages=["zho-Hans"], loader=sentence_transformers_loader, n_parameters=int(74.2 * 1e6), + n_embedding_parameters=16_226_304, memory_usage_mb=283, max_tokens=1024, embed_dim=768, @@ -1939,6 +1997,7 @@ languages=["zho-Hans"], loader=sentence_transformers_loader, n_parameters=int(326 * 1e6), + n_embedding_parameters=21_635_072, memory_usage_mb=1244, max_tokens=512, embed_dim=1024, @@ -1963,6 +2022,7 @@ 
languages=["zho-Hans"], loader=sentence_transformers_loader, n_parameters=int(326 * 1e6), + n_embedding_parameters=21_635_072, memory_usage_mb=1242, max_tokens=512, embed_dim=768, @@ -1987,6 +2047,7 @@ languages=["zho-Hans"], loader=sentence_transformers_loader, n_parameters=int(326 * 1e6), + n_embedding_parameters=21_635_072, memory_usage_mb=1244, max_tokens=512, embed_dim=1024, @@ -2010,6 +2071,7 @@ languages=["zho-Hans"], loader=sentence_transformers_loader, n_parameters=int(326 * 1e6), + n_embedding_parameters=21_635_072, memory_usage_mb=1242, max_tokens=512, embed_dim=768, @@ -2043,6 +2105,7 @@ release_date="2023-10-10", languages=["eng-Latn"], n_parameters=int(335 * 1e6), + n_embedding_parameters=31_254_528, memory_usage_mb=1278, max_tokens=512, embed_dim=1024, diff --git a/mteb/models/model_implementations/mixedbread_ai_models.py b/mteb/models/model_implementations/mixedbread_ai_models.py index 0376267c76..0cb85daf8f 100644 --- a/mteb/models/model_implementations/mixedbread_ai_models.py +++ b/mteb/models/model_implementations/mixedbread_ai_models.py @@ -31,6 +31,7 @@ revision="990580e27d329c7408b3741ecff85876e128e203", release_date="2024-03-07", # initial commit of hf model. n_parameters=335_000_000, + n_embedding_parameters=31_254_528, memory_usage_mb=639, max_tokens=512, embed_dim=1024, @@ -75,6 +76,7 @@ revision="7e639ca8e344af398876ead3b19ec3c0b9068f49", release_date="2024-03-04", # initial commit of hf model. n_parameters=335_000_000, + n_embedding_parameters=31_254_528, memory_usage_mb=None, max_tokens=512, embed_dim=768, @@ -106,6 +108,7 @@ revision="2f741ec33328bb57e4704e1238fc59a4a5745705", release_date="2024-08-13", # initial commit of hf model. 
n_parameters=24_100_000, + n_embedding_parameters=11_720_448, memory_usage_mb=None, max_tokens=512, embed_dim=384, diff --git a/mteb/models/model_implementations/mme5_models.py b/mteb/models/model_implementations/mme5_models.py index e52c79277d..49051fef27 100644 --- a/mteb/models/model_implementations/mme5_models.py +++ b/mteb/models/model_implementations/mme5_models.py @@ -16,7 +16,8 @@ revision="cbb328b9bf9ff5362c852c3166931903226d46f1", release_date="2025-02-12", languages=["eng-Latn"], n_parameters=10_600_000_000, # 10.6B + n_embedding_parameters=None, memory_usage_mb=20300, max_tokens=128_000, embed_dim=4096, diff --git a/mteb/models/model_implementations/moco_models.py b/mteb/models/model_implementations/moco_models.py index 71e0144a2a..9def2deb8a 100644 --- a/mteb/models/model_implementations/moco_models.py +++ b/mteb/models/model_implementations/moco_models.py @@ -130,6 +130,7 @@ def encode( release_date="2024-06-03", modalities=["image"], n_parameters=86_600_000, + n_embedding_parameters=None, memory_usage_mb=330, max_tokens=None, embed_dim=768, @@ -154,6 +155,7 @@ def encode( release_date="2024-06-03", modalities=["image"], n_parameters=304_000_000, + n_embedding_parameters=None, memory_usage_mb=1161, max_tokens=None, embed_dim=1024, diff --git a/mteb/models/model_implementations/mod_models.py b/mteb/models/model_implementations/mod_models.py index bd04cb7687..cf2a2bed71 100644 --- a/mteb/models/model_implementations/mod_models.py +++ b/mteb/models/model_implementations/mod_models.py @@ -175,6 +175,7 @@ def instruction_template( revision="acbb5b70fdab262226a6af2bc62001de8021b05c", release_date="2025-12-14", n_parameters=4021774336, + n_embedding_parameters=None, memory_usage_mb=7671, embed_dim=2560, max_tokens=32768, diff --git a/mteb/models/model_implementations/model2vec_models.py b/mteb/models/model_implementations/model2vec_models.py index 1b68b9a27a..55d229b554 100644 ---
a/mteb/models/model_implementations/model2vec_models.py +++ b/mteb/models/model_implementations/model2vec_models.py @@ -173,6 +173,7 @@ def encode( revision="5f4f5ca159b7321a8b39739bba0794fa0debddf4", release_date="2024-09-21", n_parameters=int(103 * 1e6), + n_embedding_parameters=int(103 * 1e6), memory_usage_mb=391, max_tokens=np.inf, # Theoretically infinite embed_dim=256, @@ -199,6 +200,7 @@ def encode( revision="38ebd7f10f71e67fa8db898290f92b82e9cfff2b", release_date="2024-09-21", n_parameters=int(102 * 1e6), + n_embedding_parameters=int(102 * 1e6), memory_usage_mb=391, max_tokens=np.inf, embed_dim=256, @@ -224,6 +226,7 @@ def encode( revision="02460ae401a22b09d2c6652e23371398329551e2", release_date="2024-09-21", n_parameters=int(7.56 * 1e6), + n_embedding_parameters=int(7.56 * 1e6), memory_usage_mb=29, max_tokens=np.inf, embed_dim=256, @@ -249,6 +252,7 @@ def encode( revision="2cf4ec4e1f51aeca6c55cf9b93097d00711a6305", release_date="2024-09-21", n_parameters=int(128 * 1e6), + n_embedding_parameters=int(128 * 1e6), memory_usage_mb=489, max_tokens=np.inf, embed_dim=256, @@ -274,6 +278,7 @@ def encode( revision="86db093558fbced2072b929eb1690bce5272bd4b", release_date="2024-10-29", n_parameters=int(2 * 1e6), + n_embedding_parameters=int(2 * 1e6), memory_usage_mb=7, max_tokens=np.inf, embed_dim=64, @@ -299,6 +304,7 @@ def encode( revision="81b1802ada41afcd0987a37dc15e569c9fa76f04", release_date="2024-10-29", n_parameters=int(3.78 * 1e6), + n_embedding_parameters=int(3.78 * 1e6), memory_usage_mb=14, max_tokens=np.inf, embed_dim=128, @@ -324,6 +330,7 @@ def encode( revision="dcbec7aa2d52fc76754ac6291803feedd8c619ce", release_date="2024-10-29", n_parameters=int(7.56 * 1e6), + n_embedding_parameters=int(7.56 * 1e6), memory_usage_mb=29, max_tokens=np.inf, embed_dim=256, @@ -349,6 +356,7 @@ def encode( revision="38ebd7f10f71e67fa8db898290f92b82e9cfff2a", release_date="2025-05-23", n_parameters=128 * 1e6, + n_embedding_parameters=128 * 1e6, memory_usage_mb=489, 
max_tokens=np.inf, embed_dim=256, @@ -374,6 +382,7 @@ def encode( revision="bac5e3b12fb8c650e92a19c41b436732c4f16e9e", release_date="2025-01-03", n_parameters=1 * 1e5, + n_embedding_parameters=1 * 1e5, memory_usage_mb=0, max_tokens=np.inf, embed_dim=64, @@ -398,6 +407,7 @@ def encode( revision="34ba71e35c393fdad7ed695113f653feb407b16b", release_date="2025-01-03", n_parameters=5 * 1e5, + n_embedding_parameters=5 * 1e5, memory_usage_mb=2, max_tokens=np.inf, embed_dim=64, @@ -422,6 +432,7 @@ def encode( revision="2b7fed222594708da6d88bcda92ae9b434b7ddd1", release_date="2025-01-03", n_parameters=1 * 1e6, + n_embedding_parameters=1 * 1e6, memory_usage_mb=2, max_tokens=np.inf, embed_dim=64, @@ -446,6 +457,7 @@ def encode( revision="1d7bbe04d6713e425161146bfdc71473cbed498a", release_date="2025-01-03", n_parameters=1.95 * 1e6, + n_embedding_parameters=1.95 * 1e6, memory_usage_mb=7, max_tokens=np.inf, embed_dim=64, @@ -470,6 +482,7 @@ def encode( revision="387d350015e963744f4fafe56a574b7cd48646c9", release_date="2025-01-03", n_parameters=7.81 * 1e6, + n_embedding_parameters=7.81 * 1e6, memory_usage_mb=30, max_tokens=np.inf, embed_dim=256, diff --git a/mteb/models/model_implementations/moka_models.py b/mteb/models/model_implementations/moka_models.py index 61bfa1b477..d67aef7849 100644 --- a/mteb/models/model_implementations/moka_models.py +++ b/mteb/models/model_implementations/moka_models.py @@ -97,6 +97,7 @@ revision="764b537a0e50e5c7d64db883f2d2e051cbe3c64c", release_date="2023-06-06", # first commit n_parameters=int(102 * 1e6), + n_embedding_parameters=16_226_304, memory_usage_mb=390, embed_dim=768, # They don't give a specific license but commercial use is not allowed @@ -123,6 +124,7 @@ revision="44c696631b2a8c200220aaaad5f987f096e986df", release_date="2023-06-02", # first commit n_parameters=None, + n_embedding_parameters=10_817_536, memory_usage_mb=None, # Can't be seen on HF page embed_dim=512, # They don't give a specific license but commercial use is not allowed 
@@ -149,6 +151,7 @@ revision="12900375086c37ba5d83d1e417b21dc7d1d1f388", release_date="2023-06-21", # first commit n_parameters=None, + n_embedding_parameters=21_635_072, memory_usage_mb=None, # Can't be seen on HF page embed_dim=768, # They don't give a specific license but commercial use is not allowed diff --git a/mteb/models/model_implementations/nbailab.py b/mteb/models/model_implementations/nbailab.py index 7cf776d69b..483b75548f 100644 --- a/mteb/models/model_implementations/nbailab.py +++ b/mteb/models/model_implementations/nbailab.py @@ -12,6 +12,7 @@ revision="b95656350a076aeafd2d23763660f80655408cc6", release_date="2022-11-23", n_parameters=1_780_000_000, + n_embedding_parameters=91_812_096, memory_usage_mb=678, embed_dim=4096, license="apache-2.0", @@ -34,6 +35,7 @@ revision="f9d0fc184adab4dc354d85e1854b7634540d7550", release_date="2021-04-29", n_parameters=355087360, + n_embedding_parameters=51_200_000, memory_usage_mb=1359, embed_dim=1024, license="cc-by-4.0", @@ -56,6 +58,7 @@ revision="9417c3f62a3adc99f17ff92bff446f35d011f994", release_date="2021-01-13", n_parameters=177853440, + n_embedding_parameters=91_812_096, memory_usage_mb=681, embed_dim=768, license="cc-by-4.0", diff --git a/mteb/models/model_implementations/no_instruct_sentence_models.py b/mteb/models/model_implementations/no_instruct_sentence_models.py index e4c4bdd9a7..0cbbf5d4b5 100644 --- a/mteb/models/model_implementations/no_instruct_sentence_models.py +++ b/mteb/models/model_implementations/no_instruct_sentence_models.py @@ -110,6 +110,7 @@ def encode( revision="b38747000553d8268915c95a55fc87e707c9aadd", release_date="2024-05-01", # first commit n_parameters=33_400_000, + n_embedding_parameters=11_720_448, memory_usage_mb=127, max_tokens=512, embed_dim=384, diff --git a/mteb/models/model_implementations/nomic_models.py b/mteb/models/model_implementations/nomic_models.py index 7a12fefb88..c448cb578d 100644 --- a/mteb/models/model_implementations/nomic_models.py +++ 
b/mteb/models/model_implementations/nomic_models.py @@ -215,6 +215,7 @@ def encode( release_date="2024-02-10", # first commit citation=NOMIC_CITATION, n_parameters=137_000_000, + n_embedding_parameters=None, memory_usage_mb=522, max_tokens=8192, embed_dim=768, @@ -249,6 +250,7 @@ def encode( revision="0759316f275aa0cb93a5b830973843ca66babcf5", release_date="2024-01-31", # first commit n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=522, max_tokens=8192, embed_dim=768, @@ -284,6 +286,7 @@ def encode( revision="7d948905c5d5d3874fa55a925d68e49dbf411e5f", release_date="2024-01-15", # first commit n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=8192, embed_dim=768, @@ -312,6 +315,7 @@ def encode( revision="b53d557b15ae63852847c222d336c1609eced93c", release_date="2024-01-15", # first commit n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=8192, embed_dim=768, @@ -340,6 +344,7 @@ def encode( revision="5960f1566fb7cb1adf1eb6e816639cf4646d9b12", release_date="2024-12-29", n_parameters=149_000_000, + n_embedding_parameters=None, memory_usage_mb=568, max_tokens=8192, embed_dim=768, @@ -479,6 +484,7 @@ def encode( revision="1066b6599d099fbb93dfcb64f9c37a7c9e503e85", release_date="2025-02-07", n_parameters=475292928, + n_embedding_parameters=None, memory_usage_mb=1813, max_tokens=512, embed_dim=768, diff --git a/mteb/models/model_implementations/nomic_models_vision.py b/mteb/models/model_implementations/nomic_models_vision.py index c86e44893b..3cb1db1f0f 100644 --- a/mteb/models/model_implementations/nomic_models_vision.py +++ b/mteb/models/model_implementations/nomic_models_vision.py @@ -175,6 +175,7 @@ def encode( release_date="2024-06-08", modalities=["image", "text"], n_parameters=92_900_000, + n_embedding_parameters=None, memory_usage_mb=355, max_tokens=2048, embed_dim=768, diff --git a/mteb/models/model_implementations/nvidia_llama_nemoretriever_colemb.py 
b/mteb/models/model_implementations/nvidia_llama_nemoretriever_colemb.py index a730bdd0fc..f3ac386871 100644 --- a/mteb/models/model_implementations/nvidia_llama_nemoretriever_colemb.py +++ b/mteb/models/model_implementations/nvidia_llama_nemoretriever_colemb.py @@ -162,6 +162,7 @@ def encode( release_date="2025-06-27", modalities=["image", "text"], n_parameters=2_418_000_000, + n_embedding_parameters=None, memory_usage_mb=4610, max_tokens=8192, embed_dim=2048, @@ -189,6 +190,7 @@ def encode( release_date="2025-06-27", modalities=["image", "text"], n_parameters=4_407_000_000, + n_embedding_parameters=None, memory_usage_mb=8403, max_tokens=8192, embed_dim=3072, diff --git a/mteb/models/model_implementations/nvidia_models.py b/mteb/models/model_implementations/nvidia_models.py index 21208bcc1b..7176cdd27a 100644 --- a/mteb/models/model_implementations/nvidia_models.py +++ b/mteb/models/model_implementations/nvidia_models.py @@ -204,6 +204,7 @@ def __init__( revision="7604d305b621f14095a1aa23d351674c2859553a", release_date="2024-09-09", # initial commit of hf model. n_parameters=7_850_000_000, + n_embedding_parameters=None, memory_usage_mb=14975, embed_dim=4096, license="cc-by-nc-4.0", @@ -235,6 +236,7 @@ def __init__( revision="570834afd5fef5bf3a3c2311a2b6e0a66f6f4f2c", release_date="2024-09-13", # initial commit of hf model. 
n_parameters=7_850_000_000, + n_embedding_parameters=None, memory_usage_mb=14975, embed_dim=4096, license="cc-by-nc-4.0", @@ -624,6 +626,7 @@ def _extract_embeddings( revision="84a375593d27d3528beb4e104822515659e093b4", release_date="2025-10-23", n_parameters=7_504_924_672, + n_embedding_parameters=None, memory_usage_mb=28629, embed_dim=4096, license="https://huggingface.co/nvidia/llama-embed-nemotron-8b/blob/main/LICENSE", diff --git a/mteb/models/model_implementations/octen_models.py b/mteb/models/model_implementations/octen_models.py index 7c104a9795..c5dca56418 100644 --- a/mteb/models/model_implementations/octen_models.py +++ b/mteb/models/model_implementations/octen_models.py @@ -208,6 +208,7 @@ def instruction_template( revision="6e188e3b072c3e3678b235ad84e6e97bcbb71e8f", release_date="2025-12-30", n_parameters=4021774336, + n_embedding_parameters=None, memory_usage_mb=7671, embed_dim=2560, max_tokens=32768, @@ -238,6 +239,7 @@ def instruction_template( revision="f7db178d5a82fb841f606a6a67c423cead2fdbba", release_date="2025-12-23", n_parameters=7567295488, + n_embedding_parameters=None, memory_usage_mb=14433, embed_dim=4096, max_tokens=32768, diff --git a/mteb/models/model_implementations/openai_models.py b/mteb/models/model_implementations/openai_models.py index aa8d1ec29b..688e12ce80 100644 --- a/mteb/models/model_implementations/openai_models.py +++ b/mteb/models/model_implementations/openai_models.py @@ -185,6 +185,7 @@ def _to_numpy(self, embedding_response) -> np.ndarray: embed_dim=1536, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://openai.com/index/new-embedding-models-and-api-updates/", @@ -213,6 +214,7 @@ def _to_numpy(self, embedding_response) -> np.ndarray: framework=["API"], use_instructions=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, public_training_code=None, public_training_data=None, # assumed @@ -238,6 +240,7 @@ def 
_to_numpy(self, embedding_response) -> np.ndarray: framework=["API"], use_instructions=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, public_training_code=None, public_training_data=None, # assumed @@ -262,6 +265,7 @@ def _to_numpy(self, embedding_response) -> np.ndarray: embed_dim=512, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://openai.com/index/new-embedding-models-and-api-updates/", @@ -292,6 +296,7 @@ def _to_numpy(self, embedding_response) -> np.ndarray: framework=["API"], use_instructions=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, public_training_code=None, public_training_data=None, # assumed diff --git a/mteb/models/model_implementations/openclip_models.py b/mteb/models/model_implementations/openclip_models.py index 0211d97339..362be93e78 100644 --- a/mteb/models/model_implementations/openclip_models.py +++ b/mteb/models/model_implementations/openclip_models.py @@ -133,6 +133,7 @@ def encode( release_date="2023-04-26", modalities=["image", "text"], n_parameters=428_000_000, + n_embedding_parameters=None, memory_usage_mb=1633, max_tokens=77, embed_dim=768, @@ -159,6 +160,7 @@ def encode( release_date="2023-04-26", modalities=["image", "text"], n_parameters=151_000_000, + n_embedding_parameters=None, memory_usage_mb=576, max_tokens=77, embed_dim=512, @@ -185,6 +187,7 @@ def encode( release_date="2023-04-26", modalities=["image", "text"], n_parameters=150_000_000, + n_embedding_parameters=None, memory_usage_mb=572, max_tokens=77, embed_dim=512, @@ -211,6 +214,7 @@ def encode( release_date="2023-01-23", modalities=["image", "text"], n_parameters=2_540_000_000, + n_embedding_parameters=None, memory_usage_mb=9689, max_tokens=77, embed_dim=1280, @@ -237,6 +241,7 @@ def encode( release_date="2023-03-06", modalities=["image", "text"], n_parameters=1_367_000_000, + n_embedding_parameters=None, memory_usage_mb=5215, 
max_tokens=77, embed_dim=1024, @@ -263,6 +268,7 @@ def encode( release_date="2022-09-15", modalities=["image", "text"], n_parameters=986_000_000, + n_embedding_parameters=None, memory_usage_mb=3762, max_tokens=77, embed_dim=1024, @@ -289,6 +295,7 @@ def encode( release_date="2022-09-15", modalities=["image", "text"], n_parameters=428_000_000, + n_embedding_parameters=None, memory_usage_mb=1631, max_tokens=77, embed_dim=768, @@ -315,6 +322,7 @@ def encode( release_date="2022-09-15", modalities=["image", "text"], n_parameters=151_000_000, + n_embedding_parameters=None, memory_usage_mb=577, max_tokens=77, embed_dim=512, diff --git a/mteb/models/model_implementations/opensearch_neural_sparse_models.py b/mteb/models/model_implementations/opensearch_neural_sparse_models.py index 891835e374..5e877b0103 100644 --- a/mteb/models/model_implementations/opensearch_neural_sparse_models.py +++ b/mteb/models/model_implementations/opensearch_neural_sparse_models.py @@ -140,6 +140,7 @@ def encode( revision="a8abaa916125ee512a7a8f4d706d07eb0128a8e6", release_date="2025-06-18", n_parameters=137_394_234, + n_embedding_parameters=23_440_896, memory_usage_mb=549, embed_dim=30522, license="apache-2.0", @@ -166,6 +167,7 @@ def encode( revision="babf71f3c48695e2e53a978208e8aba48335e3c0", release_date="2025-03-28", n_parameters=66_985_530, + n_embedding_parameters=23_440_896, memory_usage_mb=267, embed_dim=30522, license="apache-2.0", @@ -188,6 +190,7 @@ def encode( revision="8921a26c78b8559d6604eb1f5c0b74c079bee38f", release_date="2024-07-17", n_parameters=66_985_530, + n_embedding_parameters=23_440_896, memory_usage_mb=267, embed_dim=30522, license="apache-2.0", @@ -211,6 +214,7 @@ def encode( revision="4af867a426867dfdd744097531046f4289a32fdd", release_date="2024-07-18", n_parameters=22_744_506, + n_embedding_parameters=11_720_448, memory_usage_mb=86, embed_dim=30522, license="apache-2.0", @@ -233,6 +237,7 @@ def encode( revision="98cdcbd72867c547f72f2b7b7bed9cdf9f09922d", 
release_date="2024-03-07", n_parameters=132_955_194, + n_embedding_parameters=23_440_896, memory_usage_mb=507, embed_dim=30522, license="apache-2.0", diff --git a/mteb/models/model_implementations/ops_moa_models.py b/mteb/models/model_implementations/ops_moa_models.py index 5a142ff1a3..c88f90923b 100644 --- a/mteb/models/model_implementations/ops_moa_models.py +++ b/mteb/models/model_implementations/ops_moa_models.py @@ -33,6 +33,7 @@ def encode(self, sentences: list[str], **kwargs) -> Array: languages=["zho-Hans"], loader=OPSWrapper, n_parameters=int(343 * 1e6), + n_embedding_parameters=21_635_072, memory_usage_mb=1308, max_tokens=512, embed_dim=1536, @@ -65,6 +66,7 @@ def encode(self, sentences: list[str], **kwargs) -> Array: languages=["zho-Hans"], loader=OPSWrapper, n_parameters=int(343 * 1e6), + n_embedding_parameters=21_635_072, memory_usage_mb=1242, max_tokens=512, embed_dim=1536, diff --git a/mteb/models/model_implementations/ordalietech_solon_embeddings_mini_beta_1_1.py b/mteb/models/model_implementations/ordalietech_solon_embeddings_mini_beta_1_1.py index 2d9b40492c..90eedad7ad 100644 --- a/mteb/models/model_implementations/ordalietech_solon_embeddings_mini_beta_1_1.py +++ b/mteb/models/model_implementations/ordalietech_solon_embeddings_mini_beta_1_1.py @@ -4,6 +4,7 @@ name="OrdalieTech/Solon-embeddings-mini-beta-1.1", languages=["fra-Latn"], n_parameters=210_000_000, + n_embedding_parameters=None, public_training_code=None, memory_usage_mb=808.0, open_weights=True, diff --git a/mteb/models/model_implementations/pawan_models.py b/mteb/models/model_implementations/pawan_models.py index 11a4746b17..ac1e3dc333 100644 --- a/mteb/models/model_implementations/pawan_models.py +++ b/mteb/models/model_implementations/pawan_models.py @@ -20,6 +20,7 @@ revision="32f295145802bdbd65699ad65fd27d2a5b69a909", release_date="2025-12-08", n_parameters=68_000_000, + n_embedding_parameters=None, memory_usage_mb=260, embed_dim=768, license="apache-2.0", diff --git 
a/mteb/models/model_implementations/piccolo_models.py b/mteb/models/model_implementations/piccolo_models.py index 4c47c807be..2d33526a81 100644 --- a/mteb/models/model_implementations/piccolo_models.py +++ b/mteb/models/model_implementations/piccolo_models.py @@ -12,6 +12,7 @@ revision="47c0a63b8f667c3482e05b2fd45577bb19252196", release_date="2023-09-04", # first commit n_parameters=None, + n_embedding_parameters=16_226_304, memory_usage_mb=None, # can't see on model card embed_dim=768, license="mit", @@ -37,6 +38,7 @@ revision="05948c1d889355936bdf9db7d30df57dd78d25a3", release_date="2024-04-22", # first commit n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, # we don't know because they removed the model embed_dim=1024, license="not specified", diff --git a/mteb/models/model_implementations/promptriever_models.py b/mteb/models/model_implementations/promptriever_models.py index a04dfed8d7..9705a1b7fc 100644 --- a/mteb/models/model_implementations/promptriever_models.py +++ b/mteb/models/model_implementations/promptriever_models.py @@ -87,6 +87,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol: revision="01c7f73d771dfac7d292323805ebc428287df4f9-30b14e3813c0fa45facfd01a594580c3fe5ecf23", # base-peft revision release_date="2024-09-15", n_parameters=7_000_000_000, + n_embedding_parameters=None, memory_usage_mb=26703, max_tokens=4096, embed_dim=4096, @@ -123,6 +124,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol: }, release_date="2024-09-15", n_parameters=8_000_000_000, + n_embedding_parameters=None, memory_usage_mb=30518, max_tokens=8192, embed_dim=4096, @@ -152,6 +154,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol: revision="5206a32e0bd3067aef1ce90f5528ade7d866253f-8b677258615625122c2eb7329292b8c402612c21", # base-peft revision release_date="2024-09-15", n_parameters=8_000_000_000, + n_embedding_parameters=None, memory_usage_mb=30518, max_tokens=8192, embed_dim=4096, @@ -185,6 +188,7 @@ def loader_inner(**kwargs: Any) -> 
EncoderProtocol: revision="7231864981174d9bee8c7687c24c8344414eae6b-876d63e49b6115ecb6839893a56298fadee7e8f5", # base-peft revision release_date="2024-09-15", n_parameters=7_000_000_000, + n_embedding_parameters=131_072_000, memory_usage_mb=26703, training_datasets={ # "samaya-ai/msmarco-w-instructions", diff --git a/mteb/models/model_implementations/pylate_models.py b/mteb/models/model_implementations/pylate_models.py index adf52e37cc..90b26d95ff 100644 --- a/mteb/models/model_implementations/pylate_models.py +++ b/mteb/models/model_implementations/pylate_models.py @@ -352,6 +352,7 @@ def encode( public_training_data=None, release_date="2024-09-21", n_parameters=int(110 * 1e6), + n_embedding_parameters=23_440_896, memory_usage_mb=418, max_tokens=180, embed_dim=None, @@ -408,6 +409,7 @@ def encode( public_training_data=None, release_date="2024-08-16", n_parameters=int(559 * 1e6), + n_embedding_parameters=None, memory_usage_mb=1067, max_tokens=8192, embed_dim=None, @@ -464,6 +466,7 @@ def encode( public_training_data="https://huggingface.co/datasets/lightonai/ms-marco-en-bge-gemma", release_date="2025-04-30", n_parameters=int(149 * 1e6), + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=8192, embed_dim=None, diff --git a/mteb/models/model_implementations/qodo_models.py b/mteb/models/model_implementations/qodo_models.py index 525611a6d0..534af60324 100644 --- a/mteb/models/model_implementations/qodo_models.py +++ b/mteb/models/model_implementations/qodo_models.py @@ -36,6 +36,7 @@ revision="84bbef079b32e8823ec226d4e9e92902706b0eb6", release_date="2025-02-19", n_parameters=1_780_000_000, + n_embedding_parameters=232_928_256, memory_usage_mb=6776, embed_dim=1536, license="https://huggingface.co/Qodo/Qodo-Embed-1-1.5B/blob/main/LICENSE", @@ -59,6 +60,7 @@ revision="f9edd9bf7f687c0e832424058e265120f603cd81", release_date="2025-02-24", n_parameters=7_613_000_000, + n_embedding_parameters=None, memory_usage_mb=29040, embed_dim=3584, 
license="https://huggingface.co/Qodo/Qodo-Embed-1-1.5B/blob/main/LICENSE", diff --git a/mteb/models/model_implementations/qtack_models.py b/mteb/models/model_implementations/qtack_models.py index 5f8c0cdcbb..a64578b949 100644 --- a/mteb/models/model_implementations/qtack_models.py +++ b/mteb/models/model_implementations/qtack_models.py @@ -31,6 +31,7 @@ revision="7fbe6f9b4cc42615e0747299f837ad7769025492", release_date="2025-01-28", n_parameters=int(66.3 * 1e6), + n_embedding_parameters=23_440_896, memory_usage_mb=253, embed_dim=768, license="apache-2.0", diff --git a/mteb/models/model_implementations/qwen3_models.py b/mteb/models/model_implementations/qwen3_models.py index 94e1f0e712..8865919ac3 100644 --- a/mteb/models/model_implementations/qwen3_models.py +++ b/mteb/models/model_implementations/qwen3_models.py @@ -147,6 +147,7 @@ def q3e_instruct_loader( revision="b22da495047858cce924d27d76261e96be6febc0", # Commit of @tomaarsen release_date="2025-06-05", n_parameters=595776512, + n_embedding_parameters=None, memory_usage_mb=1136, embed_dim=1024, max_tokens=32768, @@ -170,6 +171,7 @@ def q3e_instruct_loader( revision="636cd9bf47d976946cdbb2b0c3ca0cb2f8eea5ff", # Commit of @tomaarsen release_date="2025-06-05", n_parameters=4021774336, + n_embedding_parameters=None, memory_usage_mb=7671, embed_dim=2560, max_tokens=32768, @@ -193,6 +195,7 @@ def q3e_instruct_loader( revision="4e423935c619ae4df87b646a3ce949610c66241c", # Commit of @tomaarsen release_date="2025-06-05", n_parameters=7567295488, + n_embedding_parameters=None, memory_usage_mb=14433, embed_dim=4096, max_tokens=32768, diff --git a/mteb/models/model_implementations/qzhou_models.py b/mteb/models/model_implementations/qzhou_models.py index 7dd808e84e..7c72300cde 100644 --- a/mteb/models/model_implementations/qzhou_models.py +++ b/mteb/models/model_implementations/qzhou_models.py @@ -64,6 +64,7 @@ def instruction_template( revision="f1e6c03ee3882e7b9fa5cec91217715272e433b8", release_date="2025-08-24", 
n_parameters=7_070_619_136, + n_embedding_parameters=None, memory_usage_mb=14436, embed_dim=3584, license="apache-2.0", @@ -98,6 +99,7 @@ def instruction_template( revision="0321ccb126413d1e49c5ce908e802b63d35f18e2", release_date="2025-09-28", n_parameters=7_575_747_328, + n_embedding_parameters=None, memory_usage_mb=29431, embed_dim=1792, license="apache-2.0", diff --git a/mteb/models/model_implementations/rasgaard_models.py b/mteb/models/model_implementations/rasgaard_models.py index 2c9cc64fd3..c1ccdb9f77 100644 --- a/mteb/models/model_implementations/rasgaard_models.py +++ b/mteb/models/model_implementations/rasgaard_models.py @@ -12,6 +12,7 @@ revision="387897cfb09992e6d45ea9cd7b28b9fcf119e23a", release_date="2025-10-08", n_parameters=22893312, + n_embedding_parameters=22893312, memory_usage_mb=87, max_tokens=np.inf, embed_dim=256, diff --git a/mteb/models/model_implementations/reasonir_model.py b/mteb/models/model_implementations/reasonir_model.py index 49bccaffe4..a79b19d8c7 100644 --- a/mteb/models/model_implementations/reasonir_model.py +++ b/mteb/models/model_implementations/reasonir_model.py @@ -50,6 +50,7 @@ def instruction_template( revision="c3d0690370ff4a8c3d3882d8dfa85c43650034fa", release_date="2025-04-29", n_parameters=7_500_000_000, + n_embedding_parameters=None, memory_usage_mb=None, embed_dim=4096, license="cc-by-nc-4.0", diff --git a/mteb/models/model_implementations/repllama_models.py b/mteb/models/model_implementations/repllama_models.py index 485b864670..6c358022f7 100644 --- a/mteb/models/model_implementations/repllama_models.py +++ b/mteb/models/model_implementations/repllama_models.py @@ -179,6 +179,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol: "mMARCO-NL", # translation not trained on }, n_parameters=7_000_000, + n_embedding_parameters=131_072_000, memory_usage_mb=27, max_tokens=4096, embed_dim=4096, @@ -208,6 +209,7 @@ def loader_inner(**kwargs: Any) -> EncoderProtocol: 
revision="01c7f73d771dfac7d292323805ebc428287df4f9-ad5c1d0938a1e02954bcafb4d811ba2f34052e71", # base-peft revision release_date="2024-09-15", n_parameters=7_000_000, + n_embedding_parameters=None, memory_usage_mb=27, max_tokens=4096, embed_dim=4096, diff --git a/mteb/models/model_implementations/rerankers_custom.py b/mteb/models/model_implementations/rerankers_custom.py index badf3d0065..72ee18d147 100644 --- a/mteb/models/model_implementations/rerankers_custom.py +++ b/mteb/models/model_implementations/rerankers_custom.py @@ -231,6 +231,7 @@ def predict( revision="0a97706f3827389da43b83348d5d18c9d53876fa", release_date="2020-05-28", n_parameters=None, + n_embedding_parameters=31_254_528, memory_usage_mb=None, max_tokens=None, embed_dim=None, @@ -256,6 +257,7 @@ def predict( revision="126747772a932960028d9f4dc93bd5d9c4869be4", release_date="2024-09-26", n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=531, max_tokens=None, embed_dim=None, @@ -319,6 +321,7 @@ def predict( revision="953dc6f6f85a1b2dbfca4c34a2796e7dde08d41e", release_date="2024-06-24", n_parameters=None, + n_embedding_parameters=256_002_048, memory_usage_mb=2166, max_tokens=None, embed_dim=None, diff --git a/mteb/models/model_implementations/rerankers_monot5_based.py b/mteb/models/model_implementations/rerankers_monot5_based.py index 7b01a772c8..fb70152c23 100644 --- a/mteb/models/model_implementations/rerankers_monot5_based.py +++ b/mteb/models/model_implementations/rerankers_monot5_based.py @@ -327,6 +327,7 @@ def get_prediction_tokens(self, *args, **kwargs): revision="77f8e3f7b1eb1afe353aa21a7c3a2fc8feca702e", release_date="2022-03-28", n_parameters=None, + n_embedding_parameters=16_449_536, memory_usage_mb=None, max_tokens=None, embed_dim=None, @@ -369,6 +370,7 @@ def get_prediction_tokens(self, *args, **kwargs): url={https://arxiv.org/abs/2206.02873}, }""", n_parameters=None, + n_embedding_parameters=24_674_304, memory_usage_mb=None, max_tokens=None, embed_dim=None, @@ -393,6 
+395,7 @@ def get_prediction_tokens(self, *args, **kwargs): revision="48cfad1d8dd587670393f27ee8ec41fde63e3d98", release_date="2022-03-28", n_parameters=None, + n_embedding_parameters=32_899_072, memory_usage_mb=None, max_tokens=None, embed_dim=None, @@ -426,6 +429,7 @@ def get_prediction_tokens(self, *args, **kwargs): revision="bc0c419a438c81f592f878ce32430a1823f5db6c", release_date="2022-03-28", n_parameters=None, + n_embedding_parameters=32_899_072, memory_usage_mb=None, max_tokens=None, embed_dim=None, @@ -482,6 +486,7 @@ def get_prediction_tokens(self, *args, **kwargs): # "qed": ["train"], ), n_parameters=None, + n_embedding_parameters=24_674_304, memory_usage_mb=944, max_tokens=None, embed_dim=None, @@ -528,6 +533,7 @@ def get_prediction_tokens(self, *args, **kwargs): # "qed": ["train"], ), n_parameters=None, + n_embedding_parameters=32_899_072, memory_usage_mb=2987, max_tokens=None, embed_dim=None, @@ -574,6 +580,7 @@ def get_prediction_tokens(self, *args, **kwargs): # "qed": ["train"], ), n_parameters=None, + n_embedding_parameters=65_798_144, memory_usage_mb=10871, max_tokens=None, embed_dim=None, @@ -620,6 +627,7 @@ def get_prediction_tokens(self, *args, **kwargs): # "qed": ["train"], ), n_parameters=None, + n_embedding_parameters=131_596_288, memory_usage_mb=42980, max_tokens=None, embed_dim=None, @@ -644,6 +652,7 @@ def get_prediction_tokens(self, *args, **kwargs): revision="01c7f73d771dfac7d292323805ebc428287df4f9", release_date="2023-07-18", n_parameters=None, + n_embedding_parameters=131_072_000, memory_usage_mb=None, max_tokens=None, embed_dim=None, @@ -686,6 +695,7 @@ def get_prediction_tokens(self, *args, **kwargs): url={https://arxiv.org/abs/2307.09288}, }""", n_parameters=None, + n_embedding_parameters=131_072_000, memory_usage_mb=None, max_tokens=None, embed_dim=None, @@ -710,6 +720,7 @@ def get_prediction_tokens(self, *args, **kwargs): revision="3ad372fc79158a2148299e3318516c786aeded6c", release_date="2023-12-11", n_parameters=None, + 
n_embedding_parameters=None, memory_usage_mb=None, max_tokens=None, embed_dim=None, @@ -746,6 +757,7 @@ def get_prediction_tokens(self, *args, **kwargs): # "jhu-clsp/FollowIR-train" ), n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=13813, max_tokens=None, embed_dim=None, @@ -896,6 +908,7 @@ def get_prediction_tokens(self, *args, **kwargs): """, training_datasets={"MSMARCO"}, n_parameters=None, + n_embedding_parameters=192_086_016, memory_usage_mb=None, max_tokens=None, embed_dim=None, @@ -919,6 +932,7 @@ def get_prediction_tokens(self, *args, **kwargs): revision="e1a4317e102a525ea9e16745ad21394a4f1bffbc", release_date="2022-11-04", n_parameters=None, + n_embedding_parameters=1_024_458_752, memory_usage_mb=None, max_tokens=None, embed_dim=None, diff --git a/mteb/models/model_implementations/richinfoai_models.py b/mteb/models/model_implementations/richinfoai_models.py index 04ea49cc24..4bf082bde4 100644 --- a/mteb/models/model_implementations/richinfoai_models.py +++ b/mteb/models/model_implementations/richinfoai_models.py @@ -15,6 +15,7 @@ revision="f8d5a707656c55705027678e311f9202c8ced12c", release_date="2025-03-25", n_parameters=int(326 * 1e6), + n_embedding_parameters=21_635_072, memory_usage_mb=1242, embed_dim=1792, license="mit", diff --git a/mteb/models/model_implementations/ru_sentence_models.py b/mteb/models/model_implementations/ru_sentence_models.py index 0ab9a3b9b2..98837f9299 100644 --- a/mteb/models/model_implementations/ru_sentence_models.py +++ b/mteb/models/model_implementations/ru_sentence_models.py @@ -244,6 +244,7 @@ revision="5441c5ea8026d4f6d7505ec004845409f1259fb1", release_date="2021-05-24", n_parameters=11_900_000, + n_embedding_parameters=9_223_968, memory_usage_mb=45, embed_dim=312, license="mit", @@ -270,6 +271,7 @@ revision="dad72b8f77c5eef6995dd3e4691b758ba56b90c3", release_date="2021-10-28", n_parameters=29_400_000, + n_embedding_parameters=26_154_336, memory_usage_mb=112, embed_dim=312, license="mit", @@ -297,6 
+299,7 @@ revision="af977d5dfa46a3635e29bf0ef383f2df2a08d47a", release_date="2020-11-20", n_parameters=427_000_000, + n_embedding_parameters=123_021_312, memory_usage_mb=1629, embed_dim=1024, license="mit", @@ -323,6 +326,7 @@ revision="05300876c2b83f46d3ddd422a7f17e45cf633bb0", release_date="2021-05-18", n_parameters=427_000_000, + n_embedding_parameters=123_021_312, memory_usage_mb=1629, embed_dim=1024, license="not specified", @@ -351,6 +355,7 @@ revision="436a489a2087d61aa670b3496a9915f84e46c861", release_date="2024-06-10", n_parameters=427_000_000, + n_embedding_parameters=38_603_520, memory_usage_mb=473, embed_dim=768, license="apache-2.0", @@ -412,6 +417,7 @@ revision="0cc6cfe48e260fb0474c753087a69369e88709ae", release_date="2024-07-05", n_parameters=359_026_688, + n_embedding_parameters=47_273_984, memory_usage_mb=1370, embed_dim=1024, license="apache-2.0", @@ -463,6 +469,7 @@ revision="bdd30b0e19757e6940c92c7aff19e8fc0a60dff4", release_date="2023-02-07", n_parameters=124_000_000, + n_embedding_parameters=38_603_520, memory_usage_mb=473, embed_dim=768, license="apache-2.0", @@ -494,6 +501,7 @@ revision="4036cab694767a299f2b9e6492909664d9414229", release_date="2020-03-04", n_parameters=1280_000_000, + n_embedding_parameters=91_812_096, memory_usage_mb=4883, embed_dim=768, license="not specified", @@ -530,6 +538,7 @@ revision="e348066b4a7279b97138038299bddc6580a9169a", release_date="2022-06-28", n_parameters=107_000_000, + n_embedding_parameters=91_812_096, memory_usage_mb=408, embed_dim=768, license="not specified", @@ -565,6 +574,7 @@ revision="78b5122d6365337dd4114281b0d08cd1edbb3bc8", release_date="2020-03-04", n_parameters=107_000_000, + n_embedding_parameters=91_812_096, memory_usage_mb=408, embed_dim=768, license="not specified", @@ -590,6 +600,7 @@ revision="cf0714e606d4af551e14ad69a7929cd6b0da7f7e", release_date="2021-06-10", n_parameters=129_000_000, + n_embedding_parameters=42_303_744, memory_usage_mb=492, embed_dim=768, license="not specified", @@ 
-618,6 +629,7 @@ revision="8ce0cf757446ce9bb2d5f5a4ac8103c7a1049054", release_date="2024-06-21", n_parameters=29_200_000, + n_embedding_parameters=26_154_336, memory_usage_mb=111, embed_dim=312, license="mit", @@ -641,6 +653,7 @@ revision="19b279b78afd945b5ccae78f63e284909814adc2", release_date="2025-03-02", n_parameters=32_300_000, + n_embedding_parameters=26_154_336, memory_usage_mb=123, embed_dim=312, license="mit", @@ -669,6 +682,7 @@ revision="1940b046c6b5e125df11722b899130329d0a46da", release_date="2024-06-27", n_parameters=129_000_000, + n_embedding_parameters=42_303_744, memory_usage_mb=490, embed_dim=768, license="mit", @@ -720,6 +734,7 @@ use_instructions=True, reference="https://huggingface.co/ai-forever/ru-en-RoSBERTa", n_parameters=404_000_000, + n_embedding_parameters=100_869_120, memory_usage_mb=1540, max_tokens=512, embed_dim=1024, @@ -886,6 +901,7 @@ use_instructions=True, reference="https://huggingface.co/ai-forever/FRIDA", n_parameters=823_000_000, + n_embedding_parameters=143_847_936, memory_usage_mb=3141, max_tokens=512, embed_dim=1536, @@ -918,6 +934,7 @@ revision="0ad5b29bfecd806cecc9d66b927d828a736594dc", release_date="2025-09-23", n_parameters=3_227_176_961, + n_embedding_parameters=None, memory_usage_mb=12865, embed_dim=2048, license="mit", @@ -950,6 +967,7 @@ revision="914c8c8aed14042ed890fc2c662d5e9e66b2faa7", release_date="2025-03-10", n_parameters=128_000_000, + n_embedding_parameters=42_303_744, memory_usage_mb=489, embed_dim=768, license="mit", @@ -1025,6 +1043,7 @@ use_instructions=True, reference="https://huggingface.co/collections/deepvk/user2-6802650d7210f222ec60e05f", n_parameters=34_400_000, + n_embedding_parameters=None, memory_usage_mb=131, max_tokens=8192, embed_dim=384, @@ -1058,6 +1077,7 @@ use_instructions=True, reference="https://huggingface.co/collections/deepvk/user2-6802650d7210f222ec60e05f", n_parameters=149_000_000, + n_embedding_parameters=None, memory_usage_mb=568, max_tokens=8192, embed_dim=768, diff --git 
a/mteb/models/model_implementations/ruri_models.py b/mteb/models/model_implementations/ruri_models.py index 165dff9e48..092987ad88 100644 --- a/mteb/models/model_implementations/ruri_models.py +++ b/mteb/models/model_implementations/ruri_models.py @@ -38,6 +38,7 @@ revision="24899e5de370b56d179604a007c0d727bf144504", release_date="2025-04-07", n_parameters=36_705_536, + n_embedding_parameters=None, memory_usage_mb=140, embed_dim=256, license="apache-2.0", @@ -69,6 +70,7 @@ revision="07a8b0aba47d29d2ca21f89b915c1efe2c23d1cc", release_date="2025-04-09", n_parameters=36_705_536, + n_embedding_parameters=None, memory_usage_mb=140, embed_dim=256, license="apache-2.0", @@ -98,6 +100,7 @@ revision="e3114c6ee10dbab8b4b235fbc6dcf9dd4d5ac1a6", release_date="2025-04-09", n_parameters=132_140_544, + n_embedding_parameters=None, memory_usage_mb=504, embed_dim=512, license="apache-2.0", @@ -127,6 +130,7 @@ revision="18b60fb8c2b9df296fb4212bb7d23ef94e579cd3", release_date="2025-04-09", n_parameters=314_611_968, + n_embedding_parameters=None, memory_usage_mb=1200, embed_dim=768, license="apache-2.0", @@ -157,6 +161,7 @@ revision="db18646e673b713cd0518a5bb0fefdce21e77cd9", release_date="2024-12-05", n_parameters=68_087_808, + n_embedding_parameters=25_165_824, memory_usage_mb=260, embed_dim=768, license="apache-2.0", @@ -186,6 +191,7 @@ revision="8ce03882903668a01c83ca3b8111ac025a3bc734", release_date="2024-12-05", n_parameters=111_207_168, + n_embedding_parameters=25_165_824, memory_usage_mb=424, embed_dim=768, license="apache-2.0", @@ -215,6 +221,7 @@ revision="42898ef34a5574977380ebf0dfd28cbfbd36438b", release_date="2024-12-06", n_parameters=337_441_792, + n_embedding_parameters=33_554_432, memory_usage_mb=1287, embed_dim=1024, license="apache-2.0", @@ -245,6 +252,7 @@ revision="bc56ce90cd7a979f6eb199fc52dfe700bfd94bc3", release_date="2024-08-28", n_parameters=68_087_808, + n_embedding_parameters=25_165_824, memory_usage_mb=130, embed_dim=768, license="apache-2.0", @@ -274,6 
+282,7 @@ revision="1ae40b8b6c78518a499425086bab8fc16c2e4b0e", release_date="2024-08-28", n_parameters=111_207_168, + n_embedding_parameters=25_165_824, memory_usage_mb=212, embed_dim=768, license="apache-2.0", @@ -304,6 +313,7 @@ revision="a011c39b13e8bc137ee13c6bc82191ece46c414c", release_date="2024-08-28", n_parameters=337_441_792, + n_embedding_parameters=33_554_432, memory_usage_mb=644, embed_dim=1024, license="apache-2.0", diff --git a/mteb/models/model_implementations/salesforce_models.py b/mteb/models/model_implementations/salesforce_models.py index b33d2b62e2..3d5d1e5bbb 100644 --- a/mteb/models/model_implementations/salesforce_models.py +++ b/mteb/models/model_implementations/salesforce_models.py @@ -58,6 +58,7 @@ def instruction_template( revision="91762139d94ed4371a9fa31db5551272e0b83818", release_date="2024-06-14", # initial commit of hf model. n_parameters=7_110_000_000, + n_embedding_parameters=None, memory_usage_mb=13563, embed_dim=4096, license="cc-by-nc-4.0", @@ -96,6 +97,7 @@ def instruction_template( revision="c73d8631a005876ed5abde34db514b1fb6566973", release_date="2025-01-17", # initial commit of hf model. n_parameters=2_610_000_000, + n_embedding_parameters=None, memory_usage_mb=4986, embed_dim=2304, license="cc-by-nc-4.0", @@ -134,6 +136,7 @@ def instruction_template( revision="938c560d1c236aa563b2dbdf084f28ab28bccb11", release_date="2024-01-24", # initial commit of hf model. 
n_parameters=7_110_000_000, + n_embedding_parameters=None, memory_usage_mb=13563, embed_dim=4096, license="cc-by-nc-4.0", diff --git a/mteb/models/model_implementations/samilpwc_models.py b/mteb/models/model_implementations/samilpwc_models.py index 2c0a650b68..e83724ec80 100644 --- a/mteb/models/model_implementations/samilpwc_models.py +++ b/mteb/models/model_implementations/samilpwc_models.py @@ -51,6 +51,7 @@ def instruct_loader(*args, **kwargs): revision="33358978be40f36491045f9c2a359d38c3f50047", release_date="2025-08-12", n_parameters=560_000_000, + n_embedding_parameters=256_002_048, memory_usage_mb=2136, embed_dim=1024, license="apache-2.0", diff --git a/mteb/models/model_implementations/sarashina_embedding_models.py b/mteb/models/model_implementations/sarashina_embedding_models.py index 89c18d4ac1..732b0987ae 100644 --- a/mteb/models/model_implementations/sarashina_embedding_models.py +++ b/mteb/models/model_implementations/sarashina_embedding_models.py @@ -124,6 +124,7 @@ def sarashina_instruction_template( revision="1f3408afaa7b617e3445d891310a9c26dd0c68a5", release_date="2025-07-30", n_parameters=1_224_038_144, + n_embedding_parameters=183_500_800, memory_usage_mb=4669, embed_dim=1792, license="https://huggingface.co/sbintuitions/sarashina-embedding-v2-1b/blob/main/LICENSE", @@ -150,6 +151,7 @@ def sarashina_instruction_template( revision="d060fcd8984075071e7fad81baff035cbb3b6c7e", release_date="2024-11-22", n_parameters=1_224_038_144, + n_embedding_parameters=183_500_800, memory_usage_mb=4669, embed_dim=1792, license="https://huggingface.co/sbintuitions/sarashina-embedding-v1-1b/blob/main/LICENSE", diff --git a/mteb/models/model_implementations/searchmap_models.py b/mteb/models/model_implementations/searchmap_models.py index 5cf27e1881..6ab604cfd2 100644 --- a/mteb/models/model_implementations/searchmap_models.py +++ b/mteb/models/model_implementations/searchmap_models.py @@ -27,6 +27,7 @@ use_instructions=True, release_date="2025-03-05", 
n_parameters=435_000_000, + n_embedding_parameters=None, memory_usage_mb=1660, embed_dim=4096, license="mit", diff --git a/mteb/models/model_implementations/seed_1_6_embedding_models.py b/mteb/models/model_implementations/seed_1_6_embedding_models.py index 238e435529..39f50816a0 100644 --- a/mteb/models/model_implementations/seed_1_6_embedding_models.py +++ b/mteb/models/model_implementations/seed_1_6_embedding_models.py @@ -431,6 +431,7 @@ def encode( embed_dim=2048, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://seed1-6-embedding.github.io/", diff --git a/mteb/models/model_implementations/seed_1_6_embedding_models_1215.py b/mteb/models/model_implementations/seed_1_6_embedding_models_1215.py index 40a403b527..b45602d009 100644 --- a/mteb/models/model_implementations/seed_1_6_embedding_models_1215.py +++ b/mteb/models/model_implementations/seed_1_6_embedding_models_1215.py @@ -616,6 +616,7 @@ def encode( embed_dim=2048, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://console.volcengine.com/ark/region:ark+cn-beijing/model/detail?Id=doubao-embedding-vision", diff --git a/mteb/models/model_implementations/seed_models.py b/mteb/models/model_implementations/seed_models.py index f120a9c6f4..382ed19866 100644 --- a/mteb/models/model_implementations/seed_models.py +++ b/mteb/models/model_implementations/seed_models.py @@ -253,6 +253,7 @@ def encode( embed_dim=2048, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://seed1-5-embedding.github.io/", diff --git a/mteb/models/model_implementations/sentence_transformers_models.py b/mteb/models/model_implementations/sentence_transformers_models.py index 8c51b09731..aa25cbbabf 100644 --- a/mteb/models/model_implementations/sentence_transformers_models.py +++ 
b/mteb/models/model_implementations/sentence_transformers_models.py @@ -121,6 +121,7 @@ revision="8b3219a92973c328a8e22fadcfa821b5dc75636a", release_date="2021-08-30", n_parameters=22_700_000, + n_embedding_parameters=11_720_448, memory_usage_mb=87, embed_dim=384, license="apache-2.0", @@ -152,6 +153,7 @@ revision="364dd28d28dcd3359b537f3cf1f5348ba679da62", release_date="2021-08-30", n_parameters=33_400_000, + n_embedding_parameters=11_720_448, memory_usage_mb=127, embed_dim=384, license="apache-2.0", @@ -183,6 +185,7 @@ revision="bf3bf13ab40c3157080a7ab344c831b9ad18b5eb", release_date="2019-11-01", # release date of paper n_parameters=118_000_000, + n_embedding_parameters=96_014_208, memory_usage_mb=449, embed_dim=768, license="apache-2.0", @@ -214,6 +217,7 @@ revision="79f2382ceacceacdf38563d7c5d16b9ff8d725d6", release_date="2019-11-01", # release date of paper n_parameters=278_000_000, + n_embedding_parameters=192_001_536, memory_usage_mb=1061, embed_dim=768, license="apache-2.0", @@ -256,6 +260,7 @@ revision="e34fab64a3011d2176c99545a93d5cbddc9a91b7", release_date="2019-11-01", # release date of paper n_parameters=471_000_000, + n_embedding_parameters=384_885_504, memory_usage_mb=1796, embed_dim=768, license="apache-2.0", @@ -294,6 +299,7 @@ revision="b207367332321f8e44f96e224ef15bc607f4dbf0", release_date="2021-08-30", n_parameters=22_700_000, + n_embedding_parameters=11_720_448, memory_usage_mb=87, embed_dim=384, license="apache-2.0", @@ -325,6 +331,7 @@ revision="9a3225965996d404b775526de6dbfe85d3368642", release_date="2021-08-30", n_parameters=109_000_000, + n_embedding_parameters=23_444_736, memory_usage_mb=418, embed_dim=768, license="apache-2.0", @@ -435,6 +442,7 @@ revision="7264ea07c5365a11d7e6d87dbb6195889a13054f", release_date="2025-01-15", n_parameters=108_420_096, + n_embedding_parameters=None, memory_usage_mb=413, embed_dim=1024, license="apache-2.0", @@ -468,6 +476,7 @@ revision="abe8c1493371369031bcb1e02acb754cf4e162fa", 
release_date="2022-06-25", # release date of model on HF n_parameters=150_000_000, + n_embedding_parameters=23_440_896, memory_usage_mb=572, embed_dim=768, license=None, @@ -498,6 +507,7 @@ revision="98f70f14cdf12d7ea217ed2fd4e808b0195f1e7e", release_date="2024-11-10", n_parameters=272_000_000, + n_embedding_parameters=32_769_024, memory_usage_mb=1037, embed_dim=1024, license="apache-2.0", @@ -544,6 +554,7 @@ revision="50c53e206f8b01c9621484a3c0aafce4e55efebf", release_date="2022-02-09", n_parameters=110_000_000, + n_embedding_parameters=24_674_304, memory_usage_mb=209, embed_dim=768, license="apache-2.0", @@ -567,6 +578,7 @@ revision="1fc08ea477205aa54a3e5b13f0971ae16b86410a", release_date="2022-02-09", n_parameters=335_000_000, + n_embedding_parameters=32_899_072, memory_usage_mb=639, embed_dim=768, license="apache-2.0", @@ -590,6 +602,7 @@ revision="2965d31b368fb14117688e0bde77cbd720e91f53", release_date="2024-03-27", n_parameters=3_000_000_000, + n_embedding_parameters=32_899_072, memory_usage_mb=2367, embed_dim=768, license="apache-2.0", @@ -613,6 +626,7 @@ revision="4d122282ba80e807e9e6eb8c358269e92796365d", release_date="2024-03-27", n_parameters=11_000_000_000, + n_embedding_parameters=None, memory_usage_mb=9279, embed_dim=768, license="apache-2.0", @@ -646,6 +660,7 @@ revision="a2c8ac47f998531948d4cbe32a0b577a7037a5e3", release_date="2022-02-09", n_parameters=335_000_000, + n_embedding_parameters=32_899_072, memory_usage_mb=639, embed_dim=768, license="apache-2.0", @@ -681,6 +696,7 @@ revision="23a8d667a1ad2578af181ce762867003c498d1bf", release_date="2022-02-09", n_parameters=1_240_000_000, + n_embedding_parameters=32_899_072, memory_usage_mb=2367, embed_dim=768, license="apache-2.0", @@ -715,6 +731,7 @@ revision="73f2a9156a3dcc2194dfdb2bf201cd7d17e17884", release_date="2022-02-09", n_parameters=4_860_000_000, + n_embedding_parameters=None, memory_usage_mb=9279, embed_dim=768, license="apache-2.0", @@ -750,6 +767,7 @@ 
revision="7027e9594267928589816394bdd295273ddc0739", release_date="2022-02-09", n_parameters=110_000_000, + n_embedding_parameters=24_674_304, memory_usage_mb=209, embed_dim=768, license="apache-2.0", diff --git a/mteb/models/model_implementations/shuu_model.py b/mteb/models/model_implementations/shuu_model.py index 79921a5666..9c5d492ed7 100644 --- a/mteb/models/model_implementations/shuu_model.py +++ b/mteb/models/model_implementations/shuu_model.py @@ -10,6 +10,7 @@ revision="044a7a4b552f86e284817234c336bccf16f895ce", release_date="2025-04-21", n_parameters=151668480, + n_embedding_parameters=None, memory_usage_mb=607, embed_dim=768, license="apache-2.0", diff --git a/mteb/models/model_implementations/siglip_models.py b/mteb/models/model_implementations/siglip_models.py index f28fc8662f..155f90f556 100644 --- a/mteb/models/model_implementations/siglip_models.py +++ b/mteb/models/model_implementations/siglip_models.py @@ -136,6 +136,7 @@ def encode( release_date="2024-01-08", modalities=["image", "text"], n_parameters=877_000_000, + n_embedding_parameters=None, memory_usage_mb=3347, max_tokens=16, embed_dim=1152, @@ -160,6 +161,7 @@ def encode( release_date="2024-01-08", modalities=["image", "text"], n_parameters=878_000_000, + n_embedding_parameters=None, memory_usage_mb=3349, max_tokens=64, embed_dim=1152, @@ -184,6 +186,7 @@ def encode( release_date="2024-01-08", modalities=["image", "text"], n_parameters=1_130_000_000, + n_embedding_parameters=None, memory_usage_mb=4306, max_tokens=64, embed_dim=1152, @@ -208,6 +211,7 @@ def encode( release_date="2024-01-08", modalities=["image", "text"], n_parameters=371_000_000, + n_embedding_parameters=None, memory_usage_mb=1414, max_tokens=64, embed_dim=768, @@ -232,6 +236,7 @@ def encode( release_date="2024-01-08", modalities=["image", "text"], n_parameters=203_000_000, + n_embedding_parameters=None, memory_usage_mb=775, max_tokens=64, embed_dim=768, @@ -256,6 +261,7 @@ def encode( release_date="2024-01-08", 
modalities=["image", "text"], n_parameters=204_000_000, + n_embedding_parameters=None, memory_usage_mb=777, max_tokens=64, embed_dim=768, @@ -280,6 +286,7 @@ def encode( release_date="2024-01-08", modalities=["image", "text"], n_parameters=203_000_000, + n_embedding_parameters=None, memory_usage_mb=776, max_tokens=64, embed_dim=768, @@ -304,6 +311,7 @@ def encode( release_date="2024-01-08", modalities=["image", "text"], n_parameters=203_000_000, + n_embedding_parameters=None, memory_usage_mb=775, max_tokens=64, embed_dim=768, @@ -328,6 +336,7 @@ def encode( release_date="2024-01-08", modalities=["image", "text"], n_parameters=652_000_000, + n_embedding_parameters=None, memory_usage_mb=2488, max_tokens=64, embed_dim=1024, @@ -352,6 +361,7 @@ def encode( release_date="2024-01-08", modalities=["image", "text"], n_parameters=652_000_000, + n_embedding_parameters=None, memory_usage_mb=2489, max_tokens=64, embed_dim=1024, diff --git a/mteb/models/model_implementations/sonar_models.py b/mteb/models/model_implementations/sonar_models.py index 09478ea7c3..ad344969df 100644 --- a/mteb/models/model_implementations/sonar_models.py +++ b/mteb/models/model_implementations/sonar_models.py @@ -224,7 +224,8 @@ use_instructions=False, # it does take a language code as input revision="a551c586dcf4a49c8fd847de369412d556a7f2f2", release_date="2021-05-21", - n_parameters=None, # it is really multiple models so not sure how to calculate this + n_parameters=None, + n_embedding_parameters=None, # it is really multiple models so not sure how to calculate this max_tokens=512, # https://github.com/facebookresearch/SONAR/blob/549d287466443bd8720f938047882630c1c5c3f7/sonar/models/sonar_text/builder.py#L139 embed_dim=1024, license="mit", diff --git a/mteb/models/model_implementations/spartan8806_atles_champion.py b/mteb/models/model_implementations/spartan8806_atles_champion.py index c23b0ebdbf..cae1efaafd 100644 --- a/mteb/models/model_implementations/spartan8806_atles_champion.py +++ 
b/mteb/models/model_implementations/spartan8806_atles_champion.py @@ -12,6 +12,7 @@ revision="d4c74d7000bbd25f3597fc0f2dcde59ef1386e8f", release_date="2025-11-15", n_parameters=110_000_000, + n_embedding_parameters=23_444_736, memory_usage_mb=420, max_tokens=512, embed_dim=768, diff --git a/mteb/models/model_implementations/stella_models.py b/mteb/models/model_implementations/stella_models.py index 198a3d87f0..d4e8f07918 100644 --- a/mteb/models/model_implementations/stella_models.py +++ b/mteb/models/model_implementations/stella_models.py @@ -66,6 +66,7 @@ revision="1bb50bc7bb726810eac2140e62155b88b0df198f", release_date="2024-07-12", n_parameters=435_000_000, + n_embedding_parameters=None, memory_usage_mb=1660, max_tokens=8192, embed_dim=4096, @@ -101,6 +102,7 @@ revision="d03be74b361d4eb24f42a2fe5bd2e29917df4604", release_date="2024-07-12", n_parameters=1_540_000_000, + n_embedding_parameters=232_928_256, memory_usage_mb=5887, max_tokens=131072, embed_dim=8960, @@ -130,6 +132,7 @@ revision="d5d39eb8cd11c80a63df53314e59997074469f09", release_date="2024-02-17", n_parameters=None, + n_embedding_parameters=21_635_072, memory_usage_mb=None, # can't see on model card embed_dim=1792, license="not specified", @@ -157,6 +160,7 @@ revision="82254892a0fba125aa2abf3a4800d2dd12821343", release_date="2024-02-17", n_parameters=None, + n_embedding_parameters=16_226_304, memory_usage_mb=None, # can't see on model card embed_dim=1792, license="mit", @@ -185,6 +189,7 @@ revision="17bb1c32a93a8fc5f6fc9e91d5ea86da99983cfe", release_date="2024-02-27", n_parameters=int(326 * 1e6), + n_embedding_parameters=21_635_072, memory_usage_mb=1242, embed_dim=1792, license="mit", @@ -209,6 +214,7 @@ revision="b1075144f440ab4409c05622c1179130ebd57d03", release_date="2024-06-04", n_parameters=int(326 * 1e6), + n_embedding_parameters=21_635_072, memory_usage_mb=1242, embed_dim=1792, license="mit", diff --git a/mteb/models/model_implementations/tarka_models.py 
b/mteb/models/model_implementations/tarka_models.py index a09fc38aac..339f64f050 100644 --- a/mteb/models/model_implementations/tarka_models.py +++ b/mteb/models/model_implementations/tarka_models.py @@ -327,6 +327,7 @@ revision="b0ffecc4ef0d873e517507ed080e43b88b2704b9", release_date="2025-11-04", n_parameters=155_714_304, + n_embedding_parameters=None, embed_dim=768, max_tokens=2048, license="gemma", @@ -361,6 +362,7 @@ revision="a850d6a329145474727424fed6b12b62096b8ba3", release_date="2025-11-11", n_parameters=354_483_968, + n_embedding_parameters=None, memory_usage_mb=676, embed_dim=1024, max_tokens=128000, diff --git a/mteb/models/model_implementations/text2vec_models.py b/mteb/models/model_implementations/text2vec_models.py index a22b74c3c1..0ed9a20b17 100644 --- a/mteb/models/model_implementations/text2vec_models.py +++ b/mteb/models/model_implementations/text2vec_models.py @@ -22,6 +22,7 @@ revision="183bb99aa7af74355fb58d16edf8c13ae7c5433e", release_date="2022-01-23", n_parameters=int(102 * 1e6), + n_embedding_parameters=16_226_304, embed_dim=768, license="apache-2.0", max_tokens=512, @@ -51,6 +52,7 @@ revision="e90c150a9c7fb55a67712a766d6820c55fb83cdd", release_date="2023-06-19", n_parameters=118 * 1e6, + n_embedding_parameters=30_720_000, memory_usage_mb=450, embed_dim=768, license="apache-2.0", @@ -95,6 +97,7 @@ # So probably best not to. 
loader=sentence_transformers_loader, n_parameters=117654272, + n_embedding_parameters=96_014_208, memory_usage_mb=449, embed_dim=384, license="apache-2.0", diff --git a/mteb/models/model_implementations/ua_sentence_models.py b/mteb/models/model_implementations/ua_sentence_models.py index d9765d32f7..7d1188ab83 100644 --- a/mteb/models/model_implementations/ua_sentence_models.py +++ b/mteb/models/model_implementations/ua_sentence_models.py @@ -8,6 +8,7 @@ model_type=["dense"], loader=sentence_transformers_loader, n_parameters=278_000_000, + n_embedding_parameters=192_001_536, memory_usage_mb=1061, max_tokens=512, embed_dim=768, diff --git a/mteb/models/model_implementations/uae_models.py b/mteb/models/model_implementations/uae_models.py index b7f4c862cb..d2e7fcb23a 100644 --- a/mteb/models/model_implementations/uae_models.py +++ b/mteb/models/model_implementations/uae_models.py @@ -72,6 +72,7 @@ def encode( revision="369c368f70f16a613f19f5598d4f12d9f44235d4", release_date="2023-12-04", # initial commit of hf model. 
n_parameters=int(335 * 1e6), + n_embedding_parameters=31_254_528, memory_usage_mb=1278, max_tokens=512, embed_dim=1024, diff --git a/mteb/models/model_implementations/vdr_models.py b/mteb/models/model_implementations/vdr_models.py index b9d542e542..a8ab03bbdd 100644 --- a/mteb/models/model_implementations/vdr_models.py +++ b/mteb/models/model_implementations/vdr_models.py @@ -38,6 +38,7 @@ def instruction_template( release_date="2024-01-08", modalities=["text"], # TODO: integrate with image n_parameters=2_000_000_000, + n_embedding_parameters=233_373_696, memory_usage_mb=4213, max_tokens=32768, embed_dim=1536, diff --git a/mteb/models/model_implementations/vi_vn_models.py b/mteb/models/model_implementations/vi_vn_models.py index e698704390..291d354054 100644 --- a/mteb/models/model_implementations/vi_vn_models.py +++ b/mteb/models/model_implementations/vi_vn_models.py @@ -16,6 +16,7 @@ loader=sentence_transformers_loader, open_weights=True, n_parameters=568_000_000, + n_embedding_parameters=256_002_048, memory_usage_mb=2167, embed_dim=1024, license="cc-by-4.0", @@ -41,6 +42,7 @@ loader=sentence_transformers_loader, open_weights=True, n_parameters=568_000_000, + n_embedding_parameters=256_002_048, memory_usage_mb=2167, embed_dim=1024, license="cc-by-4.0", @@ -66,6 +68,7 @@ loader=sentence_transformers_loader, open_weights=True, n_parameters=568_000_000, + n_embedding_parameters=256_002_048, memory_usage_mb=2166, embed_dim=1024, license="cc-by-4.0", @@ -98,6 +101,7 @@ use_instructions=False, open_weights=True, n_parameters=278_000_000, + n_embedding_parameters=192_001_536, memory_usage_mb=1061, embed_dim=768, license="apache-2.0", @@ -129,6 +133,7 @@ use_instructions=False, open_weights=True, n_parameters=135_000_000, + n_embedding_parameters=49_152_768, memory_usage_mb=517, max_tokens=256, embed_dim=768, @@ -167,6 +172,7 @@ use_instructions=False, open_weights=True, n_parameters=135_000_000, + n_embedding_parameters=49_152_768, memory_usage_mb=515, max_tokens=256, 
embed_dim=768, diff --git a/mteb/models/model_implementations/vista_models.py b/mteb/models/model_implementations/vista_models.py index 0ee7bdc250..9a4128489b 100644 --- a/mteb/models/model_implementations/vista_models.py +++ b/mteb/models/model_implementations/vista_models.py @@ -258,6 +258,7 @@ def encode( release_date="2024-06-06", modalities=["image", "text"], n_parameters=196_000_000, + n_embedding_parameters=None, memory_usage_mb=1631, max_tokens=512, embed_dim=768, @@ -286,6 +287,7 @@ def encode( release_date="2024-06-06", modalities=["image", "text"], n_parameters=872_909_505, + n_embedding_parameters=None, memory_usage_mb=4263, max_tokens=8192, embed_dim=1024, diff --git a/mteb/models/model_implementations/vlm2vec_models.py b/mteb/models/model_implementations/vlm2vec_models.py index 07fd51d086..8ba13eee15 100644 --- a/mteb/models/model_implementations/vlm2vec_models.py +++ b/mteb/models/model_implementations/vlm2vec_models.py @@ -280,6 +280,7 @@ def encode( release_date="2024-10-08", modalities=["image", "text"], n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=131072, embed_dim=3072, @@ -304,6 +305,7 @@ def encode( release_date="2024-10-08", modalities=["image", "text"], n_parameters=4_150_000_000, + n_embedding_parameters=None, memory_usage_mb=7909, max_tokens=131072, embed_dim=3072, diff --git a/mteb/models/model_implementations/voyage_models.py b/mteb/models/model_implementations/voyage_models.py index d262d8b13c..45492f2b20 100644 --- a/mteb/models/model_implementations/voyage_models.py +++ b/mteb/models/model_implementations/voyage_models.py @@ -308,6 +308,7 @@ def _batched_encode( embed_dim=1024, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://blog.voyageai.com/2025/01/07/voyage-3-large/", @@ -336,6 +337,7 @@ def _batched_encode( embed_dim=1024, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, 
license=None, reference="https://blog.voyageai.com/2025/05/20/voyage-3-5/", @@ -363,6 +365,7 @@ def _batched_encode( embed_dim=1024, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://blog.voyageai.com/2025/05/20/voyage-3-5/", @@ -390,6 +393,7 @@ def _batched_encode( embed_dim=1024, # Same as original after unpacking from bits open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://blog.voyageai.com/2025/05/20/voyage-3-5/", @@ -417,6 +421,7 @@ def _batched_encode( embed_dim=1024, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://blog.voyageai.com/2024/05/05/voyage-large-2-instruct-instruction-tuned-and-rank-1-on-mteb/", @@ -443,6 +448,7 @@ def _batched_encode( embed_dim=1024, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://blog.voyageai.com/2024/06/03/domain-specific-embeddings-finance-edition-voyage-finance-2/", @@ -469,6 +475,7 @@ def _batched_encode( embed_dim=1024, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://blog.voyageai.com/2024/04/15/domain-specific-embeddings-and-retrieval-legal-edition-voyage-law-2/", @@ -495,6 +502,7 @@ def _batched_encode( embed_dim=1536, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://blog.voyageai.com/2024/01/23/voyage-code-2-elevate-your-code-retrieval/", @@ -521,6 +529,7 @@ def _batched_encode( embed_dim=1024, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://blog.voyageai.com/2024/12/04/voyage-code-3/", @@ -548,6 +557,7 @@ def _batched_encode( embed_dim=1536, open_weights=False, n_parameters=None, + 
n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://blog.voyageai.com/2023/10/29/voyage-embeddings/", @@ -574,6 +584,7 @@ def _batched_encode( embed_dim=1024, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://blog.voyageai.com/2023/10/29/voyage-embeddings/", @@ -599,6 +610,7 @@ def _batched_encode( embed_dim=1024, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://blog.voyageai.com/2024/06/10/voyage-multilingual-2-multilingual-embedding-model/", @@ -625,6 +637,7 @@ def _batched_encode( embed_dim=1024, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://blog.voyageai.com/2024/09/18/voyage-3/", @@ -651,6 +664,7 @@ def _batched_encode( embed_dim=512, open_weights=False, n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://blog.voyageai.com/2024/09/18/voyage-3/", @@ -679,6 +693,7 @@ def _batched_encode( open_weights=False, # from their card https://huggingface.co/voyageai/voyage-3-m-exp#model-information n_parameters=int(6918 * 1e6), + n_embedding_parameters=None, memory_usage_mb=None, license=None, reference="https://huggingface.co/voyageai/voyage-3-m-exp", diff --git a/mteb/models/model_implementations/voyage_v.py b/mteb/models/model_implementations/voyage_v.py index 814cc6c671..3caeef48ac 100644 --- a/mteb/models/model_implementations/voyage_v.py +++ b/mteb/models/model_implementations/voyage_v.py @@ -215,6 +215,7 @@ def encode( revision="1", release_date="2024-11-10", n_parameters=None, + n_embedding_parameters=None, memory_usage_mb=None, max_tokens=32768, embed_dim=1024, diff --git a/mteb/models/model_implementations/xyz_models.py b/mteb/models/model_implementations/xyz_models.py index 4d9c7a7823..0bcc052dcb 100644 --- 
a/mteb/models/model_implementations/xyz_models.py +++ b/mteb/models/model_implementations/xyz_models.py @@ -31,6 +31,7 @@ revision="4004120220b99baea764a1d3508427248ac3bccf", release_date="2024-09-13", n_parameters=326000000, + n_embedding_parameters=21_635_072, memory_usage_mb=1242, max_tokens=512, embed_dim=768, diff --git a/mteb/models/model_implementations/youtu_models.py b/mteb/models/model_implementations/youtu_models.py index f8b9d3c011..42c374fa1a 100644 --- a/mteb/models/model_implementations/youtu_models.py +++ b/mteb/models/model_implementations/youtu_models.py @@ -121,6 +121,7 @@ def instruction_template( release_date="2025-09-28", open_weights=True, n_parameters=2672957440, + n_embedding_parameters=None, memory_usage_mb=None, embed_dim=2048, license="apache-2.0", diff --git a/mteb/models/model_implementations/yuan_models.py b/mteb/models/model_implementations/yuan_models.py index 4578dccd17..13c0ca6703 100644 --- a/mteb/models/model_implementations/yuan_models.py +++ b/mteb/models/model_implementations/yuan_models.py @@ -20,6 +20,7 @@ revision="b5ebcace6f4fc6e5a4d1852557eb2dc2d1040cee", release_date="2025-11-24", n_parameters=326000000, + n_embedding_parameters=21_635_072, memory_usage_mb=1242, embed_dim=1792, license="apache-2.0", diff --git a/mteb/models/model_implementations/yuan_models_en.py b/mteb/models/model_implementations/yuan_models_en.py index 40512455df..38ed7c14cb 100644 --- a/mteb/models/model_implementations/yuan_models_en.py +++ b/mteb/models/model_implementations/yuan_models_en.py @@ -43,6 +43,7 @@ def instruction_template( revision="b2fd15da3bcae3473c8529593825c15068f09fce", release_date="2025-11-27", n_parameters=595776512, + n_embedding_parameters=None, memory_usage_mb=2272, embed_dim=1024, max_tokens=2048, diff --git a/mteb/models/model_meta.py b/mteb/models/model_meta.py index 750e7e36b0..e5b4c8c14e 100644 --- a/mteb/models/model_meta.py +++ b/mteb/models/model_meta.py @@ -10,6 +10,7 @@ from pathlib import Path from typing import 
TYPE_CHECKING, Any, Literal, cast +import numpy as np from huggingface_hub import ( ModelCard, get_safetensors_metadata, @@ -27,6 +28,8 @@ SafetensorsParsingError, ) from pydantic import BaseModel, ConfigDict, field_validator, model_validator +from sentence_transformers.models import Transformer +from torch import nn from transformers import AutoConfig from mteb._helpful_enum import HelpfulStrEnum @@ -99,8 +102,9 @@ class ModelMeta(BaseModel): loader: The function that loads the model. If None it assumes that the model is not implemented. loader_kwargs: The keyword arguments to pass to the loader function. name: The name of the model, ideally the name on huggingface. It should be in the format "organization/model_name". - n_parameters: The number of parameters in the model, e.g. 7_000_000 for a 7M parameter model. Can be None if the number of parameters is not known (e.g. for proprietary models) or - if the loader returns a SentenceTransformer model from which it can be derived. + n_parameters: The total number of parameters in the model, e.g. `7_000_000` for a 7M parameter model. Can be None if the number of parameters is unknown. + n_embedding_parameters: The number of parameters used for the embedding layer. Can be None if the number of embedding parameters is not known (e.g. for proprietary models). + n_active_parameters_override: The number of active parameters used by the model. Should be used **only** for Mixture of Experts models. memory_usage_mb: The memory usage of the model in MB. Can be None if the memory usage is not known (e.g. for proprietary models). To calculate it use the `calculate_memory_usage_mb` method. max_tokens: The maximum number of tokens the model can handle. Can be None if the maximum number of tokens is not known (e.g. for proprietary models). 
@@ -139,6 +143,8 @@ class ModelMeta(BaseModel): release_date: StrDate | None languages: list[ISOLanguageScript] | None n_parameters: int | None + n_active_parameters_override: int | None = None + n_embedding_parameters: int | None = None memory_usage_mb: float | None max_tokens: float | None embed_dim: int | None @@ -197,6 +203,16 @@ def is_cross_encoder(self) -> bool: """ return "cross-encoder" in self.model_type + @property + def n_active_parameters(self): + """Number of active parameters. Assumed to be `n_parameters - n_embedding_parameters`. Can be overwritten using `n_active_parameters_override` e.g. for MoE models.""" + if self.n_active_parameters_override is not None: + return self.n_active_parameters_override + + if self.n_parameters is not None and self.n_embedding_parameters is not None: + return self.n_parameters - self.n_embedding_parameters + return None + @field_validator("similarity_fn_name", mode="before") @classmethod def _validate_similarity_fn_name(cls, value: str) -> ScoringFunction | None: @@ -389,6 +405,14 @@ def from_sentence_transformer_model( else model.model_card_data.base_model ) meta = cls._from_hub(name, revision, compute_metadata) + try: + first = model[0] + + if isinstance(first, Transformer): + emb = first.auto_model.get_input_embeddings() + meta.n_embedding_parameters = int(np.prod(emb.weight.shape)) + except Exception as e: + logger.warning(f"Could not calculate embedding parameters for {name}: {e}") meta.revision = model.model_card_data.base_model_revision or meta.revision meta.max_tokens = model.max_seq_length meta.embed_dim = model.get_sentence_embedding_dimension() @@ -460,6 +484,15 @@ def from_cross_encoder( from mteb.models import CrossEncoderWrapper meta = cls._from_hub(model.model.name_or_path, revision, compute_metadata) + try: + emb = model.model.get_input_embeddings() + + if isinstance(emb, nn.Embedding): + meta.n_embedding_parameters = int(np.prod(emb.weight.shape)) + except Exception as e: + logger.warning( + f"Could 
not calculate embedding parameters for {model.model.name_or_path}: {e}" + ) meta.revision = model.config._commit_hash or meta.revision meta.loader = CrossEncoderWrapper meta.embed_dim = None diff --git a/tests/test_models/test_model_meta.py b/tests/test_models/test_model_meta.py index 6b44767d69..1d47e40867 100644 --- a/tests/test_models/test_model_meta.py +++ b/tests/test_models/test_model_meta.py @@ -160,6 +160,8 @@ def test_model_to_python(): release_date='2021-08-30', languages=['eng-Latn'], n_parameters=22700000, + n_active_parameters_override=None, + n_embedding_parameters=11720448, memory_usage_mb=87.0, max_tokens=256.0, embed_dim=384,