From 990b18820b384ba93af98a1ded44eb2bdb6bd48e Mon Sep 17 00:00:00 2001
From: fzoll
Date: Tue, 13 Jan 2026 19:29:06 +0100
Subject: [PATCH 1/2] Adding voyage-4 model

---
Reviewer note: registers the voyage_4 ModelMeta entry ahead of
voyage_4_lite, and adds a superseded_by pointer to the entry that closes
just before voyage_3_5_int8 (that entry's name lies outside the hunk
context, so confirm it is the intended model).

 .../model_implementations/voyage_models.py    | 27 +++++++++++++++++++
 1 file changed, 27 insertions(+)

diff --git a/mteb/models/model_implementations/voyage_models.py b/mteb/models/model_implementations/voyage_models.py
index c35baa35d3..55a0eb5aa4 100644
--- a/mteb/models/model_implementations/voyage_models.py
+++ b/mteb/models/model_implementations/voyage_models.py
@@ -206,6 +206,32 @@ def _batched_encode(
     PromptType.document.value: "document",
 }
 
+voyage_4 = ModelMeta(
+    name="voyageai/voyage-4",
+    model_type=["dense"],
+    revision="1",
+    release_date="2026-01-15",
+    languages=None,  # supported languages not specified
+    loader=VoyageModel,
+    loader_kwargs=dict(
+        max_tokens=32000,
+        model_prompts=model_prompts,
+    ),
+    max_tokens=32000,
+    embed_dim=1024,
+    open_weights=False,
+    n_parameters=None,
+    memory_usage_mb=None,
+    license=None,
+    reference="https://blog.voyageai.com/2026/01/15/voyage-4/",
+    similarity_fn_name="cosine",
+    framework=["API"],
+    use_instructions=True,
+    training_datasets=VOYAGE_TRAINING_DATA,
+    public_training_code=None,
+    public_training_data=None,
+)
+
 voyage_4_lite = ModelMeta(
     name="voyageai/voyage-4-lite",
     model_type=["dense"],
@@ -310,6 +336,7 @@ def _batched_encode(
     training_datasets=VOYAGE_TRAINING_DATA,
     public_training_code=None,
     public_training_data=None,
+    superseded_by="voyageai/voyage-4",
 )
 
 voyage_3_5_int8 = ModelMeta(

From daa019cde77f3e3416f9655e78672e37d04d1add Mon Sep 17 00:00:00 2001
From: fzoll
Date: Tue, 13 Jan 2026 21:11:12 +0100
Subject: [PATCH 2/2] Adding voyage-4 model configs

---
Reviewer note: adds total-token limits for the three voyage-4 model names
to VOYAGE_TOTAL_TOKEN_LIMITS; the values mirror the existing entries'
magnitudes and should be checked against the VoyageAI documentation the
in-file comment refers to.

 mteb/models/model_implementations/voyage_models.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/mteb/models/model_implementations/voyage_models.py b/mteb/models/model_implementations/voyage_models.py
index 55a0eb5aa4..c3a299da0f 100644
--- a/mteb/models/model_implementations/voyage_models.py
+++ b/mteb/models/model_implementations/voyage_models.py
@@ -25,6 +25,9 @@
 
 # Total token limits per model based on VoyageAI documentation
 VOYAGE_TOTAL_TOKEN_LIMITS = {
+    "voyage-4-large": 120_000,
+    "voyage-4": 320_000,
+    "voyage-4-lite": 1_000_000,
     "voyage-3.5-lite": 1_000_000,
     "voyage-3.5": 320_000,
     "voyage-2": 320_000,