diff --git a/mteb/models/qzhou_models.py b/mteb/models/qzhou_models.py index bab9fb969e..6fdb90afcb 100644 --- a/mteb/models/qzhou_models.py +++ b/mteb/models/qzhou_models.py @@ -42,6 +42,8 @@ def instruction_template( "TweetSentimentExtractionClassification": ["train"], } +qzhou_zh_training_data = {"LCQMC": ["train"], "PAWSX": ["train"]} + QZhou_Embedding = ModelMeta( loader=partial( InstructSentenceTransformerWrapper, @@ -78,3 +80,32 @@ def instruction_template( # "infgrad/retrieval_data_llm": ["train"], }, ) + +QZhou_Embedding_Zh = ModelMeta( + loader=partial( + InstructSentenceTransformerWrapper, + model_name="Kingsoft-LLM/QZhou-Embedding-Zh", + revision="0321ccb126413d1e49c5ce908e802b63d35f18e2", + instruction_template=instruction_template, + apply_instruction_to_passages=False, + ), + name="Kingsoft-LLM/QZhou-Embedding-Zh", + languages=["zho-Hans"], + open_weights=True, + revision="0321ccb126413d1e49c5ce908e802b63d35f18e2", + release_date="2025-09-28", + n_parameters=7_575_747_328, + memory_usage_mb=29431, + embed_dim=1792, + license="apache-2.0", + max_tokens=8192, + reference="http://huggingface.co/Kingsoft-LLM/QZhou-Embedding-Zh", + similarity_fn_name="cosine", + framework=["Sentence Transformers", "PyTorch"], + use_instructions=True, + public_training_code=None, + public_training_data=None, + training_datasets={ + **qzhou_zh_training_data, + }, +)