diff --git a/mteb/abstasks/TaskMetadata.py b/mteb/abstasks/TaskMetadata.py index 09582d779b..c7b6839015 100644 --- a/mteb/abstasks/TaskMetadata.py +++ b/mteb/abstasks/TaskMetadata.py @@ -98,9 +98,15 @@ "Summarization", "InstructionRetrieval", "Speed", - "ZeroShotClassification", - "ImageTextPairClassification", + "Any2AnyMultiChoice", + "Any2AnyRetrieval", "Any2TextMutipleChoice", + "ImageClustering", + "ImageClassification", + "ImageMultilabelClassification", + "ImageTextPairClassification", + "VisualSTS", + "ZeroShotClassification", ] TASK_CATEGORY = Literal[ diff --git a/mteb/models/e5_v.py b/mteb/models/e5_v.py index b3287f274c..70bc20cabf 100644 --- a/mteb/models/e5_v.py +++ b/mteb/models/e5_v.py @@ -5,6 +5,7 @@ import torch from PIL import Image +from torch.utils.data import DataLoader from tqdm import tqdm from transformers import LlavaNextForConditionalGeneration, LlavaNextProcessor @@ -56,9 +57,23 @@ def get_text_embeddings(self, texts: list[str], batch_size: int = 8): all_text_embeddings.append(text_outputs.cpu()) return torch.cat(all_text_embeddings, dim=0) - def get_image_embeddings(self, images: list[Image.Image], batch_size: int = 8): + def get_image_embeddings( + self, images: list[Image.Image] | DataLoader, batch_size: int = 8 + ): all_image_embeddings = [] + if isinstance(images, DataLoader): + for batch_images in tqdm(images): + img_inputs = self.processor( + [self.img_prompt] * len(batch_images), + batch_images, + return_tensors="pt", + padding=True, + ).to("cuda") + image_outputs = self.model( + **img_inputs, output_hidden_states=True, return_dict=True + ).hidden_states[-1][:, -1, :] + all_image_embeddings.append(image_outputs.cpu()) with torch.no_grad(): for i in tqdm(range(0, len(images), batch_size)): batch_images = images[i : i + batch_size] @@ -95,24 +110,41 @@ def get_fused_embeddings( all_fused_embeddings = [] if texts is not None and images is not None: - if len(texts) != len(images): - raise ValueError( - "The number of texts and images 
must have the same length" - ) - with torch.no_grad(): - for i in tqdm(range(0, len(images), batch_size)): - batch_texts = texts[i : i + batch_size] - batch_images = images[i : i + batch_size] - prompts = [ - self.composed_prompt.format(text) for text in batch_texts - ] - inputs = self.processor( - prompts, batch_images, return_tensors="pt", padding=True - ).to("cuda") - outputs = self.model( - **inputs, output_hidden_states=True, return_dict=True - ).hidden_states[-1][:, -1, :] - all_fused_embeddings.append(outputs.cpu()) + if isinstance(images, DataLoader): + with torch.no_grad(): + for index, batch_images in enumerate(tqdm(images)): + batch_texts = texts[ + index * batch_size : (index + 1) * batch_size + ] + prompts = [ + self.composed_prompt.format(text) for text in batch_texts + ] + inputs = self.processor( + prompts, batch_images, return_tensors="pt", padding=True + ).to("cuda") + outputs = self.model( + **inputs, output_hidden_states=True, return_dict=True + ).hidden_states[-1][:, -1, :] + all_fused_embeddings.append(outputs.cpu()) + else: + if len(texts) != len(images): + raise ValueError( + "The number of texts and images must have the same length" + ) + with torch.no_grad(): + for i in tqdm(range(0, len(images), batch_size)): + batch_texts = texts[i : i + batch_size] + batch_images = images[i : i + batch_size] + prompts = [ + self.composed_prompt.format(text) for text in batch_texts + ] + inputs = self.processor( + prompts, batch_images, return_tensors="pt", padding=True + ).to("cuda") + outputs = self.model( + **inputs, output_hidden_states=True, return_dict=True + ).hidden_states[-1][:, -1, :] + all_fused_embeddings.append(outputs.cpu()) return torch.cat(all_fused_embeddings, dim=0) elif texts is not None: diff --git a/mteb/models/vista_models.py b/mteb/models/vista_models.py index 007bbfe37f..c86fdcd5b6 100644 --- a/mteb/models/vista_models.py +++ b/mteb/models/vista_models.py @@ -1,13 +1,18 @@ from __future__ import annotations from functools import 
partial +from typing import Any import torch from PIL import Image +from torch.utils.data import DataLoader +from torchvision import transforms from tqdm import tqdm from mteb.model_meta import ModelMeta +tensor_to_image = transforms.Compose([transforms.ToPILImage()]) + def vista_loader(**kwargs): try: # a temporal fix for the dependency issues of vista models. @@ -27,6 +32,7 @@ def __init__( negatives_cross_device: bool = False, temperature: float = 0.02, from_pretrained=None, + **kwargs: Any, ): super().__init__( model_name_bge=model_name_bge, @@ -88,15 +94,21 @@ def encode_text(self, texts): t_reps = torch.nn.functional.normalize(t_reps, dim=-1) return t_reps.contiguous() - def encode(self, images=None, texts=None): + def encode(self, images=None, texts=None, tensors=False): if images is not None: if isinstance(images, list): - images = [ - self.preprocess_val( - img if isinstance(img, Image.Image) else Image.open(img) - ) - for img in images - ] + if not tensors: + images = [ + self.preprocess_val( + img if isinstance(img, Image.Image) else Image.open(img) + ) + for img in images + ] + else: + images = [ + self.preprocess_val(tensor_to_image(image)) + for image in images + ] images = torch.stack(images) if texts is not None: texts = self.tokenizer(texts, return_tensors="pt", padding=True) @@ -119,31 +131,52 @@ def get_text_embeddings(self, texts: list[str], batch_size: int = 32): all_text_embeddings.append(batch_embeddings.cpu()) return torch.cat(all_text_embeddings, dim=0) - def get_image_embeddings(self, images: list[Image.Image], batch_size: int = 32): + def get_image_embeddings( + self, images: list[Image.Image] | DataLoader, batch_size: int = 32 + ): all_image_embeddings = [] - for i in tqdm(range(0, len(images), batch_size)): - batch_images = images[i : i + batch_size] + + if isinstance(images, DataLoader): with torch.no_grad(): - batch_embeddings = self.encode(images=batch_images) - all_image_embeddings.append(batch_embeddings.cpu()) + for batch in 
tqdm(images): + batch_embeddings = self.encode(images=batch, tensors=True) + all_image_embeddings.append(batch_embeddings.cpu()) + else: + with torch.no_grad(): + for i in tqdm(range(0, len(images), batch_size)): + batch_images = images[i : i + batch_size] + batch_embeddings = self.encode(images=batch_images) + all_image_embeddings.append(batch_embeddings.cpu()) return torch.cat(all_image_embeddings, dim=0) def get_fused_embeddings( self, texts: list[str] = None, - images: list[Image.Image] = None, + images: list[Image.Image] | DataLoader = None, batch_size: int = 32, ): all_embeddings = [] - assert len(texts) == len(images) - for i in tqdm(range(0, len(texts), batch_size)): - batch_texts = texts[i : i + batch_size] - batch_images = images[i : i + batch_size] + + if isinstance(images, DataLoader): + with torch.no_grad(): + for index, batch_images in enumerate(tqdm(images)): + batch_texts = texts[ + index * batch_size : (index + 1) * batch_size + ] + batch_embeddings = self.encode( + images=batch_images, texts=batch_texts, tensors=True + ) + all_embeddings.append(batch_embeddings.cpu()) + else: + assert len(texts) == len(images) with torch.no_grad(): - batch_embeddings = self.encode( - images=batch_images, texts=batch_texts - ) - all_embeddings.append(batch_embeddings.cpu()) + for i in tqdm(range(0, len(texts), batch_size)): + batch_texts = texts[i : i + batch_size] + batch_images = images[i : i + batch_size] + batch_embeddings = self.encode( + images=batch_images, texts=batch_texts + ) + all_embeddings.append(batch_embeddings.cpu()) return torch.cat(all_embeddings, dim=0) def calculate_probs(self, text_embeddings, image_embeddings): diff --git a/mteb/tasks/Image/Any2AnyMultiChoice/eng/ImageCoDeT2IMultiChoice.py b/mteb/tasks/Image/Any2AnyMultiChoice/eng/ImageCoDeT2IMultiChoice.py index 1f00290cdd..46fbb5b990 100644 --- a/mteb/tasks/Image/Any2AnyMultiChoice/eng/ImageCoDeT2IMultiChoice.py +++ b/mteb/tasks/Image/Any2AnyMultiChoice/eng/ImageCoDeT2IMultiChoice.py @@ 
-13,7 +13,7 @@ class ImageCoDeT2IMultiChoice(AbsTaskAny2AnyMultiChoice): "path": "JamieSJS/imagecode-multi", "revision": "d28adfd8b34fefa546fdf94bdc352622b2575f6c", }, - type="Retrieval", + type="Any2AnyMultiChoice", category="t2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/BLINKIT2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/BLINKIT2IRetrieval.py index ca265fd898..cd1ce67e4a 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/BLINKIT2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/BLINKIT2IRetrieval.py @@ -14,7 +14,7 @@ class BLINKIT2IRetrieval(AbsTaskAny2AnyRetrieval): "revision": "359b66f11c25d19bc8f7108d98e660a5857f3d26", "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="it2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/BLINKIT2TRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/BLINKIT2TRetrieval.py index 2c652c6388..d0fb86ba90 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/BLINKIT2TRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/BLINKIT2TRetrieval.py @@ -14,7 +14,7 @@ class BLINKIT2TRetrieval(AbsTaskAny2AnyRetrieval): "revision": "4ab83c87ac5b24e3b730f86d585671493a3a423c", "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="it2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/CIRRIT2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/CIRRIT2IRetrieval.py index 2e45933ea3..b215dfda06 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/CIRRIT2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/CIRRIT2IRetrieval.py @@ -14,7 +14,7 @@ class CIRRIT2IRetrieval(AbsTaskAny2AnyRetrieval): "revision": "503301cd99348035b9675883a543aa1ded0cf07c", "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="it2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git 
a/mteb/tasks/Image/Any2AnyRetrieval/eng/CUB200I2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/CUB200I2IRetrieval.py index c33f706c63..048f5a33bf 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/CUB200I2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/CUB200I2IRetrieval.py @@ -13,7 +13,7 @@ class CUB200I2I(AbsTaskAny2AnyRetrieval): "path": "isaacchung/cub200_retrieval", "revision": "ad08c1307b15a226bf1b64e62656a17f1f85f7ec", }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/FORBI2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/FORBI2IRetrieval.py index 051aa324e6..c358ee6507 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/FORBI2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/FORBI2IRetrieval.py @@ -11,9 +11,9 @@ class FORBI2I(AbsTaskAny2AnyRetrieval): reference="https://github.com/pxiangwu/FORB", dataset={ "path": "isaacchung/forb_retrieval", - "revision": "336607d5bcc853fb7f7276c2c9721d4b5b1ca8e4", + "revision": "26ab4bd972854becada339afc80f5f3ffc047e2b", }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/Fashion200kI2TRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/Fashion200kI2TRetrieval.py index 3e24c8691f..04fad6e352 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/Fashion200kI2TRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/Fashion200kI2TRetrieval.py @@ -14,7 +14,7 @@ class Fashion200kI2TRetrieval(AbsTaskAny2AnyRetrieval): "revision": "96a313715ecf67f5dfe70c4fa52406bc7bdfbeee", # "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/Fashion200kT2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/Fashion200kT2IRetrieval.py index 
f54a3a38b2..54a1c24cf1 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/Fashion200kT2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/Fashion200kT2IRetrieval.py @@ -14,7 +14,7 @@ class Fashion200kT2IRetrieval(AbsTaskAny2AnyRetrieval): "revision": "1b86e2dde50e671d5c83d07a79e8b1d8c696964b", # "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="t2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/FashionIQIT2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/FashionIQIT2IRetrieval.py index 6072354fe6..45b8e10576 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/FashionIQIT2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/FashionIQIT2IRetrieval.py @@ -14,7 +14,7 @@ class FashionIQIT2IRetrieval(AbsTaskAny2AnyRetrieval): "revision": "e6f0ec70becc413d940cd62b2cfa3b1d3a08c31a", # "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="it2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/Flickr30kI2TRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/Flickr30kI2TRetrieval.py index f7278bcf37..267cf860b9 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/Flickr30kI2TRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/Flickr30kI2TRetrieval.py @@ -13,7 +13,7 @@ class Flickr30kI2TRetrieval(AbsTaskAny2AnyRetrieval): "path": "JamieSJS/flickr30k", "revision": "a4cf34ac79215f9e2cd6a10342d84f606fc41cc3", }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/Flickr30kT2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/Flickr30kT2IRetrieval.py index 44164c90b6..576e6afa50 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/Flickr30kT2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/Flickr30kT2IRetrieval.py @@ -13,7 +13,7 @@ class 
Flickr30kT2IRetrieval(AbsTaskAny2AnyRetrieval): "path": "JamieSJS/flickr30k", "revision": "a4cf34ac79215f9e2cd6a10342d84f606fc41cc3", }, - type="Retrieval", + type="Any2AnyRetrieval", category="t2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/GLDv2I2TRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/GLDv2I2TRetrieval.py index 9539ef31b3..67b238a470 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/GLDv2I2TRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/GLDv2I2TRetrieval.py @@ -13,7 +13,7 @@ class GLDv2I2TRetrieval(AbsTaskAny2AnyRetrieval): "path": "JamieSJS/gld-v2-i2t", "revision": "d8c3e53160860f76de73ed3041a8593672fe5928", }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/HatefulMemesI2TRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/HatefulMemesI2TRetrieval.py index c92a497914..40323d3636 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/HatefulMemesI2TRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/HatefulMemesI2TRetrieval.py @@ -68,7 +68,7 @@ class HatefulMemesI2TRetrieval(AbsTaskAny2AnyRetrieval): "revision": "c9a9a6c3ef0765622a6de0af6ebb68f323ad73ba", # "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/HatefulMemesT2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/HatefulMemesT2IRetrieval.py index 067396752a..fec70177db 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/HatefulMemesT2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/HatefulMemesT2IRetrieval.py @@ -68,7 +68,7 @@ class HatefulMemesT2IRetrieval(AbsTaskAny2AnyRetrieval): "revision": "c9a9a6c3ef0765622a6de0af6ebb68f323ad73ba", # "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="t2i", eval_splits=["test"], 
eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/ImageCoDeT2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/ImageCoDeT2IRetrieval.py index 3fae916f6b..6e34640459 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/ImageCoDeT2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/ImageCoDeT2IRetrieval.py @@ -13,7 +13,7 @@ class ImageCoDeT2IRetrieval(AbsTaskAny2AnyRetrieval): "path": "JamieSJS/imagecode", "revision": "a424cd523ffb157b69a875fb5e71c1d51be54089", }, - type="Retrieval", + type="Any2AnyRetrieval", category="t2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/InfoSeekIT2ITRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/InfoSeekIT2ITRetrieval.py index e35da59fcb..abc71666aa 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/InfoSeekIT2ITRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/InfoSeekIT2ITRetrieval.py @@ -14,7 +14,7 @@ class InfoSeekIT2ITRetrieval(AbsTaskAny2AnyRetrieval): "revision": "78ee7f7708aac75d3afac5dcab1c9e03cb62664c", "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="it2it", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/InfoSeekIT2TRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/InfoSeekIT2TRetrieval.py index 4d88a7ac80..a856969e75 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/InfoSeekIT2TRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/InfoSeekIT2TRetrieval.py @@ -14,7 +14,7 @@ class InfoSeekIT2TRetrieval(AbsTaskAny2AnyRetrieval): "revision": "d4f4606f7a42bbf311c2957419ef3734fe81c47f", "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="it2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/METI2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/METI2IRetrieval.py index e46b2635e5..b0578c5944 100644 --- 
a/mteb/tasks/Image/Any2AnyRetrieval/eng/METI2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/METI2IRetrieval.py @@ -13,7 +13,7 @@ class METI2IRetrieval(AbsTaskAny2AnyRetrieval): "path": "JamieSJS/met", "revision": "08ceaa61c0d172214abb3b8e82971d8f69d2aec0", }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/MSCOCOI2TRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/MSCOCOI2TRetrieval.py index dff57f5a53..8652b2e8e0 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/MSCOCOI2TRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/MSCOCOI2TRetrieval.py @@ -14,7 +14,7 @@ class MSCOCOI2TRetrieval(AbsTaskAny2AnyRetrieval): "revision": "cca3a3e223763e6519a4d68936bc9279034d75d2", "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/MSCOCOT2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/MSCOCOT2IRetrieval.py index 9ce5fd839e..4797e98911 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/MSCOCOT2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/MSCOCOT2IRetrieval.py @@ -14,7 +14,7 @@ class MSCOCOT2IRetrieval(AbsTaskAny2AnyRetrieval): "revision": "cfe15bd2791dde5f8f20aebecf0b4eb3812972d6", "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="t2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/MemotionI2TRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/MemotionI2TRetrieval.py index 5eda9cd295..c9d671d9d6 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/MemotionI2TRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/MemotionI2TRetrieval.py @@ -97,7 +97,7 @@ class MemotionI2TRetrieval(AbsTaskAny2AnyRetrieval): "revision": "cdb15b61d84d56db73e0e59535dfea81ea3c22f4", # "trust_remote_code": True, }, - 
type="Retrieval", + type="Any2AnyRetrieval", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/MemotionT2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/MemotionT2IRetrieval.py index b82b6367a5..331e628f24 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/MemotionT2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/MemotionT2IRetrieval.py @@ -96,7 +96,7 @@ class MemotionT2IRetrieval(AbsTaskAny2AnyRetrieval): "revision": "cdb15b61d84d56db73e0e59535dfea81ea3c22f4", # "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="t2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/NIGHTSI2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/NIGHTSI2IRetrieval.py index 3c7798c77c..ae0d91a6b5 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/NIGHTSI2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/NIGHTSI2IRetrieval.py @@ -13,7 +13,7 @@ class NIGHTSI2IRetrieval(AbsTaskAny2AnyRetrieval): "path": "MRBench/mbeir_nights_task4", "revision": "c9583e052be7ad52d870c62a207a2e887ba9b8aa", }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/OVENIT2ITRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/OVENIT2ITRetrieval.py index 0a720ec995..9bac08fa34 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/OVENIT2ITRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/OVENIT2ITRetrieval.py @@ -13,7 +13,7 @@ class OVENIT2ITRetrieval(AbsTaskAny2AnyRetrieval): "path": "MRBench/mbeir_oven_task8", "revision": "350d14b7258189654e26a2be93dc0bd6bee09b76", }, - type="Retrieval", + type="Any2AnyRetrieval", category="it2it", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/OVENIT2TRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/OVENIT2TRetrieval.py index 
2c171c778d..0877cfdf33 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/OVENIT2TRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/OVENIT2TRetrieval.py @@ -13,7 +13,7 @@ class OVENIT2TRetrieval(AbsTaskAny2AnyRetrieval): "path": "MRBench/mbeir_oven_task6", "revision": "2192074af29422bc1dc41cf07936f198b8c69bd0", }, - type="Retrieval", + type="Any2AnyRetrieval", category="it2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/ROxfordI2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/ROxfordI2IRetrieval.py index 39502a46d8..dc43e34e29 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/ROxfordI2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/ROxfordI2IRetrieval.py @@ -13,7 +13,7 @@ class ROxfordI2IRetrieval(AbsTaskAny2AnyRetrieval): "path": "JamieSJS/r-oxford", "revision": "d8daad98b4e4896a7f7fa1b3485a22420242d4fc", }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/RP2kI2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/RP2kI2IRetrieval.py index 321bb818be..61cd189fce 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/RP2kI2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/RP2kI2IRetrieval.py @@ -13,7 +13,7 @@ class RP2kI2IRetrieval(AbsTaskAny2AnyRetrieval): "path": "JamieSJS/rp2k", "revision": "f8f82d4eb1aa4dc4dbf2c768596c8110a3703765", }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/RParisI2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/RParisI2IRetrieval.py index a112ded273..258ec836c6 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/RParisI2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/RParisI2IRetrieval.py @@ -13,7 +13,7 @@ class RParisI2IRetrieval(AbsTaskAny2AnyRetrieval): "path": "JamieSJS/r-paris", "revision": 
"bafc3a08fdffd72558021ce3a41250833d7e0e88", }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/SOPI2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/SOPI2IRetrieval.py index 09b33aac7d..5d754fe0e6 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/SOPI2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/SOPI2IRetrieval.py @@ -13,7 +13,7 @@ class SOPI2IRetrieval(AbsTaskAny2AnyRetrieval): "path": "JamieSJS/stanford-online-products", "revision": "0b3a1622902e6258425e673405bdfb1e5dfa8618", }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/SciMMIRI2TRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/SciMMIRI2TRetrieval.py index cc96d134a0..0f7acedab0 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/SciMMIRI2TRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/SciMMIRI2TRetrieval.py @@ -73,7 +73,7 @@ class SciMMIRI2TRetrieval(AbsTaskAny2AnyRetrieval): "revision": "eea276dc58c52eab33e9476acb137ff5530b78e9", # "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/SciMMIRT2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/SciMMIRT2IRetrieval.py index 41c2c98e79..987a00ea6d 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/SciMMIRT2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/SciMMIRT2IRetrieval.py @@ -73,7 +73,7 @@ class SciMMIRT2IRetrieval(AbsTaskAny2AnyRetrieval): "revision": "eea276dc58c52eab33e9476acb137ff5530b78e9", # "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="t2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/SketchyI2IRetrieval.py 
b/mteb/tasks/Image/Any2AnyRetrieval/eng/SketchyI2IRetrieval.py index c89091f41d..5a4b13ec94 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/SketchyI2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/SketchyI2IRetrieval.py @@ -13,7 +13,7 @@ class SketchyI2IRetrieval(AbsTaskAny2AnyRetrieval): "path": "JamieSJS/sketchy", "revision": "c8b8c1b7a2f0a92f1bfaaa1c9afc22aa42c61d5b", }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/StanfordCarsI2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/StanfordCarsI2IRetrieval.py index 4a053f8cc0..e98633e899 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/StanfordCarsI2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/StanfordCarsI2IRetrieval.py @@ -13,7 +13,7 @@ class StanfordCarsI2I(AbsTaskAny2AnyRetrieval): "path": "isaacchung/stanford_cars_retrieval", "revision": "b27a0612211af3598bd11fe28af20928f20cce06", }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/TUBerlinT2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/TUBerlinT2IRetrieval.py index 754fa14911..fe1c2891db 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/TUBerlinT2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/TUBerlinT2IRetrieval.py @@ -14,7 +14,7 @@ class TUBerlinT2IRetrieval(AbsTaskAny2AnyRetrieval): "revision": "0cd78cd1ddbd3cafa9f319c638ebd77836ec9ff6", # "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="t2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/VQA2IT2TRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/VQA2IT2TRetrieval.py index cb5c3b38e5..58e1c5d31e 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/VQA2IT2TRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/VQA2IT2TRetrieval.py @@ -14,7 
+14,7 @@ class VQA2IT2TRetrieval(AbsTaskAny2AnyRetrieval): "revision": "69882b6ba0b443dd62e633e546725b0f13b7e3aa", "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="it2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/VidoreBenchRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/VidoreBenchRetrieval.py index 6365b7adb3..fc73789541 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/VidoreBenchRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/VidoreBenchRetrieval.py @@ -100,7 +100,7 @@ class VidoreArxivQARetrieval(AbsTaskAny2AnyRetrieval): "path": "vidore/arxivqa_test_subsampled", "revision": "fe2b0e055eaac82d8f6801ebc8e85d8832248133", }, - type="Retrieval", + type="Any2AnyRetrieval", category="t2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/VisualNewsI2TRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/VisualNewsI2TRetrieval.py index bf99c199a8..a36f5ea5fe 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/VisualNewsI2TRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/VisualNewsI2TRetrieval.py @@ -13,7 +13,7 @@ class VisualNewsI2TRetrieval(AbsTaskAny2AnyRetrieval): "path": "MRBench/mbeir_visualnews_task3", "revision": "aaee58895a66e4d619168849267ed2bb40d37043", }, - type="Retrieval", + type="Any2AnyRetrieval", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/VisualNewsT2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/VisualNewsT2IRetrieval.py index 8bd3f8278f..aae9882d52 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/VisualNewsT2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/VisualNewsT2IRetrieval.py @@ -13,7 +13,7 @@ class VisualNewsT2IRetrieval(AbsTaskAny2AnyRetrieval): "path": "MRBench/mbeir_visualnews_task0", "revision": "94c519d850dba2b0058c2fc9b5da6142a59aa285", }, - type="Retrieval", + type="Any2AnyRetrieval", 
category="t2i", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/VizWizIT2TRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/VizWizIT2TRetrieval.py index 5565ca9f50..076f003b2b 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/VizWizIT2TRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/VizWizIT2TRetrieval.py @@ -14,7 +14,7 @@ class VizWizIT2TRetrieval(AbsTaskAny2AnyRetrieval): "revision": "044af162d55f82ab603fa16ffcf7f1e4dbf300e9", "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="it2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/WebQAT2ITRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/WebQAT2ITRetrieval.py index b3f21869ed..fabbf48ed4 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/WebQAT2ITRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/WebQAT2ITRetrieval.py @@ -13,7 +13,7 @@ class WebQAT2ITRetrieval(AbsTaskAny2AnyRetrieval): "path": "MRBench/mbeir_webqa_task2", "revision": "53db4c9f9c93cb74926a1c9d04dea7d7acac2f21", }, - type="Retrieval", + type="Any2AnyRetrieval", category="t2it", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/eng/WebQAT2TRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/eng/WebQAT2TRetrieval.py index f53415087e..a98ee514a9 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/eng/WebQAT2TRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/eng/WebQAT2TRetrieval.py @@ -13,7 +13,7 @@ class WebQAT2TRetrieval(AbsTaskAny2AnyRetrieval): "path": "MRBench/mbeir_webqa_task1", "revision": "468b42a2b2e767d80d2d93f5ae5d42f135a10478", }, - type="Retrieval", + type="Any2AnyRetrieval", category="s2p", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Any2AnyRetrieval/multilingual/WITT2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/multilingual/WITT2IRetrieval.py index 5de06b937f..ee8b8c4148 100644 --- 
a/mteb/tasks/Image/Any2AnyRetrieval/multilingual/WITT2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/multilingual/WITT2IRetrieval.py @@ -101,7 +101,7 @@ class WITT2IRetrieval(MultilingualTask, AbsTaskAny2AnyRetrieval): "revision": "91ac153f1371a98b209ed763205e25e115ecd06e", # "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="t2i", eval_splits=["test"], eval_langs=_LANGUAGES, diff --git a/mteb/tasks/Image/Any2AnyRetrieval/multilingual/XFlickr30kCoT2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/multilingual/XFlickr30kCoT2IRetrieval.py index 65c886f314..507639a4df 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/multilingual/XFlickr30kCoT2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/multilingual/XFlickr30kCoT2IRetrieval.py @@ -84,7 +84,7 @@ class XFlickr30kCoT2IRetrieval(MultilingualTask, AbsTaskAny2AnyRetrieval): "revision": "0af2c2eba58b27a71898787e286be04befdd7a20", # "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="t2i", eval_splits=["test"], eval_langs=_LANGUAGES, diff --git a/mteb/tasks/Image/Any2AnyRetrieval/multilingual/XM3600T2IRetrieval.py b/mteb/tasks/Image/Any2AnyRetrieval/multilingual/XM3600T2IRetrieval.py index 687c9f0446..7e78db8193 100644 --- a/mteb/tasks/Image/Any2AnyRetrieval/multilingual/XM3600T2IRetrieval.py +++ b/mteb/tasks/Image/Any2AnyRetrieval/multilingual/XM3600T2IRetrieval.py @@ -129,7 +129,7 @@ class XM3600T2IRetrieval(MultilingualTask, AbsTaskAny2AnyRetrieval): "revision": "8d3e5665526c55a5855cd6ddfbaba2032bc7cee4", # "trust_remote_code": True, }, - type="Retrieval", + type="Any2AnyRetrieval", category="t2i", eval_splits=["test"], eval_langs=_LANGUAGES, diff --git a/mteb/tasks/Image/Any2TextMultipleChoice/eng/CVBench.py b/mteb/tasks/Image/Any2TextMultipleChoice/eng/CVBench.py index e42ec28f76..bb3c5db181 100644 --- a/mteb/tasks/Image/Any2TextMultipleChoice/eng/CVBench.py +++ b/mteb/tasks/Image/Any2TextMultipleChoice/eng/CVBench.py @@ -36,10 +36,10 
@@ class CVBenchCount(AbsTaskAny2TextMultipleChoice): dialect=[], modalities=["text", "image"], sample_creation="found", - bibtex_citation="""@article{wu2024scimmir, - title={placeholder}, - author={placeholder and others}, - journal={arXiv preprint arXiv:2401.13478}, + bibtex_citation="""@article{tong2024cambrian, + title={Cambrian-1: A fully open, vision-centric exploration of multimodal llms}, + author={Tong, Shengbang and Brown, Ellis and Wu, Penghao and Woo, Sanghyun and Middepogu, Manoj and Akula, Sai Charitha and Yang, Jihan and Yang, Shusheng and Iyer, Adithya and Pan, Xichen and others}, + journal={arXiv preprint arXiv:2406.16860}, year={2024} }""", descriptive_stats={ @@ -96,10 +96,10 @@ class CVBenchRelation(AbsTaskAny2TextMultipleChoice): dialect=[], modalities=["text", "image"], sample_creation="found", - bibtex_citation="""@article{wu2024scimmir, - title={placeholder}, - author={placeholder and others}, - journal={arXiv preprint arXiv:2401.13478}, + bibtex_citation="""@article{tong2024cambrian, + title={Cambrian-1: A fully open, vision-centric exploration of multimodal llms}, + author={Tong, Shengbang and Brown, Ellis and Wu, Penghao and Woo, Sanghyun and Middepogu, Manoj and Akula, Sai Charitha and Yang, Jihan and Yang, Shusheng and Iyer, Adithya and Pan, Xichen and others}, + journal={arXiv preprint arXiv:2406.16860}, year={2024} }""", descriptive_stats={ @@ -158,10 +158,10 @@ class CVBenchDepth(AbsTaskAny2TextMultipleChoice): dialect=[], modalities=["text", "image"], sample_creation="found", - bibtex_citation="""@article{wu2024scimmir, - title={placeholder}, - author={placeholder and others}, - journal={arXiv preprint arXiv:2401.13478}, + bibtex_citation="""@article{tong2024cambrian, + title={Cambrian-1: A fully open, vision-centric exploration of multimodal llms}, + author={Tong, Shengbang and Brown, Ellis and Wu, Penghao and Woo, Sanghyun and Middepogu, Manoj and Akula, Sai Charitha and Yang, Jihan and Yang, Shusheng and Iyer, Adithya and Pan, 
Xichen and others}, + journal={arXiv preprint arXiv:2406.16860}, year={2024} }""", descriptive_stats={ diff --git a/mteb/tasks/Image/Clustering/eng/CIFAR.py b/mteb/tasks/Image/Clustering/eng/CIFAR.py index 61250cc3f5..e9a0429cf9 100644 --- a/mteb/tasks/Image/Clustering/eng/CIFAR.py +++ b/mteb/tasks/Image/Clustering/eng/CIFAR.py @@ -13,7 +13,7 @@ class CIFAR10Clustering(AbsTaskImageClustering): "path": "uoft-cs/cifar10", "revision": "0b2714987fa478483af9968de7c934580d0bb9a2", }, - type="Clustering", + type="ImageClustering", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Clustering/eng/ImageNet.py b/mteb/tasks/Image/Clustering/eng/ImageNet.py index daf8ab8dae..381b3d9d91 100644 --- a/mteb/tasks/Image/Clustering/eng/ImageNet.py +++ b/mteb/tasks/Image/Clustering/eng/ImageNet.py @@ -13,7 +13,7 @@ class ImageNetDog15Clustering(AbsTaskImageClustering): "path": "JamieSJS/imagenet-dog-15", "revision": "bfb6ad3b2109d26c9daddf14f98d315daa35ee72", }, - type="Clustering", + type="ImageClustering", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/Clustering/eng/TinyImageNet.py b/mteb/tasks/Image/Clustering/eng/TinyImageNet.py index 14123e2111..96c557e3ab 100644 --- a/mteb/tasks/Image/Clustering/eng/TinyImageNet.py +++ b/mteb/tasks/Image/Clustering/eng/TinyImageNet.py @@ -13,7 +13,7 @@ class TinyImageNet(AbsTaskImageClustering): "path": "zh-plus/tiny-imagenet", "revision": "5a77092c28e51558c5586e9c5eb71a7e17a5e43f", }, - type="Clustering", + type="ImageClustering", category="s2s", eval_splits=["valid"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/BirdsnapClassification.py b/mteb/tasks/Image/ImageClassification/eng/BirdsnapClassification.py index f29259ae2a..cf9a18cc46 100644 --- a/mteb/tasks/Image/ImageClassification/eng/BirdsnapClassification.py +++ b/mteb/tasks/Image/ImageClassification/eng/BirdsnapClassification.py @@ -13,7 +13,7 @@ class 
BirdsnapClassification(AbsTaskImageClassification): "path": "isaacchung/birdsnap", "revision": "e09b9dea248d579376684268cbedba28cd66b9b4", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/CIFAR.py b/mteb/tasks/Image/ImageClassification/eng/CIFAR.py index 2fe4fc2808..7560bff77e 100644 --- a/mteb/tasks/Image/ImageClassification/eng/CIFAR.py +++ b/mteb/tasks/Image/ImageClassification/eng/CIFAR.py @@ -13,7 +13,7 @@ class CIFAR10Classification(AbsTaskImageClassification): "path": "uoft-cs/cifar10", "revision": "0b2714987fa478483af9968de7c934580d0bb9a2", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/Caltech101Classification.py b/mteb/tasks/Image/ImageClassification/eng/Caltech101Classification.py index 5c79a41046..0e00980428 100644 --- a/mteb/tasks/Image/ImageClassification/eng/Caltech101Classification.py +++ b/mteb/tasks/Image/ImageClassification/eng/Caltech101Classification.py @@ -14,7 +14,7 @@ class Caltech101Classification(AbsTaskImageClassification): "name": "with_background_category", "revision": "851374102055782c84f89b1b4e9d128a6568847b", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/Country211Classification.py b/mteb/tasks/Image/ImageClassification/eng/Country211Classification.py index 5f34c09a14..7fcbd4b209 100644 --- a/mteb/tasks/Image/ImageClassification/eng/Country211Classification.py +++ b/mteb/tasks/Image/ImageClassification/eng/Country211Classification.py @@ -13,7 +13,7 @@ class Country211Classification(AbsTaskImageClassification): "path": "clip-benchmark/wds_country211", "revision": "1699f138f0558342a1cbf99f7cf36b4361bb5ebc", }, - type="Classification", + 
type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/DTDClassification.py b/mteb/tasks/Image/ImageClassification/eng/DTDClassification.py index aabb03f02a..6362785cb7 100644 --- a/mteb/tasks/Image/ImageClassification/eng/DTDClassification.py +++ b/mteb/tasks/Image/ImageClassification/eng/DTDClassification.py @@ -13,7 +13,7 @@ class DTDClassification(AbsTaskImageClassification): "path": "tanganke/dtd", "revision": "d2afa97d9f335b1a6b3b09c637aef667f98f966e", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/EuroSATClassification.py b/mteb/tasks/Image/ImageClassification/eng/EuroSATClassification.py index 6ef26a0dba..45638643de 100644 --- a/mteb/tasks/Image/ImageClassification/eng/EuroSATClassification.py +++ b/mteb/tasks/Image/ImageClassification/eng/EuroSATClassification.py @@ -13,7 +13,7 @@ class EuroSATClassification(AbsTaskImageClassification): "path": "timm/eurosat-rgb", "revision": "b4e28552cd5f3932b6abc37eb20d3e84901ad728", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/FER2013Classification.py b/mteb/tasks/Image/ImageClassification/eng/FER2013Classification.py index ea987fb4e2..49323aa4b6 100644 --- a/mteb/tasks/Image/ImageClassification/eng/FER2013Classification.py +++ b/mteb/tasks/Image/ImageClassification/eng/FER2013Classification.py @@ -13,7 +13,7 @@ class FER2013Classification(AbsTaskImageClassification): "path": "clip-benchmark/wds_fer2013", "revision": "9399b94167523fe5c40b3a857e24ef931ee4395b", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/FGVCAircraftClassification.py 
b/mteb/tasks/Image/ImageClassification/eng/FGVCAircraftClassification.py index 74659b5e92..3db3ef2d8c 100644 --- a/mteb/tasks/Image/ImageClassification/eng/FGVCAircraftClassification.py +++ b/mteb/tasks/Image/ImageClassification/eng/FGVCAircraftClassification.py @@ -13,7 +13,7 @@ class FGVCAircraftClassification(AbsTaskImageClassification): "path": "HuggingFaceM4/FGVC-Aircraft", "revision": "91860adfc9a09aabca5cddb5247442109b38e213", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/Food101Classification.py b/mteb/tasks/Image/ImageClassification/eng/Food101Classification.py index 34b2592e20..c508486997 100644 --- a/mteb/tasks/Image/ImageClassification/eng/Food101Classification.py +++ b/mteb/tasks/Image/ImageClassification/eng/Food101Classification.py @@ -13,7 +13,7 @@ class Food101Classification(AbsTaskImageClassification): "path": "ethz/food101", "revision": "e06acf2a88084f04bce4d4a525165d68e0a36c38", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["validation"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/GTSRBClassification.py b/mteb/tasks/Image/ImageClassification/eng/GTSRBClassification.py index 6596151327..29c5ccc4c0 100644 --- a/mteb/tasks/Image/ImageClassification/eng/GTSRBClassification.py +++ b/mteb/tasks/Image/ImageClassification/eng/GTSRBClassification.py @@ -13,7 +13,7 @@ class GTSRBClassification(AbsTaskImageClassification): "path": "clip-benchmark/wds_gtsrb", "revision": "1c13eff0803d2b02c9dc8dfe85e67770b3f0f3c5", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/Imagenet1k.py b/mteb/tasks/Image/ImageClassification/eng/Imagenet1k.py index d3b8474808..c8bfd62ce8 100644 --- a/mteb/tasks/Image/ImageClassification/eng/Imagenet1k.py +++ 
b/mteb/tasks/Image/ImageClassification/eng/Imagenet1k.py @@ -13,7 +13,7 @@ class Imagenet1kClassification(AbsTaskImageClassification): "path": "clip-benchmark/wds_imagenet1k", "revision": "b24c7a5a3ef12df09089055d1795e2ce7c7e7397", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/MNISTClassification.py b/mteb/tasks/Image/ImageClassification/eng/MNISTClassification.py index 4ea68ddea3..5e9b9a86af 100644 --- a/mteb/tasks/Image/ImageClassification/eng/MNISTClassification.py +++ b/mteb/tasks/Image/ImageClassification/eng/MNISTClassification.py @@ -13,7 +13,7 @@ class MNISTClassification(AbsTaskImageClassification): "path": "ylecun/mnist", "revision": "b06aab39e05f7bcd9635d18ed25d06eae523c574", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/OxfordFlowersClassification.py b/mteb/tasks/Image/ImageClassification/eng/OxfordFlowersClassification.py index d07badc30f..9e4a6f6aaa 100644 --- a/mteb/tasks/Image/ImageClassification/eng/OxfordFlowersClassification.py +++ b/mteb/tasks/Image/ImageClassification/eng/OxfordFlowersClassification.py @@ -13,7 +13,7 @@ class OxfordFlowersClassification(AbsTaskImageClassification): "path": "nelorth/oxford-flowers", "revision": "a37b1891609c0376fa81eced756e7863e1bd873b", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/OxfordPetsClassification.py b/mteb/tasks/Image/ImageClassification/eng/OxfordPetsClassification.py index 603dad1278..09935a2735 100644 --- a/mteb/tasks/Image/ImageClassification/eng/OxfordPetsClassification.py +++ b/mteb/tasks/Image/ImageClassification/eng/OxfordPetsClassification.py @@ -13,7 +13,7 @@ class 
OxfordPetsClassification(AbsTaskImageClassification): "path": "isaacchung/OxfordPets", "revision": "557b480fae8d69247be74d9503b378a09425096f", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/PatchCamelyonClassification.py b/mteb/tasks/Image/ImageClassification/eng/PatchCamelyonClassification.py index a6f9466672..0032266eaa 100644 --- a/mteb/tasks/Image/ImageClassification/eng/PatchCamelyonClassification.py +++ b/mteb/tasks/Image/ImageClassification/eng/PatchCamelyonClassification.py @@ -13,7 +13,7 @@ class PatchCamelyonClassification(AbsTaskImageClassification): "path": "clip-benchmark/wds_vtab-pcam", "revision": "502695fe1a141108650e3c5b91c8b5e0ff84ed49", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/RESISC45Classification.py b/mteb/tasks/Image/ImageClassification/eng/RESISC45Classification.py index c767e3b334..d73abc76b9 100644 --- a/mteb/tasks/Image/ImageClassification/eng/RESISC45Classification.py +++ b/mteb/tasks/Image/ImageClassification/eng/RESISC45Classification.py @@ -13,7 +13,7 @@ class RESISC45Classification(AbsTaskImageClassification): "path": "timm/resisc45", "revision": "fe12fc5f1b7606543b0355eda392f1ddc54625c6", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/STL10Classification.py b/mteb/tasks/Image/ImageClassification/eng/STL10Classification.py index 02593fe4e3..fe25c9d3d7 100644 --- a/mteb/tasks/Image/ImageClassification/eng/STL10Classification.py +++ b/mteb/tasks/Image/ImageClassification/eng/STL10Classification.py @@ -13,7 +13,7 @@ class STL10Classification(AbsTaskImageClassification): "path": "tanganke/stl10", "revision": "49ae7f94508f7feae62baf836db284306eab0b0f", }, 
- type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/SUN397Classification.py b/mteb/tasks/Image/ImageClassification/eng/SUN397Classification.py index d23844ec4f..f7593a3373 100644 --- a/mteb/tasks/Image/ImageClassification/eng/SUN397Classification.py +++ b/mteb/tasks/Image/ImageClassification/eng/SUN397Classification.py @@ -13,7 +13,7 @@ class SUN397Classification(AbsTaskImageClassification): "path": "dpdl-benchmark/sun397", "revision": "7e6af6a2499ad708618be868e1471eac0aca1168", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/StanfordCarsClassification.py b/mteb/tasks/Image/ImageClassification/eng/StanfordCarsClassification.py index e4561b2165..4c049f540d 100644 --- a/mteb/tasks/Image/ImageClassification/eng/StanfordCarsClassification.py +++ b/mteb/tasks/Image/ImageClassification/eng/StanfordCarsClassification.py @@ -13,7 +13,7 @@ class StanfordCarsClassification(AbsTaskImageClassification): "path": "isaacchung/StanfordCars", "revision": "09ffe9bc7864d3f1e851529e5c4b7e05601a04fb", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ImageClassification/eng/UCF101Classification.py b/mteb/tasks/Image/ImageClassification/eng/UCF101Classification.py index ef82d99d9e..41c923b538 100644 --- a/mteb/tasks/Image/ImageClassification/eng/UCF101Classification.py +++ b/mteb/tasks/Image/ImageClassification/eng/UCF101Classification.py @@ -17,7 +17,7 @@ class UCF101Classification(AbsTaskImageClassification): "path": "flwrlabs/ucf101", "revision": "1098eed48f2929443f47c39f3b5c814e16369c11", }, - type="Classification", + type="ImageClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git 
a/mteb/tasks/Image/ImageMultilabelClassification/eng/PascalVOC2007.py b/mteb/tasks/Image/ImageMultilabelClassification/eng/PascalVOC2007.py index fa0628b351..1a02997aec 100644 --- a/mteb/tasks/Image/ImageMultilabelClassification/eng/PascalVOC2007.py +++ b/mteb/tasks/Image/ImageMultilabelClassification/eng/PascalVOC2007.py @@ -16,7 +16,7 @@ class VOC2007Classification(AbsTaskImageMultilabelClassification): "name": "voc2007_main", "revision": "dbafdb9e1506c9c419c5c4672e409463cd21ba50", }, - type="MultilabelClassification", + type="ImageMultilabelClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/VisualSTS/en/STS12VisualSTS.py b/mteb/tasks/Image/VisualSTS/en/STS12VisualSTS.py index 8d78bb7238..c036b54042 100644 --- a/mteb/tasks/Image/VisualSTS/en/STS12VisualSTS.py +++ b/mteb/tasks/Image/VisualSTS/en/STS12VisualSTS.py @@ -13,7 +13,7 @@ class STS12VisualSTS(AbsTaskVisualSTS): }, description="SemEval-2012 Task 6." + "then rendered into images.", reference="https://arxiv.org/abs/2402.08183/", - type="STS", + type="VisualSTS", category="i2i", modalities=["image"], eval_splits=["test"], diff --git a/mteb/tasks/Image/VisualSTS/en/STS13VisualSTS.py b/mteb/tasks/Image/VisualSTS/en/STS13VisualSTS.py index 1b02248d35..cf4c0aa6c4 100644 --- a/mteb/tasks/Image/VisualSTS/en/STS13VisualSTS.py +++ b/mteb/tasks/Image/VisualSTS/en/STS13VisualSTS.py @@ -13,7 +13,7 @@ class STS13VisualSTS(AbsTaskVisualSTS): }, description="SemEval STS 2013 dataset." 
+ "then rendered into images.", reference="https://arxiv.org/abs/2402.08183/", - type="STS", + type="VisualSTS", category="i2i", modalities=["image"], eval_splits=["test"], diff --git a/mteb/tasks/Image/VisualSTS/en/STS14VisualSTS.py b/mteb/tasks/Image/VisualSTS/en/STS14VisualSTS.py index a427fdae0b..46dce36f80 100644 --- a/mteb/tasks/Image/VisualSTS/en/STS14VisualSTS.py +++ b/mteb/tasks/Image/VisualSTS/en/STS14VisualSTS.py @@ -14,7 +14,7 @@ class STS14VisualSTS(AbsTaskVisualSTS): description="SemEval STS 2014 dataset. Currently only the English dataset." + "rendered into images.", reference="https://arxiv.org/abs/2402.08183/", - type="STS", + type="VisualSTS", category="i2i", modalities=["image"], eval_splits=["test"], diff --git a/mteb/tasks/Image/VisualSTS/en/STS15VisualSTS.py b/mteb/tasks/Image/VisualSTS/en/STS15VisualSTS.py index 12c9a74c81..a9aca02c39 100644 --- a/mteb/tasks/Image/VisualSTS/en/STS15VisualSTS.py +++ b/mteb/tasks/Image/VisualSTS/en/STS15VisualSTS.py @@ -13,7 +13,7 @@ class STS15VisualSTS(AbsTaskVisualSTS): }, description="SemEval STS 2015 dataset" + "rendered into images.", reference="https://arxiv.org/abs/2402.08183/", - type="STS", + type="VisualSTS", category="i2i", modalities=["image"], eval_splits=["test"], diff --git a/mteb/tasks/Image/VisualSTS/en/STS16VisualSTS.py b/mteb/tasks/Image/VisualSTS/en/STS16VisualSTS.py index ae1e2900dd..b64e040282 100644 --- a/mteb/tasks/Image/VisualSTS/en/STS16VisualSTS.py +++ b/mteb/tasks/Image/VisualSTS/en/STS16VisualSTS.py @@ -13,7 +13,7 @@ class STS16VisualSTS(AbsTaskVisualSTS): }, description="SemEval STS 2016 dataset" + "rendered into images.", reference="https://arxiv.org/abs/2402.08183/", - type="STS", + type="VisualSTS", category="i2i", modalities=["image"], eval_splits=["test"], diff --git a/mteb/tasks/Image/VisualSTS/multilingual/STS17MultilingualVisualSTS.py b/mteb/tasks/Image/VisualSTS/multilingual/STS17MultilingualVisualSTS.py index dc9e464dcf..b72988676a 100644 --- 
a/mteb/tasks/Image/VisualSTS/multilingual/STS17MultilingualVisualSTS.py +++ b/mteb/tasks/Image/VisualSTS/multilingual/STS17MultilingualVisualSTS.py @@ -33,7 +33,7 @@ class STS17MultilingualVisualSTS(AbsTaskVisualSTS, MultilingualTask): + "rendered into images." ), reference="https://arxiv.org/abs/2402.08183/", - type="STS", + type="VisualSTS", category="i2i", modalities=["image"], eval_splits=_SPLITS, diff --git a/mteb/tasks/Image/VisualSTS/multilingual/STSBenchmarkMultilingualVisualSTS.py b/mteb/tasks/Image/VisualSTS/multilingual/STSBenchmarkMultilingualVisualSTS.py index 8cf063d059..339be27c37 100644 --- a/mteb/tasks/Image/VisualSTS/multilingual/STSBenchmarkMultilingualVisualSTS.py +++ b/mteb/tasks/Image/VisualSTS/multilingual/STSBenchmarkMultilingualVisualSTS.py @@ -34,7 +34,7 @@ class STSBenchmarkMultilingualVisualSTS(AbsTaskVisualSTS, MultilingualTask): + "built upon multi-sts created by Philip May" ), reference="https://arxiv.org/abs/2402.08183/", - type="STS", + type="VisualSTS", category="i2i", modalities=["image"], eval_splits=_SPLITS, diff --git a/mteb/tasks/Image/ZeroshotClassification/eng/Country211.py b/mteb/tasks/Image/ZeroshotClassification/eng/Country211.py index ce3e7657d8..0a60e33003 100644 --- a/mteb/tasks/Image/ZeroshotClassification/eng/Country211.py +++ b/mteb/tasks/Image/ZeroshotClassification/eng/Country211.py @@ -17,7 +17,7 @@ class Country211Classification(AbsTaskZeroshotClassification): "path": "clip-benchmark/wds_country211", "revision": "1699f138f0558342a1cbf99f7cf36b4361bb5ebc", }, - type="Classification", + type="ZeroShotClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ZeroshotClassification/eng/Imagenet1k.py b/mteb/tasks/Image/ZeroshotClassification/eng/Imagenet1k.py index 6c96fad3ab..87dc8e277e 100644 --- a/mteb/tasks/Image/ZeroshotClassification/eng/Imagenet1k.py +++ b/mteb/tasks/Image/ZeroshotClassification/eng/Imagenet1k.py @@ -17,7 +17,7 @@ class 
Imagenet1kClassification(AbsTaskZeroshotClassification): "path": "clip-benchmark/wds_imagenet1k", "revision": "b24c7a5a3ef12df09089055d1795e2ce7c7e7397", }, - type="Classification", + type="ZeroShotClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/mteb/tasks/Image/ZeroshotClassification/eng/UCF101.py b/mteb/tasks/Image/ZeroshotClassification/eng/UCF101.py index 9274e7c1f5..b95021184c 100644 --- a/mteb/tasks/Image/ZeroshotClassification/eng/UCF101.py +++ b/mteb/tasks/Image/ZeroshotClassification/eng/UCF101.py @@ -19,7 +19,7 @@ class UCF101Classification(AbsTaskZeroshotClassification): "path": "flwrlabs/ucf101", "revision": "1098eed48f2929443f47c39f3b5c814e16369c11", }, - type="Classification", + type="ZeroShotClassification", category="i2t", eval_splits=["test"], eval_langs=["eng-Latn"], diff --git a/results-mieb/BAAI__bge-visualized-base/98db10b10d22620010d06f11733346e1c98c34aa/model_meta.json b/results-mieb/BAAI__bge-visualized-base/98db10b10d22620010d06f11733346e1c98c34aa/model_meta.json index 746dfa90fd..a73369f513 100644 --- a/results-mieb/BAAI__bge-visualized-base/98db10b10d22620010d06f11733346e1c98c34aa/model_meta.json +++ b/results-mieb/BAAI__bge-visualized-base/98db10b10d22620010d06f11733346e1c98c34aa/model_meta.json @@ -1 +1 @@ -{"name": "BAAI/bge-visualized", "revision": "98db10b10d22620010d06f11733346e1c98c34aa", "release_date": "2024-06-06", "languages": ["eng_Latn"], "n_parameters": null, "memory_usage": null, "max_tokens": null, "embed_dim": null, "license": null, "open_source": true, "similarity_fn_name": null, "framework": [], "loader": "VisualizedBGEWrapper"} \ No newline at end of file +{"name": "BAAI/bge-visualized-base", "revision": "98db10b10d22620010d06f11733346e1c98c34aa", "release_date": "2024-06-06", "languages": ["eng_Latn"], "n_parameters": null, "memory_usage": null, "max_tokens": null, "embed_dim": null, "license": null, "open_source": true, "similarity_fn_name": null, "framework": [], 
"loader": "vista_loader"}
\ No newline at end of file
diff --git a/results-mieb/BAAI__bge-visualized-m3/98db10b10d22620010d06f11733346e1c98c34aa/model_meta.json b/results-mieb/BAAI__bge-visualized-m3/98db10b10d22620010d06f11733346e1c98c34aa/model_meta.json
index 992116b866..a2b05c9208 100644
--- a/results-mieb/BAAI__bge-visualized-m3/98db10b10d22620010d06f11733346e1c98c34aa/model_meta.json
+++ b/results-mieb/BAAI__bge-visualized-m3/98db10b10d22620010d06f11733346e1c98c34aa/model_meta.json
@@ -1 +1 @@
-{"name": "BAAI/bge-visualized-m3", "revision": "98db10b10d22620010d06f11733346e1c98c34aa", "release_date": "2024-06-06", "languages": ["eng_Latn"], "n_parameters": null, "memory_usage": null, "max_tokens": null, "embed_dim": null, "license": null, "open_source": true, "similarity_fn_name": null, "framework": [], "loader": "VisualizedBGEWrapper"}
\ No newline at end of file
+{"name": "BAAI/bge-visualized-m3", "revision": "98db10b10d22620010d06f11733346e1c98c34aa", "release_date": "2024-06-06", "languages": ["eng_Latn"], "n_parameters": null, "memory_usage": null, "max_tokens": null, "embed_dim": null, "license": null, "open_source": true, "similarity_fn_name": null, "framework": [], "loader": "vista_loader"}
\ No newline at end of file
diff --git a/scripts/run_mieb.py b/scripts/run_mieb.py
new file mode 100644
index 0000000000..8b00d64e9d
--- /dev/null
+++ b/scripts/run_mieb.py
@@ -0,0 +1,50 @@
+"""Evaluate a fixed list of models on the MIEB image task types."""
+
+from __future__ import annotations
+
+import mteb
+
+for model_name in [
+    "openai/clip-vit-base-patch32",
+    "openai/clip-vit-base-patch16",
+    "openai/clip-vit-large-patch14",
+    "royokong/e5-v",
+    "BAAI/bge-visualized-base",
+    "BAAI/bge-visualized-m3",
+    "google/siglip-so400m-patch14-384",
+    "kakaobrain/align-base",
+    "jinaai/jina-clip-v1",
+    "nomic-ai/nomic-embed-vision-v1.5",
+    "Salesforce/blip-image-captioning-large",
+    "Salesforce/blip-image-captioning-base",
+    "Salesforce/blip2-opt-2.7b",
+    "Salesforce/blip2-opt-6.7b-coco",
+    "facebook/dinov2-small",
+    "facebook/dinov2-base",
+    "facebook/dinov2-large",
+    "facebook/dinov2-giant",
+    "laion/CLIP-ViT-B-32-DataComp.XL-s13B-b90K",
+    "laion/CLIP-ViT-B-16-DataComp.XL-s13B-b90K",
+    "laion/CLIP-ViT-L-14-DataComp.XL-s13B-b90K",
+    "nyu-visionx/moco-v3-vit-b",
+    "nyu-visionx/moco-v3-vit-l",
+]:
+    model = mteb.get_model(model_name)
+    # Entries are task *type* names as listed in mteb/abstasks/TaskMetadata.py,
+    # not AbsTask class names. "Any2TextMutipleChoice" is spelled exactly as
+    # that list spells it, so do not "correct" it here.
+    tasks = mteb.get_tasks(
+        task_types=[
+            "Any2AnyRetrieval",
+            "Any2AnyMultiChoice",
+            "Any2TextMutipleChoice",
+            "ImageClustering",
+            "ImageClassification",
+            "ImageMultilabelClassification",
+            "ImageTextPairClassification",
+            "VisualSTS",
+            "ZeroShotClassification",
+        ]
+    )
+    evaluation = mteb.MTEB(tasks=tasks)
+    results = evaluation.run(model, output_folder="results-mieb-final")