diff --git a/docs/adding_a_dataset.md b/docs/adding_a_dataset.md index 60ca5ceae0..2f34b271b6 100644 --- a/docs/adding_a_dataset.md +++ b/docs/adding_a_dataset.md @@ -100,7 +100,6 @@ class VGClustering(AbsTaskClustering): "revision": "d4c5a8ba10ae71224752c727094ac4c46947fa29", }, date=("2012-01-01", "2020-01-01"), - form="Written", domains=["Academic", "Non-fiction"], task_subtypes=["Scientific Reranking"], license="cc-by-nc-4.0", diff --git a/mteb/models/overview.py b/mteb/models/overview.py index d5ea6a5c55..be4acc6b08 100644 --- a/mteb/models/overview.py +++ b/mteb/models/overview.py @@ -38,6 +38,7 @@ e5_v, evaclip_models, fa_models, + geogpt_models, gme_v_models, google_models, gritlm_models, @@ -91,7 +92,6 @@ voyage_models, voyage_v, xyz_models, - geogpt_models, ) logger = logging.getLogger(__name__) diff --git a/mteb/tasks/Clustering/deu/BlurbsClusteringP2P.py b/mteb/tasks/Clustering/deu/BlurbsClusteringP2P.py index 859b13f5a7..c442ba1e38 100644 --- a/mteb/tasks/Clustering/deu/BlurbsClusteringP2P.py +++ b/mteb/tasks/Clustering/deu/BlurbsClusteringP2P.py @@ -25,7 +25,6 @@ class BlurbsClusteringP2P(AbsTaskClustering): eval_langs=["deu-Latn"], main_score="v_measure", date=None, - form=None, domains=["Written"], task_subtypes=None, license=None, diff --git a/mteb/tasks/Clustering/deu/BlurbsClusteringS2S.py b/mteb/tasks/Clustering/deu/BlurbsClusteringS2S.py index 354efa59ec..b4c5cafe22 100644 --- a/mteb/tasks/Clustering/deu/BlurbsClusteringS2S.py +++ b/mteb/tasks/Clustering/deu/BlurbsClusteringS2S.py @@ -33,7 +33,6 @@ class BlurbsClusteringS2S(AbsTaskClustering): eval_langs=["deu-Latn"], main_score="v_measure", date=None, - form=None, domains=["Written"], task_subtypes=None, license=None, diff --git a/mteb/tasks/Clustering/deu/TenKGnadClusteringS2S.py b/mteb/tasks/Clustering/deu/TenKGnadClusteringS2S.py index d4ac2f2581..4acb4ba840 100644 --- a/mteb/tasks/Clustering/deu/TenKGnadClusteringS2S.py +++ b/mteb/tasks/Clustering/deu/TenKGnadClusteringS2S.py @@ -23,7 +23,6 @@ class TenKGnadClusteringS2S(AbsTaskClustering): eval_langs=["deu-Latn"], main_score="v_measure", date=None, - form=None, domains=["News", "Non-fiction", "Written"], task_subtypes=["Topic classification"], license=None, diff --git a/mteb/tasks/Clustering/fra/AlloProfClusteringP2P.py b/mteb/tasks/Clustering/fra/AlloProfClusteringP2P.py index 83a22953fb..22a061d7d3 100644 --- a/mteb/tasks/Clustering/fra/AlloProfClusteringP2P.py +++ b/mteb/tasks/Clustering/fra/AlloProfClusteringP2P.py @@ -31,7 +31,6 @@ class AlloProfClusteringP2P(AbsTaskClustering): eval_langs=["fra-Latn"], main_score="v_measure", date=("1996-01-01", "2023-04-14"), - form=None, domains=["Encyclopaedic", "Written"], task_subtypes=["Thematic clustering"], license="mit", diff --git a/mteb/tasks/Clustering/fra/AlloProfClusteringS2S.py b/mteb/tasks/Clustering/fra/AlloProfClusteringS2S.py index 349faaec7f..058dbeb13b 100644 --- a/mteb/tasks/Clustering/fra/AlloProfClusteringS2S.py +++ b/mteb/tasks/Clustering/fra/AlloProfClusteringS2S.py @@ -31,7 +31,6 @@ class AlloProfClusteringS2S(AbsTaskClustering): eval_langs=["fra-Latn"], main_score="v_measure", date=("1996-01-01", "2023-04-14"), - form=None, domains=["Encyclopaedic", "Written"], task_subtypes=["Thematic clustering"], license="mit", diff --git a/mteb/tasks/Clustering/fra/HALClusteringS2S.py b/mteb/tasks/Clustering/fra/HALClusteringS2S.py index eaeb4924a0..5a75d26ad5 100644 --- a/mteb/tasks/Clustering/fra/HALClusteringS2S.py +++ b/mteb/tasks/Clustering/fra/HALClusteringS2S.py @@ -33,7 +33,6 @@ class HALClusteringS2S(AbsTaskClustering): eval_langs=["fra-Latn"], main_score="v_measure", date=("2000-03-29", "2024-05-24"), - form=None, domains=["Academic", "Written"], task_subtypes=["Thematic clustering"], license="apache-2.0", diff --git a/mteb/tasks/Clustering/zho/CMTEBClustering.py b/mteb/tasks/Clustering/zho/CMTEBClustering.py index 24ea372983..259688f896 100644 --- a/mteb/tasks/Clustering/zho/CMTEBClustering.py +++ b/mteb/tasks/Clustering/zho/CMTEBClustering.py @@ -149,7 +149,6 @@ class CLSClusteringS2S(AbsTaskClustering): eval_langs=["cmn-Hans"], main_score="v_measure", date=None, - form=None, domains=None, task_subtypes=None, license=None, @@ -185,7 +184,6 @@ class CLSClusteringP2P(AbsTaskClustering): eval_langs=["cmn-Hans"], main_score="v_measure", date=None, - form=None, domains=None, task_subtypes=None, license=None, @@ -339,7 +337,6 @@ class ThuNewsClusteringS2S(AbsTaskClustering): eval_langs=["cmn-Hans"], main_score="v_measure", date=None, - form=None, domains=None, task_subtypes=None, license=None, @@ -383,7 +380,6 @@ class ThuNewsClusteringP2P(AbsTaskClustering): eval_langs=["cmn-Hans"], main_score="v_measure", date=None, - form=None, domains=None, task_subtypes=None, license=None, diff --git a/mteb/tasks/Reranking/zho/CMTEBReranking.py b/mteb/tasks/Reranking/zho/CMTEBReranking.py index 2ad84444b2..a570bd3efb 100644 --- a/mteb/tasks/Reranking/zho/CMTEBReranking.py +++ b/mteb/tasks/Reranking/zho/CMTEBReranking.py @@ -20,7 +20,6 @@ class T2Reranking(AbsTaskReranking): eval_langs=["cmn-Hans"], main_score="map", date=None, - form=None, domains=[], task_subtypes=None, license="not specified", @@ -57,7 +56,6 @@ class MMarcoReranking(AbsTaskReranking): eval_langs=["cmn-Hans"], main_score="map", date=None, - form=None, domains=None, task_subtypes=None, license=None, @@ -133,7 +131,6 @@ class CMedQAv2(AbsTaskReranking): eval_langs=["cmn-Hans"], main_score="map", date=None, - form=None, domains=["Medical", "Written"], task_subtypes=None, license=None, diff --git a/mteb/tasks/Retrieval/zho/CMTEBRetrieval.py b/mteb/tasks/Retrieval/zho/CMTEBRetrieval.py index dd158e2858..610eff188c 100644 --- a/mteb/tasks/Retrieval/zho/CMTEBRetrieval.py +++ b/mteb/tasks/Retrieval/zho/CMTEBRetrieval.py @@ -278,6 +278,7 @@ class CmedqaRetrieval(AbsTaskRetrieval): prompt={ "query": "Given a Chinese community medical question, retrieve replies that best answer the question" }, + adapted_from=["CMedQAv2-reranking"], ) def load_data(self, **kwargs):