Merged
README.md — 21 changes: 14 additions & 7 deletions

@@ -38,7 +38,7 @@ pip install mteb
 
 ## Usage
 
-* Using a python script (see [scripts/run_mteb_english.py](https://github.com/embeddings-benchmark/mteb/blob/main/scripts/run_mteb_english.py) and [mteb/mtebscripts](https://github.com/embeddings-benchmark/mtebscripts) for more):
+* Using a python script:
 
 ```python
 import mteb
@@ -77,11 +77,11 @@ Click on each section below to see the details.
 <br />
 
 <details>
-<summary> Dataset selection </summary>
+<summary> Task selection </summary>
 
-### Dataset selection
+### Task selection
 
-Datasets can be selected by providing the list of datasets, but also
+Tasks can be selected by providing the list of datasets, but also
 
 * by their task (e.g. "Clustering" or "Classification")
 
@@ -121,11 +121,18 @@ evaluation = mteb.MTEB(tasks=[
 # for an example of a HF subset see "Subset" in the dataset viewer at: https://huggingface.co/datasets/mteb/bucc-bitext-mining
 ```
 
-There are also presets available for certain task collections, e.g. to select the 56 English datasets that form the "Overall MTEB English leaderboard":
+</details>
+
+<details>
+<summary> Running a benchmark </summary>
+
+`mteb` comes with a set of predefined benchmarks. These can be fetched using `get_benchmark` and run in a similar fashion to other sets of tasks.
+For instance to select the 56 English datasets that form the "Overall MTEB English leaderboard":
 
 ```python
-from mteb import MTEB_MAIN_EN
-evaluation = mteb.MTEB(tasks=MTEB_MAIN_EN, task_langs=["en"])
+import mteb
+mteb_eng = mteb.get_benchmark("MTEB(eng)")
+evaluation = mteb.MTEB(tasks=mteb_eng, eval_splits=["test"])
 ```
 
 </details>
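The README change above introduces `get_benchmark`, which fetches a predefined benchmark by name. As a rough illustration of the name-to-object lookup pattern such a helper implies — a hypothetical sketch, not mteb's actual implementation; the `Benchmark` fields, registry, and task names below are invented:

```python
from dataclasses import dataclass, field


# Hypothetical sketch of a get_benchmark-style lookup: named benchmarks
# live in a registry dict and are fetched by their display name.
@dataclass
class Benchmark:
    name: str
    tasks: list[str] = field(default_factory=list)


_REGISTRY: dict[str, Benchmark] = {}


def register(benchmark: Benchmark) -> Benchmark:
    """Add a benchmark to the registry so it can be fetched by name."""
    _REGISTRY[benchmark.name] = benchmark
    return benchmark


def get_benchmark(name: str) -> Benchmark:
    """Fetch a registered benchmark, with a helpful error for unknown names."""
    try:
        return _REGISTRY[name]
    except KeyError:
        raise KeyError(
            f"Unknown benchmark {name!r}; available: {sorted(_REGISTRY)}"
        ) from None


register(Benchmark(name="MTEB(eng)", tasks=["Banking77Classification", "STSBenchmark"]))
print(get_benchmark("MTEB(eng)").tasks)
```

A registry keyed by display name also makes the failure mode friendly: an unknown name can report the valid choices instead of failing with a bare `KeyError`.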
mteb/__init__.py — 6 changes: 4 additions & 2 deletions

@@ -2,7 +2,7 @@
 
 from importlib.metadata import version
 
-from mteb.benchmarks import (
+from mteb.benchmarks.benchmarks import (
     MTEB_MAIN_EN,
     MTEB_MAIN_RU,
     MTEB_RETRIEVAL_LAW,
@@ -14,7 +14,8 @@
 from mteb.models import get_model, get_model_meta
 from mteb.overview import TASKS_REGISTRY, get_task, get_tasks
 
-from .benchmarks import Benchmark
+from .benchmarks.benchmarks import Benchmark
+from .benchmarks.get_benchmark import get_benchmark
 
 __version__ = version("mteb")  # fetch version from install metadata
 
@@ -32,4 +33,5 @@
     "get_model_meta",
     "load_results",
     "Benchmark",
+    "get_benchmark",
 ]
mteb/benchmarks/__init__.py — 3 changes: 3 additions & 0 deletions

@@ -0,0 +1,3 @@
+from __future__ import annotations
+
+from mteb.benchmarks.benchmarks import *
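The new `mteb/benchmarks/__init__.py` turns `benchmarks` into a package that re-exports everything from the inner `benchmarks.py` module via a star import, so existing `from mteb.benchmarks import ...` calls keep resolving after the code move. A star import copies exactly the names a module lists in `__all__`; a self-contained sketch of that behavior (the module below is synthetic, not mteb's):

```python
import sys
import types

# Build a throwaway module standing in for the inner benchmarks module;
# its __all__ controls what `from ... import *` re-exports.
mod = types.ModuleType("demo_benchmarks")
exec(
    "__all__ = ['Benchmark', 'MTEB_MAIN_EN']\n"
    "class Benchmark:\n"
    "    pass\n"
    "MTEB_MAIN_EN = ['TaskA', 'TaskB']\n"
    "_internal = 'not exported'\n",
    mod.__dict__,
)
sys.modules["demo_benchmarks"] = mod

# Simulate the package __init__ doing a star import of the inner module.
ns = {}
exec("from demo_benchmarks import *", ns)

exported = sorted(n for n in ns if not n.startswith("__"))
print(exported)  # ['Benchmark', 'MTEB_MAIN_EN'] — only the names in __all__
```

Note that `_internal` is left out: star import skips names not listed in `__all__` (and underscore-prefixed names when `__all__` is absent), which is why the re-exporting `__init__.py` preserves the public API without leaking private helpers.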