diff --git a/mteb/tasks/Retrieval/deu/GermanDPRRetrieval.py b/mteb/tasks/Retrieval/deu/GermanDPRRetrieval.py
index 5290ae6aa8..73c2f53839 100644
--- a/mteb/tasks/Retrieval/deu/GermanDPRRetrieval.py
+++ b/mteb/tasks/Retrieval/deu/GermanDPRRetrieval.py
@@ -83,6 +83,14 @@ def load_data(self, **kwargs):
             )
             corpus.update(neg_docs)
             relevant_docs[q_id] = {k: 1 for k in pos_docs}
+        # Flatten each document record to a single "title text" string.
+        # `corpus` is filled via `corpus.update(...)`, so iterating it directly
+        # yields its keys rather than the records; walk `.items()` and keep the
+        # existing key, which is the same id space `relevant_docs` refers to.
+        # NOTE(review): assumes every value is a mapping with "text" and an
+        # optional "title" -- confirm against the helper that builds the docs.
+        corpus = {
+            doc_id: doc.get("title", "") + " " + doc["text"]
+            for doc_id, doc in corpus.items()
+        }
         self.queries = {self._EVAL_SPLIT: queries}
         self.corpus = {self._EVAL_SPLIT: corpus}
         self.relevant_docs = {self._EVAL_SPLIT: relevant_docs}