Skip to content

Commit 179702e

Browse files
authored
fix miracl loading (#3466)
1 parent ced1c1c commit 179702e

File tree

1 file changed

+2 -6 lines changed

1 file changed

+2 -6 lines changed

mteb/tasks/retrieval/multilingual/miracl_vision_retrieval.py

Lines changed: 2 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -30,7 +30,7 @@
3030
def _load_miracl_data(
3131
path: str,
3232
langs: list,
33-
splits: str,
33+
splits: list[str],
3434
revision: str | None = None,
3535
):
3636
corpus = {lang: dict.fromkeys(splits) for lang in langs}
@@ -108,10 +108,6 @@ def _load_miracl_data(
108108
relevant_docs[lang][split][query_id] = {}
109109
relevant_docs[lang][split][query_id][doc_id] = score
110110

111-
corpus = datasets.DatasetDict(corpus)
112-
queries = datasets.DatasetDict(queries)
113-
relevant_docs = datasets.DatasetDict(relevant_docs)
114-
115111
return corpus, queries, relevant_docs
116112

117113

@@ -156,7 +152,7 @@ def load_data(self) -> None:
156152

157153
self.corpus, self.queries, self.relevant_docs = _load_miracl_data(
158154
path=self.metadata.dataset["path"],
159-
splits=self.metadata.eval_splits[0],
155+
splits=self.metadata.eval_splits,
160156
langs=self.hf_subsets,
161157
revision=self.metadata.dataset["revision"],
162158
)

0 commit comments

Comments (0)