Skip to content

Commit 96f639b

Browse files
fix: Fixed eval split for MultilingualSentiment in C-MTEB (#1804)
* Fixed eval split for MultilingualSentiment in C-MTEB
* Fixed splits for ATEC, BQ and STSB in C-MTEB
1 parent b4d0eaa commit 96f639b

File tree

1 file changed

+41
-34
lines changed

1 file changed

+41
-34
lines changed

mteb/benchmarks/benchmarks.py

Lines changed: 41 additions & 34 deletions
Original file line number | Diff line number | Diff line change
@@ -1152,40 +1152,47 @@ def load_results(
11521152

11531153
C_MTEB = Benchmark(
11541154
name="MTEB(Chinese)",
1155-
tasks=get_tasks(
1156-
tasks=[
1157-
"T2Retrieval",
1158-
"MMarcoRetrieval",
1159-
"DuRetrieval",
1160-
"CovidRetrieval",
1161-
"CmedqaRetrieval",
1162-
"EcomRetrieval",
1163-
"MedicalRetrieval",
1164-
"VideoRetrieval",
1165-
"T2Reranking",
1166-
"MMarcoReranking",
1167-
"CMedQAv1-reranking",
1168-
"CMedQAv2-reranking",
1169-
"Ocnli",
1170-
"Cmnli",
1171-
"CLSClusteringS2S",
1172-
"CLSClusteringP2P",
1173-
"ThuNewsClusteringS2S",
1174-
"ThuNewsClusteringP2P",
1175-
"ATEC",
1176-
"BQ",
1177-
"LCQMC",
1178-
"PAWSX",
1179-
"STSB",
1180-
"AFQMC",
1181-
"QBQTC",
1182-
"TNews",
1183-
"IFlyTek",
1184-
"Waimai",
1185-
"OnlineShopping",
1186-
"MultilingualSentiment",
1187-
"JDReview",
1188-
],
1155+
tasks=MTEBTasks(
1156+
get_tasks(
1157+
tasks=[
1158+
"T2Retrieval",
1159+
"MMarcoRetrieval",
1160+
"DuRetrieval",
1161+
"CovidRetrieval",
1162+
"CmedqaRetrieval",
1163+
"EcomRetrieval",
1164+
"MedicalRetrieval",
1165+
"VideoRetrieval",
1166+
"T2Reranking",
1167+
"MMarcoReranking",
1168+
"CMedQAv1-reranking",
1169+
"CMedQAv2-reranking",
1170+
"Ocnli",
1171+
"Cmnli",
1172+
"CLSClusteringS2S",
1173+
"CLSClusteringP2P",
1174+
"ThuNewsClusteringS2S",
1175+
"ThuNewsClusteringP2P",
1176+
"LCQMC",
1177+
"PAWSX",
1178+
"AFQMC",
1179+
"QBQTC",
1180+
"TNews",
1181+
"IFlyTek",
1182+
"Waimai",
1183+
"OnlineShopping",
1184+
"JDReview",
1185+
],
1186+
)
1187+
+ get_tasks(tasks=["MultilingualSentiment"], eval_splits=["test"])
1188+
+ get_tasks(
1189+
tasks=[
1190+
"ATEC",
1191+
"BQ",
1192+
"STSB",
1193+
],
1194+
eval_splits=["validation"],
1195+
)
11891196
),
11901197
description="The Chinese Massive Text Embedding Benchmark (C-MTEB) is a comprehensive benchmark for Chinese text embeddings covering 6 tasks and 35 datasets.",
11911198
reference="https://github.com/FlagOpen/FlagEmbedding/tree/master/research/C_MTEB",

0 commit comments

Comments
 (0)