Skip to content

Commit f26e7b7

Browse files
committed
add codemmlu leaderboard
1 parent cb651f2 commit f26e7b7

File tree

2 files changed

+23
-23
lines changed

2 files changed

+23
-23
lines changed

leaderboards/codemmlu/index.html

Lines changed: 20 additions & 20 deletions
Original file line numberDiff line numberDiff line change
@@ -123,9 +123,9 @@ <h3 class="fw-light text-nowrap">
123123
alt="leaderboard"
124124
class="img-fluid"
125125
/></a>
126-
<a href="https://huggingface.co/datasets/Fsoft-AIC/RepoExec"
126+
<a href=""
127127
><img
128-
src="https://img.shields.io/badge/%F0%9F%A4%97%20Datasets-RepoExec-f9a602?style=for-the-badge"
128+
src="https://img.shields.io/badge/%F0%9F%A4%97%20Datasets-CodeMMLU-f9a602?style=for-the-badge"
129129
alt="data"
130130
class="img-fluid"
131131
/></a>
@@ -542,24 +542,24 @@ <h3>🙏 Acknowledgements</h3>
542542
var prompted = row["prompted"];
543543
var opendata = row["open-data"];
544544
var lazy = row["lazy"];
545-
if (prompted) {
546-
// add a symbol to indicate the model is prompted
547-
var promptedSymbol = document.createElement("span");
548-
promptedSymbol.textContent = "✨";
549-
modelCell.appendChild(promptedSymbol);
550-
}
551-
if (opendata.toUpperCase() == "FULL") {
552-
// add a symbol to indicate the model is fully open-sourced
553-
var promptedSymbol = document.createElement("span");
554-
promptedSymbol.textContent = "💚";
555-
modelCell.appendChild(promptedSymbol);
556-
} else if (opendata.toUpperCase() == "PARTIAL") {
557-
// add a symbol to indicate the model is partially open-sourced
558-
// i.e., a subset of the model implementation is close-sourced
559-
var promptedSymbol = document.createElement("span");
560-
promptedSymbol.textContent = "💙";
561-
modelCell.appendChild(promptedSymbol);
562-
}
545+
// if (prompted) {
546+
// // add a symbol to indicate the model is prompted
547+
// var promptedSymbol = document.createElement("span");
548+
// promptedSymbol.textContent = "✨";
549+
// modelCell.appendChild(promptedSymbol);
550+
// }
551+
// if (opendata.toUpperCase() == "FULL") {
552+
// // add a symbol to indicate the model is fully open-sourced
553+
// var promptedSymbol = document.createElement("span");
554+
// promptedSymbol.textContent = "💚";
555+
// modelCell.appendChild(promptedSymbol);
556+
// } else if (opendata.toUpperCase() == "PARTIAL") {
557+
// // add a symbol to indicate the model is partially open-sourced
558+
// // i.e., a subset of the model implementation is close-sourced
559+
// var promptedSymbol = document.createElement("span");
560+
// promptedSymbol.textContent = "💙";
561+
// modelCell.appendChild(promptedSymbol);
562+
// }
563563
dataRow.appendChild(modelCell);
564564
var passCell = document.createElement("td");
565565
passCell.classList.add("text-nowrap");

leaderboards/codemmlu/results.json

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -280,20 +280,20 @@
280280
"complete": 67
281281
},
282282
"prompted": true,
283-
"size": "None",
283+
"size": null,
284284
"direct_complete": false,
285285
"lazy": false,
286286
"elo_mle": 874
287287
},
288288
"GPT-3.5-turbo-0613": {
289289
"link": "",
290-
"open-data": "None",
290+
"open-data": null,
291291
"pass@1": {
292292
"instruct": null,
293293
"complete": 51.7
294294
},
295295
"prompted": true,
296-
"size": "None",
296+
"size": null,
297297
"direct_complete": false,
298298
"lazy": false,
299299
"elo_mle": 874

0 commit comments

Comments
 (0)