Skip to content

Commit 56ce8f1

Browse files
authored
evalplus: update
1 parent 052c968 commit 56ce8f1

File tree

2 files changed

+19
-7
lines changed

2 files changed

+19
-7
lines changed

leaderboard.html

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -167,7 +167,7 @@ <h3>📝 Notes</h3>
167167
<a href="https://github.com/evalplus/humanevalplus_release"
168168
>HumanEval+</a
169169
>
170-
version 0.1.9;
170+
version 0.1.10;
171171
<a href="https://github.com/evalplus/mbppplus_release">MBPP+</a>
172172
version 0.2.0.
173173
</li>

results.json

Lines changed: 18 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -531,20 +531,20 @@
531531
"link": "https://huggingface.co/microsoft/wavecoder-ultra-6.7b",
532532
"open-data": "NONE",
533533
"pass@1": {
534-
"humaneval": 73.8,
535-
"humaneval+": 67.1,
536-
"mbpp": 77.5,
537-
"mbpp+": 65.1
534+
"humaneval": 75.0,
535+
"humaneval+": 69.5,
536+
"mbpp": 74.9,
537+
"mbpp+": 63.5
538538
},
539-
"prompted": false,
539+
"prompted": true,
540540
"size": 7.0
541541
},
542542
"Magicoder-S-CL-7B": {
543543
"link": "https://huggingface.co/ise-uiuc/Magicoder-S-CL-7B",
544544
"open-data": "Partial",
545545
"pass@1": {
546546
"humaneval": 70.7,
547-
"humaneval+": 67.1,
547+
"humaneval+": 67.7,
548548
"mbpp": 70.6,
549549
"mbpp+": 60.1
550550
},
@@ -1187,6 +1187,18 @@
11871187
"prompted": true,
11881188
"size": 7.0
11891189
},
1190+
"Phi-3-mini-4k-instruct": {
1191+
"link": "https://huggingface.co/microsoft/Phi-3-mini-4k-instruct",
1192+
"open-data": "NONE",
1193+
"pass@1": {
1194+
"humaneval": 64.6,
1195+
"humaneval+": 59.1,
1196+
"mbpp": 65.9,
1197+
"mbpp+": 54.2
1198+
},
1199+
"prompted": true,
1200+
"size": 3.8
1201+
},
11901202
"phi-2-2.7B": {
11911203
"link": "https://huggingface.co/microsoft/phi-2",
11921204
"open-data": "NONE",

0 commit comments

Comments
 (0)