Skip to content

Commit effc006

Browse files
authored
update scores using latest versions
1 parent 253cadb commit effc006

File tree

1 file changed

+21
-21
lines changed

1 file changed

+21
-21
lines changed

results.json

Lines changed: 21 additions & 21 deletions
Original file line numberDiff line numberDiff line change
@@ -291,8 +291,8 @@
291291
"link": "https://huggingface.co/deepseek-ai/deepseek-coder-1.3b-instruct",
292292
"open-data": "NONE",
293293
"pass@1": {
294-
"humaneval": 65.2,
295-
"humaneval+": 59.8,
294+
"humaneval": 65.9,
295+
"humaneval+": 60.4,
296296
"mbpp": 65.3,
297297
"mbpp+": 54.8
298298
},
@@ -318,7 +318,7 @@
318318
"humaneval": 81.1,
319319
"humaneval+": 75.0,
320320
"mbpp": 80.4,
321-
"mbpp+": 70.7
321+
"mbpp+": 70.1
322322
},
323323
"prompted": true,
324324
"size": 33.0
@@ -339,8 +339,8 @@
339339
"link": "https://huggingface.co/deepseek-ai/deepseek-coder-6.7b-instruct",
340340
"open-data": "NONE",
341341
"pass@1": {
342-
"humaneval": 73.8,
343-
"humaneval+": 70.7,
342+
"humaneval": 74.4,
343+
"humaneval+": 71.3,
344344
"mbpp": 74.9,
345345
"mbpp+": 65.6
346346
},
@@ -567,8 +567,8 @@
567567
"link": "https://mistral.ai/news/mistral-large/",
568568
"open-data": "NONE",
569569
"pass@1": {
570-
"humaneval": 70.7,
571-
"humaneval+": 63.4,
570+
"humaneval": 69.5,
571+
"humaneval+": 62.2,
572572
"mbpp": 72.8,
573573
"mbpp+": 59.5
574574
},
@@ -663,8 +663,8 @@
663663
"link": "https://huggingface.co/openchat/openchat-3.5-0106",
664664
"open-data": "Partial",
665665
"pass@1": {
666-
"humaneval": 72.0,
667-
"humaneval+": 67.1,
666+
"humaneval": 72.6,
667+
"humaneval+": 67.7,
668668
"mbpp": 63.8,
669669
"mbpp+": 54.5
670670
},
@@ -747,8 +747,8 @@
747747
"link": "https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0",
748748
"open-data": "Partial",
749749
"pass@1": {
750-
"humaneval": 42.1,
751-
"humaneval+": 35.4,
750+
"humaneval": 43.3,
751+
"humaneval+": 37.2,
752752
"mbpp": 43.9,
753753
"mbpp+": 36.2
754754
},
@@ -927,8 +927,8 @@
927927
"link": "https://huggingface.co/WizardLM/WizardCoder-15B-V1.0",
928928
"open-data": "NONE",
929929
"pass@1": {
930-
"humaneval": 57.3,
931-
"humaneval+": 51.8,
930+
"humaneval": 56.7,
931+
"humaneval+": 50.6,
932932
"mbpp": 64.3,
933933
"mbpp+": 54.2
934934
},
@@ -963,8 +963,8 @@
963963
"link": "https://huggingface.co/WizardLM/WizardCoder-Python-7B-V1.0",
964964
"open-data": "NONE",
965965
"pass@1": {
966-
"humaneval": 48.2,
967-
"humaneval+": 42.7,
966+
"humaneval": 50.6,
967+
"humaneval+": 45.1,
968968
"mbpp": 58.5,
969969
"mbpp+": 49.5
970970
},
@@ -1024,7 +1024,7 @@
10241024
"open-data": "NONE",
10251025
"pass@1": {
10261026
"humaneval": 82.9,
1027-
"humaneval+": 76.8,
1027+
"humaneval+": 77.4,
10281028
"mbpp": 89.4,
10291029
"mbpp+": 73.3
10301030
},
@@ -1036,7 +1036,7 @@
10361036
"open-data": "NONE",
10371037
"pass@1": {
10381038
"humaneval": 70.7,
1039-
"humaneval+": 63.4,
1039+
"humaneval+": 64.0,
10401040
"mbpp": 83.6,
10411041
"mbpp+": 69.3
10421042
},
@@ -1203,7 +1203,7 @@
12031203
"link": "https://huggingface.co/microsoft/phi-2",
12041204
"open-data": "NONE",
12051205
"pass@1": {
1206-
"humaneval": 48.8,
1206+
"humaneval": 49.4,
12071207
"humaneval+": 45.1,
12081208
"mbpp": 64.0,
12091209
"mbpp+": 54.2
@@ -1216,7 +1216,7 @@
12161216
"open-data": "Partial",
12171217
"pass@1": {
12181218
"humaneval": 48.2,
1219-
"humaneval+": 40.9,
1219+
"humaneval+": 41.5,
12201220
"mbpp": 57.4,
12211221
"mbpp+": 48.7
12221222
},
@@ -1287,7 +1287,7 @@
12871287
"link": "https://huggingface.co/stabilityai/stable-code-3b",
12881288
"open-data": "Full",
12891289
"pass@1": {
1290-
"humaneval": 28.7,
1290+
"humaneval": 29.3,
12911291
"humaneval+": 25.6,
12921292
"mbpp": 54.8,
12931293
"mbpp+": 45.8
@@ -1300,7 +1300,7 @@
13001300
"open-data": "Partial",
13011301
"pass@1": {
13021302
"humaneval": 40.2,
1303-
"humaneval+": 33.5,
1303+
"humaneval+": 32.9,
13041304
"mbpp": 50.3,
13051305
"mbpp+": 41.3
13061306
},

0 commit comments

Comments
 (0)