Skip to content

Commit 02023dd

Browse files
authored
add grok, sonnet, o1-preview
1 parent 970429d commit 02023dd

File tree

1 file changed

+36
-0
lines changed

1 file changed

+36
-0
lines changed

results.json

Lines changed: 36 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -371,6 +371,42 @@
371371
"prompted": true,
372372
"size": 7.0
373373
},
374+
"Claude Sonnet 3.5 (June 2024)": {
375+
"link": "https://www.anthropic.com/news/claude-3-5-sonnet",
376+
"open-data": "NONE",
377+
"pass@1": {
378+
"humaneval": 87.2,
379+
"humaneval+": 81.7,
380+
"mbpp": 89.4,
381+
"mbpp+": 74.3
382+
},
383+
"prompted": true,
384+
"size": null
385+
},
386+
"Grok Beta": {
387+
"link": "https://x.ai/blog/grok-2",
388+
"open-data": "NONE",
389+
"pass@1": {
390+
"humaneval": 88.4,
391+
"humaneval+": 80.5,
392+
"mbpp": 86.0,
393+
"mbpp+": 65.6
394+
},
395+
"prompted": true,
396+
"size": null
397+
},
398+
"O1 Preview (Sept 2024)": {
399+
"link": "https://platform.openai.com/docs/models/",
400+
"open-data": "NONE",
401+
"pass@1": {
402+
"humaneval": 96.3,
403+
"humaneval+": 89.0,
404+
"mbpp": 95.5,
405+
"mbpp+": 80.2
406+
},
407+
"prompted": true,
408+
"size": null
409+
},
374410
"O1 Mini (Sept 2024)": {
375411
"link": "https://platform.openai.com/docs/models/",
376412
"open-data": "NONE",

0 commit comments

Comments
 (0)