evalplus: add llama 3.1 8b

ganler · web-flow · commit d3d769b09250 · 2024-11-10T08:42:37.000-06:00
diff --git a/leaderboard.html b/leaderboard.html
@@ -93,7 +93,7 @@ <h1 class="text-nowrap mt-5">🏆 EvalPlus Leaderboard 🏆</h1>
     <h3 class="fw-light text-nowrap">
       <small id="warning">EvalPlus evaluates AI Coders with rigorous tests.<br /></small>
     </h3>
-    <p>📢 Beyond correctness, how's their code efficiency? Checkout <a href="./evalperf.html">🚀EvalPerf</a>!</p>
+    <p>📢 News: Beyond correctness, how's their code efficiency? Check out <a href="./evalperf.html">🚀EvalPerf</a>!</p>
     <div class="d-flex flex-row justify-content-center gap-3">
       <a href="https://github.com/evalplus/evalplus"><img
           src="https://img.shields.io/badge/github-%23121011.svg?style=for-the-badge&logo=github&logoColor=white"
diff --git a/results.json b/results.json
@@ -527,6 +527,18 @@
     "prompted": false,
     "size": 8.0
   },
+  "Llama3.1-8B-instruct": {
+    "link": "https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct",
+    "open-data": "NONE",
+    "pass@1": {
+      "humaneval": 69.5,
+      "humaneval+": 62.8,
+      "mbpp": 66.4,
+      "mbpp+": 54.0
+    },
+    "prompted": true,
+    "size": 8.0
+  },
   "Llama3-8B-instruct": {
     "link": "https://huggingface.co/meta-llama/Meta-Llama-3-8B-Instruct",
     "open-data": "NONE",