NOVADEDOG
diff --git a/‎energy-leaderboard-web/public/data/manifest.json‎
Lines changed: 16 additions & 0 deletions b/‎energy-leaderboard-web/public/data/manifest.json‎
Lines changed: 16 additions & 0 deletions
diff --git a/‎energy-leaderboard-web/public/data/output_gpt-oss-120b_easy_16_12.json‎
Lines changed: 56 additions & 56 deletions b/‎energy-leaderboard-web/public/data/output_gpt-oss-120b_easy_16_12.json‎
Lines changed: 56 additions & 56 deletions
diff --git a/‎energy-leaderboard-web/public/data/output_gpt-oss-120b_hard_16_12.json‎
Lines changed: 69 additions & 69 deletions b/‎energy-leaderboard-web/public/data/output_gpt-oss-120b_hard_16_12.json‎
Lines changed: 69 additions & 69 deletions
diff --git a/‎energy-leaderboard-web/public/data/output_gpt-oss-120b_medium_16_12.json‎
Lines changed: 57 additions & 57 deletions b/‎energy-leaderboard-web/public/data/output_gpt-oss-120b_medium_16_12.json‎
Lines changed: 57 additions & 57 deletions
diff --git a/‎energy-leaderboard-web/public/data/output_gpt-oss-120b_mixed_16_12.json‎
Lines changed: 62 additions & 62 deletions b/‎energy-leaderboard-web/public/data/output_gpt-oss-120b_mixed_16_12.json‎
Lines changed: 62 additions & 62 deletions
diff --git a/‎energy-leaderboard-web/public/data/output_gpt-oss-20b_easy_16_12.json‎
Lines changed: 54 additions & 54 deletions b/‎energy-leaderboard-web/public/data/output_gpt-oss-20b_easy_16_12.json‎
Lines changed: 54 additions & 54 deletions
diff --git a/‎energy-leaderboard-web/public/data/output_gpt-oss-20b_easy_16_12_ollama.json‎
Lines changed: 38 additions & 38 deletions b/‎energy-leaderboard-web/public/data/output_gpt-oss-20b_easy_16_12_ollama.json‎
Lines changed: 38 additions & 38 deletions
@@ -7,6 +7,18 @@
   "output_gemma3_4b_medium_26_11.json",
   "output_gemma3_4b_mixed_02_12.json",
   "output_gemma3_4b_mixed_26_11.json",
+  "output_gpt-oss-120b_easy_16_12.json",
+  "output_gpt-oss-120b_hard_16_12.json",
+  "output_gpt-oss-120b_medium_16_12.json",
+  "output_gpt-oss-120b_mixed_16_12.json",
+  "output_gpt-oss-20b_easy_16_12.json",
+  "output_gpt-oss-20b_easy_16_12_ollama.json",
+  "output_gpt-oss-20b_hard_16_12.json",
+  "output_gpt-oss-20b_hard_16_12_ollama.json",
+  "output_gpt-oss-20b_medium_16_12.json",
+  "output_gpt-oss-20b_medium_16_12_ollama.json",
+  "output_gpt-oss-20b_mixed_16_12.json",
+  "output_gpt-oss-20b_mixed_16_12_ollama.json",
   "output_gpt-oss_20b_easy_02_12.json",
   "output_gpt-oss_20b_hard_02_12.json",
   "output_gpt-oss_20b_medium_02_12.json",
@@ -23,6 +35,10 @@
   "output_llama3_8b_hard_26_11.json",
   "output_llama3_8b_medium_26_11.json",
   "output_llama3_8b_mixed_26_11.json",
+  "output_nemotron-3-nano_easy_16_12_ollama.json",
+  "output_nemotron-3-nano_hard_16_12_ollama.json",
+  "output_nemotron-3-nano_medium_16_12_ollama.json",
+  "output_nemotron-3-nano_mixed_16_12_ollama.json",
   "output_qwen3_8b_easy_02_12.json",
   "output_qwen3_8b_easy_26_11.json",
   "output_qwen3_8b_hard_02_12.json",
 
@@ -13,22 +13,22 @@
     "region": "unknown",
     "notice": null,
     "sampling_ms": 100,
-    "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "device_name": "AMD Radeon Graphics",
     "device_type": "amd",
     "os_name": "Linux",
     "os_version": "6.14.0-37-generic",
     "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S",
-    "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "gpu_model": "AMD Radeon Graphics",
     "ram_gb": 125.1,
     "chip_architecture": "x86_64",
     "testset_id": "ts1",
     "testset_name": "Short factual questions (low energy baseline)",
-    "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.",
+    "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.",
     "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.",
     "question_id": "ts1_q1",
     "question_difficulty": "easy",
     "question_task_type": "qa",
-    "expected_answer_description": "A one\u2011word answer naming Japan\u2019s capital (Tokyo).",
+    "expected_answer_description": "A one‑word answer naming Japan’s capital (Tokyo).",
     "max_output_tokens_hint": 5,
     "energy_relevance": "Very short prompt and answer provide a baseline for minimal energy consumption.",
     "tags": [
@@ -54,17 +54,17 @@
     "region": "unknown",
     "notice": null,
     "sampling_ms": 100,
-    "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "device_name": "AMD Radeon Graphics",
     "device_type": "amd",
     "os_name": "Linux",
     "os_version": "6.14.0-37-generic",
     "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S",
-    "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "gpu_model": "AMD Radeon Graphics",
     "ram_gb": 125.1,
     "chip_architecture": "x86_64",
     "testset_id": "ts1",
     "testset_name": "Short factual questions (low energy baseline)",
-    "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.",
+    "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.",
     "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.",
     "question_id": "ts1_q2",
     "question_difficulty": "easy",
@@ -95,17 +95,17 @@
     "region": "unknown",
     "notice": null,
     "sampling_ms": 100,
-    "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "device_name": "AMD Radeon Graphics",
     "device_type": "amd",
     "os_name": "Linux",
     "os_version": "6.14.0-37-generic",
     "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S",
-    "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "gpu_model": "AMD Radeon Graphics",
     "ram_gb": 125.1,
     "chip_architecture": "x86_64",
     "testset_id": "ts1",
     "testset_name": "Short factual questions (low energy baseline)",
-    "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.",
+    "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.",
     "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.",
     "question_id": "ts1_q3",
     "question_difficulty": "easy",
@@ -136,22 +136,22 @@
     "region": "unknown",
     "notice": null,
     "sampling_ms": 100,
-    "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "device_name": "AMD Radeon Graphics",
     "device_type": "amd",
     "os_name": "Linux",
     "os_version": "6.14.0-37-generic",
     "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S",
-    "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "gpu_model": "AMD Radeon Graphics",
     "ram_gb": 125.1,
     "chip_architecture": "x86_64",
     "testset_id": "ts1",
     "testset_name": "Short factual questions (low energy baseline)",
-    "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.",
+    "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.",
     "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.",
     "question_id": "ts1_q4",
     "question_difficulty": "easy",
     "question_task_type": "qa",
-    "expected_answer_description": "The two\u2011letter chemical formula (H2O).",
+    "expected_answer_description": "The two‑letter chemical formula (H2O).",
     "max_output_tokens_hint": 5,
     "energy_relevance": "Short chemical knowledge question; minimal output.",
     "tags": [
@@ -164,7 +164,7 @@
     "g_co2": 0.017527
   },
   {
-    "prompt": "Who wrote the play \u2018Romeo and Juliet\u2019?",
+    "prompt": "Who wrote the play ‘Romeo and Juliet’?",
     "completion": "",
     "tokens_prompt": 78,
     "tokens_completion": 61,
@@ -177,22 +177,22 @@
     "region": "unknown",
     "notice": null,
     "sampling_ms": 100,
-    "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "device_name": "AMD Radeon Graphics",
     "device_type": "amd",
     "os_name": "Linux",
     "os_version": "6.14.0-37-generic",
     "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S",
-    "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "gpu_model": "AMD Radeon Graphics",
     "ram_gb": 125.1,
     "chip_architecture": "x86_64",
     "testset_id": "ts1",
     "testset_name": "Short factual questions (low energy baseline)",
-    "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.",
+    "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.",
     "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.",
     "question_id": "ts1_q5",
     "question_difficulty": "easy",
     "question_task_type": "qa",
-    "expected_answer_description": "The author\u2019s name (William Shakespeare).",
+    "expected_answer_description": "The author’s name (William Shakespeare).",
     "max_output_tokens_hint": 6,
     "energy_relevance": "Simple fact retrieval; low energy.",
     "tags": [
@@ -218,22 +218,22 @@
     "region": "unknown",
     "notice": null,
     "sampling_ms": 100,
-    "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "device_name": "AMD Radeon Graphics",
     "device_type": "amd",
     "os_name": "Linux",
     "os_version": "6.14.0-37-generic",
     "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S",
-    "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "gpu_model": "AMD Radeon Graphics",
     "ram_gb": 125.1,
     "chip_architecture": "x86_64",
     "testset_id": "ts1",
     "testset_name": "Short factual questions (low energy baseline)",
-    "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.",
+    "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.",
     "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.",
     "question_id": "ts1_q6",
     "question_difficulty": "easy",
     "question_task_type": "qa",
-    "expected_answer_description": "A four\u2011digit year (1969).",
+    "expected_answer_description": "A four‑digit year (1969).",
     "max_output_tokens_hint": 5,
     "energy_relevance": "Short question with numeric answer; minimal compute.",
     "tags": [
@@ -259,22 +259,22 @@
     "region": "unknown",
     "notice": null,
     "sampling_ms": 100,
-    "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "device_name": "AMD Radeon Graphics",
     "device_type": "amd",
     "os_name": "Linux",
     "os_version": "6.14.0-37-generic",
     "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S",
-    "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "gpu_model": "AMD Radeon Graphics",
     "ram_gb": 125.1,
     "chip_architecture": "x86_64",
     "testset_id": "ts1",
     "testset_name": "Short factual questions (low energy baseline)",
-    "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.",
+    "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.",
     "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.",
     "question_id": "ts1_q7",
     "question_difficulty": "easy",
     "question_task_type": "qa",
-    "expected_answer_description": "The element\u2019s name (Carbon).",
+    "expected_answer_description": "The element’s name (Carbon).",
     "max_output_tokens_hint": 5,
     "energy_relevance": "Simple factual recall; low energy cost.",
     "tags": [
@@ -300,24 +300,24 @@
     "region": "unknown",
     "notice": null,
     "sampling_ms": 100,
-    "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "device_name": "AMD Radeon Graphics",
     "device_type": "amd",
     "os_name": "Linux",
     "os_version": "6.14.0-37-generic",
     "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S",
-    "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "gpu_model": "AMD Radeon Graphics",
     "ram_gb": 125.1,
     "chip_architecture": "x86_64",
     "testset_id": "ts1",
     "testset_name": "Short factual questions (low energy baseline)",
-    "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.",
+    "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.",
     "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.",
     "question_id": "ts1_q8",
     "question_difficulty": "easy",
     "question_task_type": "qa",
     "expected_answer_description": "A single integer (7).",
     "max_output_tokens_hint": 4,
-    "energy_relevance": "Basic arithmetic with one\u2011word output.",
+    "energy_relevance": "Basic arithmetic with one‑word output.",
     "tags": [
       "math",
       "numeric",
@@ -341,17 +341,17 @@
     "region": "unknown",
     "notice": null,
     "sampling_ms": 100,
-    "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "device_name": "AMD Radeon Graphics",
     "device_type": "amd",
     "os_name": "Linux",
     "os_version": "6.14.0-37-generic",
     "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S",
-    "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "gpu_model": "AMD Radeon Graphics",
     "ram_gb": 125.1,
     "chip_architecture": "x86_64",
     "testset_id": "ts1",
     "testset_name": "Short factual questions (low energy baseline)",
-    "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.",
+    "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.",
     "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.",
     "question_id": "ts1_q9",
     "question_difficulty": "easy",
@@ -382,24 +382,24 @@
     "region": "unknown",
     "notice": null,
     "sampling_ms": 100,
-    "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "device_name": "AMD Radeon Graphics",
     "device_type": "amd",
     "os_name": "Linux",
     "os_version": "6.14.0-37-generic",
     "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S",
-    "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics",
+    "gpu_model": "AMD Radeon Graphics",
     "ram_gb": 125.1,
     "chip_architecture": "x86_64",
     "testset_id": "ts1",
     "testset_name": "Short factual questions (low energy baseline)",
-    "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.",
+    "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.",
     "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.",
     "question_id": "ts1_q10",
     "question_difficulty": "easy",
     "question_task_type": "qa",
     "expected_answer_description": "The resulting secondary color (purple or violet).",
     "max_output_tokens_hint": 6,
-    "energy_relevance": "Simple fact with one\u2011word answer to establish baseline energy usage.",
+    "energy_relevance": "Simple fact with one‑word answer to establish baseline energy usage.",
     "tags": [
       "color-mixing",
       "factual",