|
13 | 13 | "region": "unknown", |
14 | 14 | "notice": null, |
15 | 15 | "sampling_ms": 100, |
16 | | - "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 16 | + "device_name": "AMD Radeon Graphics", |
17 | 17 | "device_type": "amd", |
18 | 18 | "os_name": "Linux", |
19 | 19 | "os_version": "6.14.0-37-generic", |
20 | 20 | "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S", |
21 | | - "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 21 | + "gpu_model": "AMD Radeon Graphics", |
22 | 22 | "ram_gb": 125.1, |
23 | 23 | "chip_architecture": "x86_64", |
24 | 24 | "testset_id": "ts1", |
25 | 25 | "testset_name": "Short factual questions (low energy baseline)", |
26 | | - "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.", |
| 26 | + "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.", |
27 | 27 | "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.", |
28 | 28 | "question_id": "ts1_q1", |
29 | 29 | "question_difficulty": "easy", |
30 | 30 | "question_task_type": "qa", |
31 | | - "expected_answer_description": "A one\u2011word answer naming Japan\u2019s capital (Tokyo).", |
| 31 | + "expected_answer_description": "A one‑word answer naming Japan’s capital (Tokyo).", |
32 | 32 | "max_output_tokens_hint": 5, |
33 | 33 | "energy_relevance": "Very short prompt and answer provide a baseline for minimal energy consumption.", |
34 | 34 | "tags": [ |
|
54 | 54 | "region": "unknown", |
55 | 55 | "notice": null, |
56 | 56 | "sampling_ms": 100, |
57 | | - "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 57 | + "device_name": "AMD Radeon Graphics", |
58 | 58 | "device_type": "amd", |
59 | 59 | "os_name": "Linux", |
60 | 60 | "os_version": "6.14.0-37-generic", |
61 | 61 | "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S", |
62 | | - "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 62 | + "gpu_model": "AMD Radeon Graphics", |
63 | 63 | "ram_gb": 125.1, |
64 | 64 | "chip_architecture": "x86_64", |
65 | 65 | "testset_id": "ts1", |
66 | 66 | "testset_name": "Short factual questions (low energy baseline)", |
67 | | - "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.", |
| 67 | + "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.", |
68 | 68 | "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.", |
69 | 69 | "question_id": "ts1_q2", |
70 | 70 | "question_difficulty": "easy", |
|
95 | 95 | "region": "unknown", |
96 | 96 | "notice": null, |
97 | 97 | "sampling_ms": 100, |
98 | | - "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 98 | + "device_name": "AMD Radeon Graphics", |
99 | 99 | "device_type": "amd", |
100 | 100 | "os_name": "Linux", |
101 | 101 | "os_version": "6.14.0-37-generic", |
102 | 102 | "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S", |
103 | | - "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 103 | + "gpu_model": "AMD Radeon Graphics", |
104 | 104 | "ram_gb": 125.1, |
105 | 105 | "chip_architecture": "x86_64", |
106 | 106 | "testset_id": "ts1", |
107 | 107 | "testset_name": "Short factual questions (low energy baseline)", |
108 | | - "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.", |
| 108 | + "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.", |
109 | 109 | "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.", |
110 | 110 | "question_id": "ts1_q3", |
111 | 111 | "question_difficulty": "easy", |
|
136 | 136 | "region": "unknown", |
137 | 137 | "notice": null, |
138 | 138 | "sampling_ms": 100, |
139 | | - "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 139 | + "device_name": "AMD Radeon Graphics", |
140 | 140 | "device_type": "amd", |
141 | 141 | "os_name": "Linux", |
142 | 142 | "os_version": "6.14.0-37-generic", |
143 | 143 | "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S", |
144 | | - "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 144 | + "gpu_model": "AMD Radeon Graphics", |
145 | 145 | "ram_gb": 125.1, |
146 | 146 | "chip_architecture": "x86_64", |
147 | 147 | "testset_id": "ts1", |
148 | 148 | "testset_name": "Short factual questions (low energy baseline)", |
149 | | - "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.", |
| 149 | + "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.", |
150 | 150 | "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.", |
151 | 151 | "question_id": "ts1_q4", |
152 | 152 | "question_difficulty": "easy", |
153 | 153 | "question_task_type": "qa", |
154 | | - "expected_answer_description": "The two\u2011letter chemical formula (H2O).", |
| 154 | + "expected_answer_description": "The two‑letter chemical formula (H2O).", |
155 | 155 | "max_output_tokens_hint": 5, |
156 | 156 | "energy_relevance": "Short chemical knowledge question; minimal output.", |
157 | 157 | "tags": [ |
|
164 | 164 | "g_co2": 0.017527 |
165 | 165 | }, |
166 | 166 | { |
167 | | - "prompt": "Who wrote the play \u2018Romeo and Juliet\u2019?", |
| 167 | + "prompt": "Who wrote the play ‘Romeo and Juliet’?", |
168 | 168 | "completion": "", |
169 | 169 | "tokens_prompt": 78, |
170 | 170 | "tokens_completion": 61, |
|
177 | 177 | "region": "unknown", |
178 | 178 | "notice": null, |
179 | 179 | "sampling_ms": 100, |
180 | | - "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 180 | + "device_name": "AMD Radeon Graphics", |
181 | 181 | "device_type": "amd", |
182 | 182 | "os_name": "Linux", |
183 | 183 | "os_version": "6.14.0-37-generic", |
184 | 184 | "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S", |
185 | | - "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 185 | + "gpu_model": "AMD Radeon Graphics", |
186 | 186 | "ram_gb": 125.1, |
187 | 187 | "chip_architecture": "x86_64", |
188 | 188 | "testset_id": "ts1", |
189 | 189 | "testset_name": "Short factual questions (low energy baseline)", |
190 | | - "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.", |
| 190 | + "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.", |
191 | 191 | "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.", |
192 | 192 | "question_id": "ts1_q5", |
193 | 193 | "question_difficulty": "easy", |
194 | 194 | "question_task_type": "qa", |
195 | | - "expected_answer_description": "The author\u2019s name (William Shakespeare).", |
| 195 | + "expected_answer_description": "The author’s name (William Shakespeare).", |
196 | 196 | "max_output_tokens_hint": 6, |
197 | 197 | "energy_relevance": "Simple fact retrieval; low energy.", |
198 | 198 | "tags": [ |
|
218 | 218 | "region": "unknown", |
219 | 219 | "notice": null, |
220 | 220 | "sampling_ms": 100, |
221 | | - "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 221 | + "device_name": "AMD Radeon Graphics", |
222 | 222 | "device_type": "amd", |
223 | 223 | "os_name": "Linux", |
224 | 224 | "os_version": "6.14.0-37-generic", |
225 | 225 | "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S", |
226 | | - "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 226 | + "gpu_model": "AMD Radeon Graphics", |
227 | 227 | "ram_gb": 125.1, |
228 | 228 | "chip_architecture": "x86_64", |
229 | 229 | "testset_id": "ts1", |
230 | 230 | "testset_name": "Short factual questions (low energy baseline)", |
231 | | - "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.", |
| 231 | + "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.", |
232 | 232 | "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.", |
233 | 233 | "question_id": "ts1_q6", |
234 | 234 | "question_difficulty": "easy", |
235 | 235 | "question_task_type": "qa", |
236 | | - "expected_answer_description": "A four\u2011digit year (1969).", |
| 236 | + "expected_answer_description": "A four‑digit year (1969).", |
237 | 237 | "max_output_tokens_hint": 5, |
238 | 238 | "energy_relevance": "Short question with numeric answer; minimal compute.", |
239 | 239 | "tags": [ |
|
259 | 259 | "region": "unknown", |
260 | 260 | "notice": null, |
261 | 261 | "sampling_ms": 100, |
262 | | - "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 262 | + "device_name": "AMD Radeon Graphics", |
263 | 263 | "device_type": "amd", |
264 | 264 | "os_name": "Linux", |
265 | 265 | "os_version": "6.14.0-37-generic", |
266 | 266 | "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S", |
267 | | - "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 267 | + "gpu_model": "AMD Radeon Graphics", |
268 | 268 | "ram_gb": 125.1, |
269 | 269 | "chip_architecture": "x86_64", |
270 | 270 | "testset_id": "ts1", |
271 | 271 | "testset_name": "Short factual questions (low energy baseline)", |
272 | | - "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.", |
| 272 | + "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.", |
273 | 273 | "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.", |
274 | 274 | "question_id": "ts1_q7", |
275 | 275 | "question_difficulty": "easy", |
276 | 276 | "question_task_type": "qa", |
277 | | - "expected_answer_description": "The element\u2019s name (Carbon).", |
| 277 | + "expected_answer_description": "The element’s name (Carbon).", |
278 | 278 | "max_output_tokens_hint": 5, |
279 | 279 | "energy_relevance": "Simple factual recall; low energy cost.", |
280 | 280 | "tags": [ |
|
300 | 300 | "region": "unknown", |
301 | 301 | "notice": null, |
302 | 302 | "sampling_ms": 100, |
303 | | - "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 303 | + "device_name": "AMD Radeon Graphics", |
304 | 304 | "device_type": "amd", |
305 | 305 | "os_name": "Linux", |
306 | 306 | "os_version": "6.14.0-37-generic", |
307 | 307 | "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S", |
308 | | - "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 308 | + "gpu_model": "AMD Radeon Graphics", |
309 | 309 | "ram_gb": 125.1, |
310 | 310 | "chip_architecture": "x86_64", |
311 | 311 | "testset_id": "ts1", |
312 | 312 | "testset_name": "Short factual questions (low energy baseline)", |
313 | | - "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.", |
| 313 | + "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.", |
314 | 314 | "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.", |
315 | 315 | "question_id": "ts1_q8", |
316 | 316 | "question_difficulty": "easy", |
317 | 317 | "question_task_type": "qa", |
318 | 318 | "expected_answer_description": "A single integer (7).", |
319 | 319 | "max_output_tokens_hint": 4, |
320 | | - "energy_relevance": "Basic arithmetic with one\u2011word output.", |
| 320 | + "energy_relevance": "Basic arithmetic with one‑word output.", |
321 | 321 | "tags": [ |
322 | 322 | "math", |
323 | 323 | "numeric", |
|
341 | 341 | "region": "unknown", |
342 | 342 | "notice": null, |
343 | 343 | "sampling_ms": 100, |
344 | | - "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 344 | + "device_name": "AMD Radeon Graphics", |
345 | 345 | "device_type": "amd", |
346 | 346 | "os_name": "Linux", |
347 | 347 | "os_version": "6.14.0-37-generic", |
348 | 348 | "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S", |
349 | | - "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 349 | + "gpu_model": "AMD Radeon Graphics", |
350 | 350 | "ram_gb": 125.1, |
351 | 351 | "chip_architecture": "x86_64", |
352 | 352 | "testset_id": "ts1", |
353 | 353 | "testset_name": "Short factual questions (low energy baseline)", |
354 | | - "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.", |
| 354 | + "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.", |
355 | 355 | "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.", |
356 | 356 | "question_id": "ts1_q9", |
357 | 357 | "question_difficulty": "easy", |
|
382 | 382 | "region": "unknown", |
383 | 383 | "notice": null, |
384 | 384 | "sampling_ms": 100, |
385 | | - "device_name": "Linux with GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 385 | + "device_name": "AMD Radeon Graphics", |
386 | 386 | "device_type": "amd", |
387 | 387 | "os_name": "Linux", |
388 | 388 | "os_version": "6.14.0-37-generic", |
389 | 389 | "cpu_model": "AMD RYZEN AI MAX+ 395 w/ Radeon 8060S", |
390 | | - "gpu_model": "GPU[0]\t\t: Card Series: \t\tAMD Radeon Graphics", |
| 390 | + "gpu_model": "AMD Radeon Graphics", |
391 | 391 | "ram_gb": 125.1, |
392 | 392 | "chip_architecture": "x86_64", |
393 | 393 | "testset_id": "ts1", |
394 | 394 | "testset_name": "Short factual questions (low energy baseline)", |
395 | | - "testset_goal": "Establish a low\u2011energy baseline by asking simple factual or arithmetic questions that require short, single\u2011sentence answers.", |
| 395 | + "testset_goal": "Establish a low‑energy baseline by asking simple factual or arithmetic questions that require short, single‑sentence answers.", |
396 | 396 | "testset_notes": "Use this set to measure the minimum energy cost of a local LLM under controlled conditions. Each prompt is concise, and the expected output is a short factual answer with minimal reasoning. Run multiple models on the same hardware and compare average energy per response.", |
397 | 397 | "question_id": "ts1_q10", |
398 | 398 | "question_difficulty": "easy", |
399 | 399 | "question_task_type": "qa", |
400 | 400 | "expected_answer_description": "The resulting secondary color (purple or violet).", |
401 | 401 | "max_output_tokens_hint": 6, |
402 | | - "energy_relevance": "Simple fact with one\u2011word answer to establish baseline energy usage.", |
| 402 | + "energy_relevance": "Simple fact with one‑word answer to establish baseline energy usage.", |
403 | 403 | "tags": [ |
404 | 404 | "color-mixing", |
405 | 405 | "factual", |
|
0 commit comments