diff --git a/Qwen/Qwen3-1.7B/accuracy/tasks.yml b/Qwen/Qwen3-1.7B/accuracy/tasks.yml
new file mode 100644
index 0000000..ffc0ab7
--- /dev/null
+++ b/Qwen/Qwen3-1.7B/accuracy/tasks.yml
@@ -0,0 +1,10 @@
+# Migrated from neuralmagic/lm-eval-configs/models/Qwen3-1.7B.yaml
+# Note: Metric values are placeholders (0.0) and should be updated with actual baseline values when available
+tasks:
+  - name: gsm8k
+    metrics:
+      - name: exact_match,strict-match
+        value: 0.0
+      - name: exact_match,flexible-extract
+        value: 0.0
+
diff --git a/Qwen/Qwen3-4B/accuracy/tasks.yml b/Qwen/Qwen3-4B/accuracy/tasks.yml
new file mode 100644
index 0000000..0ab4772
--- /dev/null
+++ b/Qwen/Qwen3-4B/accuracy/tasks.yml
@@ -0,0 +1,10 @@
+# Migrated from neuralmagic/lm-eval-configs/models/Qwen3-4B.yaml
+# Note: Metric values are placeholders (0.0) and should be updated with actual baseline values when available
+tasks:
+  - name: gsm8k
+    metrics:
+      - name: exact_match,strict-match
+        value: 0.0
+      - name: exact_match,flexible-extract
+        value: 0.0
+
diff --git a/google/gemma-7b/accuracy/tasks.yml b/google/gemma-7b/accuracy/tasks.yml
new file mode 100644
index 0000000..dcb5c97
--- /dev/null
+++ b/google/gemma-7b/accuracy/tasks.yml
@@ -0,0 +1,10 @@
+# Migrated from neuralmagic/lm-eval-configs/models/gemma-7b.yaml
+# Note: Metric values are placeholders (0.0) and should be updated with actual baseline values when available
+tasks:
+  - name: gsm8k
+    metrics:
+      - name: exact_match,strict-match
+        value: 0.0
+      - name: exact_match,flexible-extract
+        value: 0.0
+
diff --git a/ibm-granite/granite-3.2-2b-instruct/accuracy/tasks.yml b/ibm-granite/granite-3.2-2b-instruct/accuracy/tasks.yml
new file mode 100644
index 0000000..0cfbfd2
--- /dev/null
+++ b/ibm-granite/granite-3.2-2b-instruct/accuracy/tasks.yml
@@ -0,0 +1,10 @@
+# Migrated from neuralmagic/lm-eval-configs/models/granite-3.2-2b-instruct.yaml
+# Note: Metric values are placeholders (0.0) and should be updated with actual baseline values when available
+tasks:
+  - name: gsm8k
+    metrics:
+      - name: exact_match,strict-match
+        value: 0.0
+      - name: exact_match,flexible-extract
+        value: 0.0
+
diff --git a/zai-org/glm-4-9b-hf/accuracy/tasks.yml b/zai-org/glm-4-9b-hf/accuracy/tasks.yml
new file mode 100644
index 0000000..b36a3a6
--- /dev/null
+++ b/zai-org/glm-4-9b-hf/accuracy/tasks.yml
@@ -0,0 +1,11 @@
+# Migrated from neuralmagic/lm-eval-configs/models/glm-4-9b-hf.yaml
+# Note: Original config referenced zai-org/glm-4-9b-hf
+# Note: Metric values are placeholders (0.0) and should be updated with actual baseline values when available
+tasks:
+  - name: gsm8k
+    metrics:
+      - name: exact_match,strict-match
+        value: 0.0
+      - name: exact_match,flexible-extract
+        value: 0.0
+