Skip to content

Commit 993568a

Browse files
committed
initiate repo
1 parent 023dd89 commit 993568a

File tree

2 files changed

+53
-1
lines changed

2 files changed

+53
-1
lines changed

README.md

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1,6 @@
1-
# model-validation-configs
1+
# model-validation-configs
2+
3+
This repository contains configurations for model validation.
4+
5+
The `lm-eval` folder contains one YAML file per model, each configuring the information needed to validate that model through the
6+
[lm-evaluation-harness](https://github.com/huggingface/lm-evaluation-harness).
Lines changed: 47 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,47 @@
1+
# configs for https://huggingface.co/meta-llama/Meta-Llama-3.1-8B-Instruct
2+
server:
3+
model: "meta-llama/Meta-Llama-3.1-8B-Instruct"
4+
trust_remote_code: true
5+
enable_chunked_prefill: true
6+
tensor_parallel_size:
7+
max_model_len: 4096
8+
9+
storage:
10+
model: hf
11+
data: hf
12+
13+
lm-eval:
14+
model: "vllm"
15+
model_args:
16+
pretrained: "meta-llama/Meta-Llama-3.1-8B-Instruct"
17+
num_fewshot:
18+
apply_chat_template: true
19+
fewshot_as_multiturn: true
20+
add_bos_token: false
21+
tasks:
22+
- name: "leaderboard_bbh"
23+
metrics:
24+
- name: "acc_norm,none"
25+
value: 0.50946
26+
- name: "leaderboard_gpqa"
27+
metrics:
28+
- name: "acc_norm,none"
29+
value: 0.29698
30+
- name: "leaderboard_ifeval"
31+
metrics:
32+
- name: "inst_level_loose_acc,none"
33+
value: 0.85851
34+
- name: "inst_level_strict_acc,none"
35+
value: 0.82374
36+
- name: "prompt_level_loose_acc,none"
37+
value: 0.79667
38+
- name: "prompt_level_strict_acc,none"
39+
value: 0.74861
40+
- name: "leaderboard_math_hard"
41+
metrics:
42+
- name: "exact_match,none"
43+
value: 0.19864
44+
- name: "leaderboard_musr"
45+
metrics:
46+
- name: "acc_norm,none"
47+
value: 0.38359

0 commit comments

Comments
 (0)