File tree Expand file tree Collapse file tree 1 file changed +5
-30
lines changed
Expand file tree Collapse file tree 1 file changed +5
-30
lines changed
Original file line number | Diff line number | Diff line change
1- BS=5
2 1 DATASET=bigcodebench
3- MODEL=gpt-3.5-turbo-0125
4- BACKEND=openai
5- TEMP=0
6- N_SAMPLES=1
2+ MODEL=meta-llama/Llama-3.2-1B-Instruct
3+ BACKEND=vllm
7 4 NUM_GPU=1
8 5 SPLIT=complete
9 6 SUBSET=hard
10- if [[ $MODEL == *"/"* ]]; then
11- ORG=$(echo $MODEL | cut -d'/' -f1)--
12- BASE_MODEL=$(echo $MODEL | cut -d'/' -f2)
13- else
14- ORG=""
15- BASE_MODEL=$MODEL
16- fi
17 7
18- if [ "$SUBSET" = "full" ]; then
19- FILE_HEADER="${ORG}${BASE_MODEL}--${DATASET}-${SPLIT}--${BACKEND}-${TEMP}-${N_SAMPLES}"
20- else
21- FILE_HEADER="${ORG}${BASE_MODEL}--${DATASET}-${SUBSET}-${SPLIT}--${BACKEND}-${TEMP}-${N_SAMPLES}"
22- fi
23-
24- echo $FILE_HEADER
25- bigcodebench.generate \
8+ bigcodebench.evaluate \
26 9 --model $MODEL \
27- --resume \
10+ --samples meta-llama--Llama-3.2-1B-Instruct--bigcodebench-hard-complete--vllm-0-1-sanitized_calibrated.jsonl \
28 11 --split $SPLIT \
29 12 --subset $SUBSET \
30 13 --backend $BACKEND \
31- --greedy
32-
33- bigcodebench.sanitize --samples $FILE_HEADER.jsonl --calibrate
34-
35- # Check if the ground truth works on your machine
36- bigcodebench.evaluate --split $SPLIT --subset $SUBSET --samples $FILE_HEADER-sanitized-calibrated.jsonl
37-
38- # If the execution is slow:
39- bigcodebench.evaluate --split $SPLIT --subset $SUBSET --samples $FILE_HEADER-sanitized-calibrated.jsonl --parallel 32
14+ --greedy
You can’t perform that action at this time.
0 commit comments