Skip to content

Commit 01e2fb0

Browse files
committed
doc: update full script
1 parent ae94984 commit 01e2fb0

File tree

1 file changed

+5
-30
lines changed

1 file changed

+5
-30
lines changed

run.sh

Lines changed: 5 additions & 30 deletions
Original file line number | Diff line number | Diff line change
@@ -1,39 +1,14 @@
1-
BS=5
2 1
DATASET=bigcodebench
3-
MODEL=gpt-3.5-turbo-0125
4-
BACKEND=openai
5-
TEMP=0
6-
N_SAMPLES=1
2+
MODEL=meta-llama/Llama-3.2-1B-Instruct
3+
BACKEND=vllm
7 4
NUM_GPU=1
8 5
SPLIT=complete
9 6
SUBSET=hard
10-
if [[ $MODEL == *"/"* ]]; then
11-
ORG=$(echo $MODEL | cut -d'/' -f1)--
12-
BASE_MODEL=$(echo $MODEL | cut -d'/' -f2)
13-
else
14-
ORG=""
15-
BASE_MODEL=$MODEL
16-
fi
17 7

18-
if [ "$SUBSET" = "full" ]; then
19-
FILE_HEADER="${ORG}${BASE_MODEL}--${DATASET}-${SPLIT}--${BACKEND}-${TEMP}-${N_SAMPLES}"
20-
else
21-
FILE_HEADER="${ORG}${BASE_MODEL}--${DATASET}-${SUBSET}-${SPLIT}--${BACKEND}-${TEMP}-${N_SAMPLES}"
22-
fi
23-
24-
echo $FILE_HEADER
25-
bigcodebench.generate \
8+
bigcodebench.evaluate \
26 9
--model $MODEL \
27-
--resume \
10+
--samples meta-llama--Llama-3.2-1B-Instruct--bigcodebench-hard-complete--vllm-0-1-sanitized_calibrated.jsonl \
28 11
--split $SPLIT \
29 12
--subset $SUBSET \
30 13
--backend $BACKEND \
31-
--greedy
32-
33-
bigcodebench.sanitize --samples $FILE_HEADER.jsonl --calibrate
34-
35-
# Check if the ground truth works on your machine
36-
bigcodebench.evaluate --split $SPLIT --subset $SUBSET --samples $FILE_HEADER-sanitized-calibrated.jsonl
37-
38-
# If the execution is slow:
39-
bigcodebench.evaluate --split $SPLIT --subset $SUBSET --samples $FILE_HEADER-sanitized-calibrated.jsonl --parallel 32
14+
--greedy

0 commit comments

Comments
 (0)