|
5 | 5 |
|
6 | 6 | TAG=$(date +"%Y_%m_%d_%H_%M")
|
7 | 7 | SCRIPT_DIR=$( cd -- "$( dirname -- "${BASH_SOURCE[0]}" )" &> /dev/null && pwd )
|
8 |
| -BASE="$SCRIPT_DIR/../../.." |
9 |
| -MODEL="meta-llama/Llama-3.1-8B-Instruct" |
10 |
| -SYSTEM="TPU" |
11 |
| -TP=1 |
12 |
| -DOWNLOAD_DIR="" |
13 |
| -INPUT_LEN=4000 |
14 |
| -OUTPUT_LEN=16 |
15 |
| -MAX_MODEL_LEN=4096 |
16 |
| -MIN_CACHE_HIT_PCT=0 |
17 |
| -MAX_LATENCY_ALLOWED_MS=100000000000 |
18 |
| -NUM_SEQS_LIST="128 256" |
19 |
| -NUM_BATCHED_TOKENS_LIST="512 1024 2048 4096" |
| 8 | +VLLM_LOGGING_LEVEL=${VLLM_LOGGING_LEVEL:-INFO} |
| 9 | +BASE=${BASE:-"$SCRIPT_DIR/../../.."} |
| 10 | +MODEL=${MODEL:-"meta-llama/Llama-3.1-8B-Instruct"} |
| 11 | +SYSTEM=${SYSTEM:-"TPU"} |
| 12 | +TP=${TP:-1} |
| 13 | +DOWNLOAD_DIR=${DOWNLOAD_DIR:-""} |
| 14 | +INPUT_LEN=${INPUT_LEN:-4000} |
| 15 | +OUTPUT_LEN=${OUTPUT_LEN:-16} |
| 16 | +MAX_MODEL_LEN=${MAX_MODEL_LEN:-4096} |
| 17 | +MIN_CACHE_HIT_PCT=${MIN_CACHE_HIT_PCT:-0} |
| 18 | +MAX_LATENCY_ALLOWED_MS=${MAX_LATENCY_ALLOWED_MS:-100000000000} |
| 19 | +NUM_SEQS_LIST=${NUM_SEQS_LIST:-"128 256"} |
| 20 | +NUM_BATCHED_TOKENS_LIST=${NUM_BATCHED_TOKENS_LIST:-"512 1024 2048 4096"} |
20 | 21 |
|
21 | 22 | LOG_FOLDER="$BASE/auto-benchmark/$TAG"
|
22 | 23 | RESULT="$LOG_FOLDER/result.txt"
|
23 | 24 | PROFILE_PATH="$LOG_FOLDER/profile"
|
24 | 25 |
|
25 |
| -echo "result file: $RESULT" |
26 |
| -echo "model: $MODEL" |
| 26 | +echo "====================== AUTO TUNE PARAMETERS ====================" |
| 27 | +echo "SCRIPT_DIR=$SCRIPT_DIR" |
| 28 | +echo "BASE=$BASE" |
| 29 | +echo "MODEL=$MODEL" |
| 30 | +echo "SYSTEM=$SYSTEM" |
| 31 | +echo "TP=$TP" |
| 32 | +echo "DOWNLOAD_DIR=$DOWNLOAD_DIR" |
| 33 | +echo "INPUT_LEN=$INPUT_LEN" |
| 34 | +echo "OUTPUT_LEN=$OUTPUT_LEN" |
| 35 | +echo "MAX_MODEL_LEN=$MAX_MODEL_LEN" |
| 36 | +echo "MIN_CACHE_HIT_PCT=$MIN_CACHE_HIT_PCT" |
| 37 | +echo "MAX_LATENCY_ALLOWED_MS=$MAX_LATENCY_ALLOWED_MS" |
| 38 | +echo "NUM_SEQS_LIST=$NUM_SEQS_LIST" |
| 39 | +echo "NUM_BATCHED_TOKENS_LIST=$NUM_BATCHED_TOKENS_LIST" |
| 40 | +echo "VLLM_LOGGING_LEVEL=$VLLM_LOGGING_LEVEL" |
| 41 | +echo "RESULT_FILE=$RESULT" |
| 42 | +echo "====================== AUTO TUNE PARAMETERS ====================" |
27 | 43 |
|
28 | 44 | rm -rf $LOG_FOLDER
|
29 | 45 | rm -rf $PROFILE_PATH
|
|
0 commit comments