Skip to content

Commit 5ed7a12

Browse files
committed
ip
1 parent af51a6f commit 5ed7a12

File tree

1 file changed

+48
-0
lines changed
  • ci/L0_backend_vllm/accuracy_test

1 file changed

+48
-0
lines changed

ci/L0_backend_vllm/accuracy_test/test.sh

Lines changed: 48 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -45,6 +45,8 @@ sed -i 's/"gpu_memory_utilization": 0.5/"gpu_memory_utilization": 0.3/' models/v
4545
[ -f vllm_baseline_output.pkl ] && rm vllm_baseline_output.pkl
4646
RET=0
4747

48+
export VLLM_USE_V1=0
49+
4850
set +e
4951
# Need to generate baseline first, since running 2 vLLM engines causes
5052
# memory issues: https://github.com/vllm-project/vllm/issues/2248
@@ -82,6 +84,50 @@ set -e
8284

8385
kill $SERVER_PID
8486
wait $SERVER_PID
87+
88+
# Remove old baseline files if they exist
89+
[ -f vllm_baseline_output.pkl ] && rm vllm_baseline_output.pkl
90+
[ -f vllm_guided_baseline_output.pkl ] && rm vllm_guided_baseline_output.pkl
91+
92+
# Run tests for vLLM V1, but omit guided decoding, as its development is still in progress as of 0.8.1
93+
export VLLM_USE_V1=1
94+
EXPECTED_NUM_TESTS=1
95+
96+
set +e
97+
# Need to generate baseline first, since running 2 vLLM engines causes
98+
# memory issues: https://github.com/vllm-project/vllm/issues/2248
99+
python3 $CLIENT_PY --generate-baseline >> $VLLM_ENGINE_LOG 2>&1 & BASELINE_PID=$!
100+
wait $BASELINE_PID
101+
102+
set -e
103+
104+
run_server
105+
if [ "$SERVER_PID" == "0" ]; then
106+
cat $SERVER_LOG
107+
echo -e "\n***\n*** Failed to start $SERVER\n***"
108+
exit 1
109+
fi
110+
111+
set +e
112+
python3 $CLIENT_PY VLLMTritonAccuracyTest.test_vllm_model > $CLIENT_LOG 2>&1
113+
114+
if [ $? -ne 0 ]; then
115+
cat $CLIENT_LOG
116+
echo -e "\n***\n*** Running $CLIENT_PY FAILED. \n***"
117+
RET=1
118+
else
119+
check_test_results $TEST_RESULT_FILE $EXPECTED_NUM_TESTS
120+
if [ $? -ne 0 ]; then
121+
cat $CLIENT_LOG
122+
echo -e "\n***\n*** Test Result Verification FAILED.\n***"
123+
RET=1
124+
fi
125+
fi
126+
set -e
127+
128+
kill $SERVER_PID
129+
wait $SERVER_PID
130+
85131
rm -rf models/
86132

87133
if [ $RET -eq 1 ]; then
@@ -92,6 +138,8 @@ else
92138
echo -e "\n***\n*** Accuracy test PASSED. \n***"
93139
fi
94140

141+
unset VLLM_USE_V1
142+
95143
collect_artifacts_from_subdir
96144

97145
exit $RET

0 commit comments

Comments
 (0)