File tree Expand file tree Collapse file tree 1 file changed +48
-0
lines changed
ci/L0_backend_vllm/accuracy_test Expand file tree Collapse file tree 1 file changed +48
-0
lines changed Original file line number Diff line number Diff line change @@ -45,6 +45,8 @@ sed -i 's/"gpu_memory_utilization": 0.5/"gpu_memory_utilization": 0.3/' models/v
4545[ -f vllm_baseline_output.pkl ] && rm vllm_baseline_output.pkl
4646RET=0
4747
48+ export VLLM_USE_V1=0
49+
4850set +e
4951# Need to generate baseline first, since running 2 vLLM engines causes
5052# memory issues: https://github.com/vllm-project/vllm/issues/2248
@@ -82,6 +84,50 @@ set -e
8284
8385kill $SERVER_PID
8486wait $SERVER_PID
87+
88+ # Remove old baseline files if they exist
89+ [ -f vllm_baseline_output.pkl ] && rm vllm_baseline_output.pkl
90+ [ -f vllm_guided_baseline_output.pkl ] && rm vllm_guided_baseline_output.pkl
91+
92+ # Run tests for vLLM V1, but omit guided decoding, as it is still under development as of 0.8.1
93+ export VLLM_USE_V1=1
94+ EXPECTED_NUM_TESTS=1
95+
96+ set +e
97+ # Need to generate baseline first, since running 2 vLLM engines causes
98+ # memory issues: https://github.com/vllm-project/vllm/issues/2248
99+ python3 $CLIENT_PY --generate-baseline >> $VLLM_ENGINE_LOG 2>&1 & BASELINE_PID=$!
100+ wait $BASELINE_PID
101+
102+ set -e
103+
104+ run_server
105+ if [ " $SERVER_PID " == " 0" ]; then
106+ cat $SERVER_LOG
107+ echo -e " \n***\n*** Failed to start $SERVER \n***"
108+ exit 1
109+ fi
110+
111+ set +e
112+ python3 $CLIENT_PY VLLMTritonAccuracyTest.test_vllm_model > $CLIENT_LOG 2>&1
113+
114+ if [ $? -ne 0 ]; then
115+ cat $CLIENT_LOG
116+ echo -e " \n***\n*** Running $CLIENT_PY FAILED. \n***"
117+ RET=1
118+ else
119+ check_test_results $TEST_RESULT_FILE $EXPECTED_NUM_TESTS
120+ if [ $? -ne 0 ]; then
121+ cat $CLIENT_LOG
122+ echo -e " \n***\n*** Test Result Verification FAILED.\n***"
123+ RET=1
124+ fi
125+ fi
126+ set -e
127+
128+ kill $SERVER_PID
129+ wait $SERVER_PID
130+
85131rm -rf models/
86132
87133if [ $RET -eq 1 ]; then
92138 echo -e " \n***\n*** Accuracy test PASSED. \n***"
93139fi
94140
141+ unset VLLM_USE_V1
142+
95143collect_artifacts_from_subdir
96144
97145exit $RET
You can’t perform that action at this time.
0 commit comments