@@ -50,7 +50,7 @@ function assert_curl_success {
5050
5151rm -rf models && mkdir -p models
5252cp -r ${SAMPLE_MODELS_REPO} /vllm_model models/vllm_opt
53- # `vllm_opt`` model will be loaded on server start and stay loaded throughout
53+ # `vllm_opt` model will be loaded on server start and stay loaded throughout
5454# unit testing. To ensure that vllm's memory profiler will not error out
5555# on `vllm_load_test` load, we reduce "gpu_memory_utilization" for `vllm_opt`,
5656# so that at least 60% of GPU memory is available for other models.
@@ -71,7 +71,7 @@ python3 $CLIENT_PY VLLMTritonMetricsTest.test_vllm_metrics -v > $CLIENT_LOG 2>&1
7171
7272if [ $? -ne 0 ]; then
7373 cat $CLIENT_LOG
74- echo -e " \n***\n*** Running $CLIENT_PY FAILED. \n***"
74+ echo -e " \n***\n*** Running $CLIENT_PY VLLMTritonMetricsTest.test_vllm_metrics FAILED. \n***"
7575 RET=1
7676else
7777 check_test_results $TEST_RESULT_FILE $EXPECTED_NUM_TESTS
@@ -101,7 +101,7 @@ python3 $CLIENT_PY VLLMTritonMetricsTest.test_vllm_metrics_disabled -v > $CLIENT
101101
102102if [ $? -ne 0 ]; then
103103 cat $CLIENT_LOG
104- echo -e " \n***\n*** Running $CLIENT_PY FAILED. \n***"
104+ echo -e " \n***\n*** Running $CLIENT_PY VLLMTritonMetricsTest.test_vllm_metrics_disabled FAILED. \n***"
105105 RET=1
106106else
107107 check_test_results $TEST_RESULT_FILE $EXPECTED_NUM_TESTS
@@ -132,7 +132,7 @@ python3 $CLIENT_PY VLLMTritonMetricsTest.test_vllm_metrics -v > $CLIENT_LOG 2>&1
132132
133133if [ $? -ne 0 ]; then
134134 cat $CLIENT_LOG
135- echo -e " \n***\n*** Running $CLIENT_PY FAILED. \n***"
135+ echo -e " \n***\n*** Running $CLIENT_PY VLLMTritonMetricsTest.test_vllm_metrics FAILED. \n***"
136136 RET=1
137137else
138138 check_test_results $TEST_RESULT_FILE $EXPECTED_NUM_TESTS
0 commit comments