File tree: 3 files changed, +10 -2 lines changed
L0_additional_outputs_vllm
L0_multi_gpu_vllm/vllm_backend
3 files changed, +10 -2 lines changed
Original file line number | Diff line number | Diff line change
@@ -32,7 +32,7 @@ pip3 install pytest==8.1.1
32 32   pip3 install tritonclient[grpc]
33 33
34 34   # Prepare Model
35    - rm -rf models vllm_baseline_output.pkl && mkdir -p models
   35 + rm -rf models && mkdir -p models
36 36   SAMPLE_MODELS_REPO="../../samples/model_repository"
37 37   cp -r $SAMPLE_MODELS_REPO/vllm_model models/vllm_opt
38 38   sed -i 's/"gpu_memory_utilization": 0.5/"gpu_memory_utilization": 0.3/' models/vllm_opt/1/model.json
42 42   # Test
43 43   SERVER_LOG="additional_outputs_test.server.log"
44 44   SERVER_ARGS="--model-repository=models"
   45 + # Cold start on SBSA device can take longer than default 120 seconds
   46 + PREV_SERVER_TIMEOUT=$SERVER_TIMEOUT
   47 + SERVER_TIMEOUT=240
45 48   run_server
   49 + SERVER_TIMEOUT=$PREV_SERVER_TIMEOUT
46 50   if [ "$SERVER_PID" == "0" ]; then
47 51       echo -e "\n***\n*** Failed to start $SERVER\n***"
48 52       cat $SERVER_LOG
@@ -61,6 +65,7 @@ wait $SERVER_PID
61 65   if [ $RET -eq 0 ]; then
62 66       echo -e "\n***\n*** Test Passed\n***"
63 67   else
   68 +     cat $SERVER_LOG
64 69       echo -e "\n***\n*** Test FAILED\n***"
65 70   fi
66 71   exit $RET
Original file line number | Diff line number | Diff line change
@@ -135,6 +135,7 @@ unmock_vllm_async_llm_engine
135 135   if [ $RET -eq 0 ]; then
136 136       echo -e "\n***\n*** Test Passed\n***"
137 137   else
    138 +     cat $SERVER_LOG
138 139       echo -e "\n***\n*** Test FAILED\n***"
139 140   fi
140 141   exit $RET
Original file line number | Diff line number | Diff line change
1 1   #!/bin/bash
2   - # Copyright 2023-2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
  2 + # Copyright 2023-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
3 3   #
4 4   # Redistribution and use in source and binary forms, with or without
5 5   # modification, are permitted provided that the following conditions
138 138
139 139   ### Results
140 140   if [ $RET -eq 1 ]; then
    141 +     cat $CLIENT_LOG
    142 +     cat $SERVER_LOG
141 143       echo -e "\n***\n*** Multi GPU Utilization test FAILED. \n***"
142 144   else
143 145       echo -e "\n***\n*** Multi GPU Utilization test PASSED. \n***"
You can’t perform that action at this time.
0 commit comments