6 files changed: +6 -4 lines changed
L0_additional_outputs_vllm (6 files changed: +6 -4 lines changed)
Original file line number | Diff line number | Diff line change
@@ -30,7 +30,6 @@ source ../common/util.sh
30 30
31 31   pip3 install pytest==8.1.1
32 32   pip3 install tritonclient[grpc]
33    - pip3 install "transformers<=4.53.3" # TODO:DLIS-8441 remove this dependency
34 33
35 34   # Prepare Model
36 35   rm -rf models vllm_baseline_output.pkl && mkdir -p models
Original file line number | Diff line number | Diff line change
29 29   SUBTESTS="accuracy_test request_cancellation enabled_stream vllm_backend metrics_test"
30 30
31 31   python3 -m pip install tritonclient[grpc]
32    - python3 -m pip install "transformers<=4.53.3" # TODO:DLIS-8441 remove this dependency
33 32
34 33   for TEST in ${SUBTESTS}; do
35 34       (cd ${TEST} && bash -ex test.sh && cd ..)
Original file line number | Diff line number | Diff line change
@@ -30,7 +30,6 @@ source ../common/util.sh
30 30
31 31   pip3 install pytest==8.1.1
32 32   pip3 install tritonclient[grpc]
33    - pip3 install "transformers<=4.53.3" # TODO:DLIS-8441 remove this dependency
34 33
35 34   RET=0
36 35
Original file line number | Diff line number | Diff line change
@@ -41,6 +41,9 @@ EXPECTED_NUM_TESTS=2
41 41   GENERATE_ENDPOINT="localhost:8000/v2/models/vllm_llama_multi_lora/generate"
42 42   CHECK_FOR_ERROR=true
43 43
   44 + export C_INCLUDE_PATH=/usr/local/cuda/include:$C_INCLUDE_PATH
   45 + export TRITON_PTXAS_PATH=/usr/local/cuda/bin/ptxas
   46 +
44 47   make_api_call() {
45 48       local endpoint="$1"
46 49       local data="$2"
Original file line number | Diff line number | Diff line change
29 29   SUBTESTS="vllm_backend multi_lora"
30 30
31 31   python3 -m pip install tritonclient[grpc]
32    - python3 -m pip install "transformers<=4.53.3" # TODO:DLIS-8441 remove this dependency
33 32
34 33   for TEST in ${SUBTESTS}; do
35 34       (cd ${TEST} && bash -ex test.sh && cd ..)
Original file line number | Diff line number | Diff line change
@@ -36,6 +36,9 @@ CLIENT_PY="./vllm_multi_gpu_test.py"
36 36   SAMPLE_MODELS_REPO="../../../samples/model_repository"
37 37   EXPECTED_NUM_TESTS=1
38 38
   39 + export C_INCLUDE_PATH=/usr/local/cuda/include:$C_INCLUDE_PATH
   40 + export TRITON_PTXAS_PATH=/usr/local/cuda/bin/ptxas
   41 +
39 42   ### Helpers
40 43   function validate_file_contains() {
41 44       local KEY="${1}"
You can’t perform that action at this time.
0 commit comments