From c8611904bc7e1b57a6c17b7a41d6b7500d5b94ba Mon Sep 17 00:00:00 2001 From: Yingge He <157551214+yinggeh@users.noreply.github.com> Date: Tue, 23 Sep 2025 15:06:19 -0700 Subject: [PATCH 1/2] fix: OpenAI and vLLM related tests (#8397) --- python/openai/requirements.txt | 2 +- .../mistral-nemo-instruct-2407/1/model.json | 2 +- .../tests/vllm_models/llama-3.1-8b-instruct/1/model.json | 2 +- qa/L0_perf_vllm/test.sh | 3 +-- 4 files changed, 4 insertions(+), 5 deletions(-) diff --git a/python/openai/requirements.txt b/python/openai/requirements.txt index 5536880c09..608f3b5ac3 100644 --- a/python/openai/requirements.txt +++ b/python/openai/requirements.txt @@ -29,7 +29,7 @@ fastapi==0.115.6 # Fix httpx version to avoid bug in openai library: # https://community.openai.com/t/error-with-openai-1-56-0-client-init-got-an-unexpected-keyword-argument-proxies/1040332/3 httpx==0.27.2 -openai==1.60.0 +openai==1.107.3 partial-json-parser # used for parsing partial JSON outputs # Minimum starlette version needed to address CVE: # https://github.com/advisories/GHSA-f96h-pmfr-66vw diff --git a/python/openai/tests/vllm_mistral_models/mistral-nemo-instruct-2407/1/model.json b/python/openai/tests/vllm_mistral_models/mistral-nemo-instruct-2407/1/model.json index 835e537349..b7ce0ee199 100644 --- a/python/openai/tests/vllm_mistral_models/mistral-nemo-instruct-2407/1/model.json +++ b/python/openai/tests/vllm_mistral_models/mistral-nemo-instruct-2407/1/model.json @@ -1 +1 @@ -{"model": "mistralai/Mistral-Nemo-Instruct-2407", "disable_log_requests": true, "gpu_memory_utilization": 0.9} \ No newline at end of file +{"model": "mistralai/Mistral-Nemo-Instruct-2407", "gpu_memory_utilization": 0.9} \ No newline at end of file diff --git a/python/openai/tests/vllm_models/llama-3.1-8b-instruct/1/model.json b/python/openai/tests/vllm_models/llama-3.1-8b-instruct/1/model.json index cb9b14c765..df85a05da0 100644 --- a/python/openai/tests/vllm_models/llama-3.1-8b-instruct/1/model.json +++ b/python/openai/tests/vllm_models/llama-3.1-8b-instruct/1/model.json @@ -1 +1 @@ -{"model": "meta-llama/Meta-Llama-3.1-8B-Instruct", "disable_log_requests": true, "gpu_memory_utilization": 0.9} +{"model": "meta-llama/Meta-Llama-3.1-8B-Instruct", "gpu_memory_utilization": 0.9} diff --git a/qa/L0_perf_vllm/test.sh b/qa/L0_perf_vllm/test.sh index e1ce8cf2ed..2c9fc87cb4 100755 --- a/qa/L0_perf_vllm/test.sh +++ b/qa/L0_perf_vllm/test.sh @@ -1,5 +1,5 @@ #!/bin/bash -# Copyright 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved. +# Copyright 2023-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved. # # Redistribution and use in source and binary forms, with or without # modification, are permitted provided that the following conditions @@ -47,7 +47,6 @@ rm -rf $MODEL_REPO $EXPORT_FILE *.tjson *.json *.csv mkdir -p $MODEL_REPO/$MODEL_NAME/1 echo '{ "model":"gpt2", - "disable_log_requests": "true", "gpu_memory_utilization": 0.5 }' >$MODEL_REPO/$MODEL_NAME/1/model.json From dcffd8b3d3979131ca2d454465e25741211887a9 Mon Sep 17 00:00:00 2001 From: Yingge He Date: Wed, 24 Sep 2025 14:33:46 -0700 Subject: [PATCH 2/2] Revert openai version --- python/openai/requirements.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/openai/requirements.txt b/python/openai/requirements.txt index 608f3b5ac3..5536880c09 100644 --- a/python/openai/requirements.txt +++ b/python/openai/requirements.txt @@ -29,7 +29,7 @@ fastapi==0.115.6 # Fix httpx version to avoid bug in openai library: # https://community.openai.com/t/error-with-openai-1-56-0-client-init-got-an-unexpected-keyword-argument-proxies/1040332/3 httpx==0.27.2 -openai==1.107.3 +openai==1.60.0 partial-json-parser # used for parsing partial JSON outputs # Minimum starlette version needed to address CVE: # https://github.com/advisories/GHSA-f96h-pmfr-66vw