From c8611904bc7e1b57a6c17b7a41d6b7500d5b94ba Mon Sep 17 00:00:00 2001
From: Yingge He <157551214+yinggeh@users.noreply.github.com>
Date: Tue, 23 Sep 2025 15:06:19 -0700
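Subject: [PATCH 1/2] fix: OpenAI and vLLM related tests (#8397)

Remove the "disable_log_requests" option from the vLLM model.json files
used by the OpenAI frontend tests (mistral-nemo-instruct-2407 and
llama-3.1-8b-instruct) and from the model.json generated by
qa/L0_perf_vllm/test.sh. Also bump the openai pin in
python/openai/requirements.txt from 1.60.0 to 1.107.3 and update the
copyright year range in qa/L0_perf_vllm/test.sh.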

---
 python/openai/requirements.txt                                 | 2 +-
 .../mistral-nemo-instruct-2407/1/model.json                    | 2 +-
 .../tests/vllm_models/llama-3.1-8b-instruct/1/model.json       | 2 +-
 qa/L0_perf_vllm/test.sh                                        | 3 +--
 4 files changed, 4 insertions(+), 5 deletions(-)

diff --git a/python/openai/requirements.txt b/python/openai/requirements.txt
index 5536880c09..608f3b5ac3 100644
--- a/python/openai/requirements.txt
+++ b/python/openai/requirements.txt
@@ -29,7 +29,7 @@ fastapi==0.115.6
 # Fix httpx version to avoid bug in openai library:
 # https://community.openai.com/t/error-with-openai-1-56-0-client-init-got-an-unexpected-keyword-argument-proxies/1040332/3
 httpx==0.27.2
-openai==1.60.0
+openai==1.107.3
 partial-json-parser # used for parsing partial JSON outputs
 # Minimum starlette version needed to address CVE:
 # https://github.com/advisories/GHSA-f96h-pmfr-66vw
diff --git a/python/openai/tests/vllm_mistral_models/mistral-nemo-instruct-2407/1/model.json b/python/openai/tests/vllm_mistral_models/mistral-nemo-instruct-2407/1/model.json
index 835e537349..b7ce0ee199 100644
--- a/python/openai/tests/vllm_mistral_models/mistral-nemo-instruct-2407/1/model.json
+++ b/python/openai/tests/vllm_mistral_models/mistral-nemo-instruct-2407/1/model.json
@@ -1 +1 @@
-{"model": "mistralai/Mistral-Nemo-Instruct-2407", "disable_log_requests": true, "gpu_memory_utilization": 0.9}
\ No newline at end of file
+{"model": "mistralai/Mistral-Nemo-Instruct-2407", "gpu_memory_utilization": 0.9}
\ No newline at end of file
diff --git a/python/openai/tests/vllm_models/llama-3.1-8b-instruct/1/model.json b/python/openai/tests/vllm_models/llama-3.1-8b-instruct/1/model.json
index cb9b14c765..df85a05da0 100644
--- a/python/openai/tests/vllm_models/llama-3.1-8b-instruct/1/model.json
+++ b/python/openai/tests/vllm_models/llama-3.1-8b-instruct/1/model.json
@@ -1 +1 @@
-{"model": "meta-llama/Meta-Llama-3.1-8B-Instruct", "disable_log_requests": true, "gpu_memory_utilization": 0.9}
+{"model": "meta-llama/Meta-Llama-3.1-8B-Instruct", "gpu_memory_utilization": 0.9}
diff --git a/qa/L0_perf_vllm/test.sh b/qa/L0_perf_vllm/test.sh
index e1ce8cf2ed..2c9fc87cb4 100755
--- a/qa/L0_perf_vllm/test.sh
+++ b/qa/L0_perf_vllm/test.sh
@@ -1,5 +1,5 @@
 #!/bin/bash
-# Copyright 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# Copyright 2023-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 #
 # Redistribution and use in source and binary forms, with or without
 # modification, are permitted provided that the following conditions
@@ -47,7 +47,6 @@ rm -rf $MODEL_REPO $EXPORT_FILE *.tjson *.json *.csv
 mkdir -p $MODEL_REPO/$MODEL_NAME/1
 echo '{
     "model":"gpt2",
-    "disable_log_requests": "true",
     "gpu_memory_utilization": 0.5
 }' >$MODEL_REPO/$MODEL_NAME/1/model.json
 

From dcffd8b3d3979131ca2d454465e25741211887a9 Mon Sep 17 00:00:00 2001
From: Yingge He <yinggeh@nvidia.com>
Date: Wed, 24 Sep 2025 14:33:46 -0700
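Subject: [PATCH 2/2] Revert openai version

Restore the openai pin in python/openai/requirements.txt from 1.107.3
back to 1.60.0, undoing the version bump made in patch 1/2. The other
changes from patch 1/2 are kept.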

---
 python/openai/requirements.txt | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/openai/requirements.txt b/python/openai/requirements.txt
index 608f3b5ac3..5536880c09 100644
--- a/python/openai/requirements.txt
+++ b/python/openai/requirements.txt
@@ -29,7 +29,7 @@ fastapi==0.115.6
 # Fix httpx version to avoid bug in openai library:
 # https://community.openai.com/t/error-with-openai-1-56-0-client-init-got-an-unexpected-keyword-argument-proxies/1040332/3
 httpx==0.27.2
-openai==1.107.3
+openai==1.60.0
 partial-json-parser # used for parsing partial JSON outputs
 # Minimum starlette version needed to address CVE:
 # https://github.com/advisories/GHSA-f96h-pmfr-66vw