diff --git a/src/llmperf/ray_clients/openai_chat_completions_client.py b/src/llmperf/ray_clients/openai_chat_completions_client.py index f2e0a91..6d38dfe 100644 --- a/src/llmperf/ray_clients/openai_chat_completions_client.py +++ b/src/llmperf/ray_clients/openai_chat_completions_client.py @@ -59,6 +59,12 @@ def llm_request(self, request_config: RequestConfig) -> Dict[str, Any]: if not address.endswith("/"): address = address + "/" address += "chat/completions" + if "azure"in address: + api_version = os.environ.get("OPENAI_API_VERSION") + if not api_version: + raise ValueError("the environment variable OPENAI_API_VERSION must be set for Azure OpenAI service.") + address = f"{address}?api-version={api_version}" + headers = {"api-key": key} # replace with Authorization: Bearer try: with requests.post( address,