update tests to target aug preview version (#37360)

kristapratico · web-flow · commit e964d988b604 · 2024-09-13T10:58:41.000-07:00
* update tests to target the August preview API version (2024-08-01-preview)

* keep gpt-4-1106-preview for tests where gpt-4o is not supported
diff --git a/sdk/openai/azure-openai/dev_requirements.txt b/sdk/openai/azure-openai/dev_requirements.txt
@@ -3,3 +3,4 @@
 aiohttp
 openai
 pillow
+pydantic
diff --git a/sdk/openai/azure-openai/tests/conftest.py b/sdk/openai/azure-openai/tests/conftest.py
@@ -21,7 +21,7 @@
 
 # for pytest.parametrize
 GA = "2024-06-01"
-PREVIEW = "2024-07-01-preview"
+PREVIEW = "2024-08-01-preview"
 LATEST = PREVIEW
 
 AZURE = "azure"
@@ -48,7 +48,7 @@
 ENV_AZURE_OPENAI_EMBEDDINGS_NAME = "text-embedding-ada-002"
 ENV_AZURE_OPENAI_AUDIO_NAME = "whisper"
 ENV_AZURE_OPENAI_DALLE_NAME = "dall-e-3"
-ENV_AZURE_OPENAI_CHAT_COMPLETIONS_GPT4_NAME = "gpt-4-1106-preview"
+ENV_AZURE_OPENAI_CHAT_COMPLETIONS_GPT4_NAME = "gpt-4o"
 ENV_AZURE_OPENAI_TTS_NAME = "tts"
 
 ENV_OPENAI_KEY = "OPENAI_KEY"
@@ -57,7 +57,7 @@
 ENV_OPENAI_EMBEDDINGS_MODEL = "text-embedding-ada-002"
 ENV_OPENAI_AUDIO_MODEL = "whisper-1"
 ENV_OPENAI_DALLE_MODEL = "dall-e-3"
-ENV_OPENAI_CHAT_COMPLETIONS_GPT4_MODEL = "gpt-4-1106-preview"
+ENV_OPENAI_CHAT_COMPLETIONS_GPT4_MODEL = "gpt-4o-2024-08-06"
 ENV_OPENAI_TTS_MODEL = "tts-1"
 
 
diff --git a/sdk/openai/azure-openai/tests/test_assistants.py b/sdk/openai/azure-openai/tests/test_assistants.py
@@ -201,7 +201,7 @@ def test_assistants_crud(self, client, api_type, api_version, **kwargs):
                 name="python test",
                 instructions="You are a personal math tutor. Write and run code to answer math questions.",
                 tools=[{"type": "code_interpreter"}],
-                **kwargs,
+                model="gpt-4-1106-preview",
             )
             retrieved_assistant = client.beta.assistants.retrieve(
                 assistant_id=assistant.id,
@@ -489,7 +489,7 @@ def test_assistants_runs_code(self, client, api_type, api_version, **kwargs):
                 name="python test",
                 instructions="You are a personal math tutor. Write and run code to answer math questions.",
                 tools=[{"type": "code_interpreter"}],
-                **kwargs,
+                model="gpt-4-1106-preview",
             )
 
             thread = client.beta.threads.create()
@@ -561,7 +561,7 @@ def test_assistants_runs_file_search(self, client, api_type, api_version, **kwar
                         "vector_store_ids": [vector_store.id]
                     }
                 },
-                **kwargs
+                model="gpt-4-1106-preview"
             )
 
             run = client.beta.threads.create_and_run_poll(
@@ -629,7 +629,7 @@ def test_assistants_runs_functions(self, client, api_type, api_version, **kwargs
                         }
                     }
                 ],
-                **kwargs,
+                model="gpt-4-1106-preview",
             )
 
             run = client.beta.threads.create_and_run_poll(
@@ -710,7 +710,7 @@ def test_assistants_streaming(self, client, api_type, api_version, **kwargs):
             name="Math Tutor",
             instructions="You are a personal math tutor. Write and run code to answer math questions.",
             tools=[{"type": "code_interpreter"}],
-            **kwargs,
+            model="gpt-4-1106-preview",
         )
         try:
             thread = client.beta.threads.create()
@@ -738,7 +738,7 @@ def test_assistants_stream_event_handler(self, client, api_type, api_version, **
             name="Math Tutor",
             instructions="You are a personal math tutor. Write and run code to answer math questions.",
             tools=[{"type": "code_interpreter"}],
-            **kwargs
+            model="gpt-4-1106-preview"
         )
 
         try:
diff --git a/sdk/openai/azure-openai/tests/test_assistants_async.py b/sdk/openai/azure-openai/tests/test_assistants_async.py
@@ -200,7 +200,7 @@ async def test_assistants_crud(self, client_async, api_type, api_version, **kwar
                 name="python test",
                 instructions="You are a personal math tutor. Write and run code to answer math questions.",
                 tools=[{"type": "code_interpreter"}],
-                **kwargs,
+                model="gpt-4-1106-preview",
             )
             retrieved_assistant = await client_async.beta.assistants.retrieve(
                 assistant_id=assistant.id,
@@ -493,7 +493,7 @@ async def test_assistants_runs_code(self, client_async, api_type, api_version, *
                 name="python test",
                 instructions="You are a personal math tutor. Write and run code to answer math questions.",
                 tools=[{"type": "code_interpreter"}],
-                **kwargs,
+                model="gpt-4-1106-preview",
             )
             thread = await client_async.beta.threads.create()
 
@@ -565,7 +565,7 @@ async def test_assistants_runs_file_search(self, client_async, api_type, api_ver
                         "vector_store_ids": [vector_store.id]
                     }
                 },
-                **kwargs
+                model="gpt-4-1106-preview"
             )
 
             run = await client_async.beta.threads.create_and_run_poll(
@@ -634,7 +634,7 @@ async def test_assistants_runs_functions(self, client_async, api_type, api_versi
                         }
                     }
                 ],
-                **kwargs,
+                model="gpt-4-1106-preview",
             )
 
             run = await client_async.beta.threads.create_and_run_poll(
@@ -717,7 +717,7 @@ async def test_assistants_streaming(self, client_async, api_type, api_version, *
             name="Math Tutor",
             instructions="You are a personal math tutor. Write and run code to answer math questions.",
             tools=[{"type": "code_interpreter"}],
-            **kwargs,
+            model="gpt-4-1106-preview",
         )
         try:
             thread = await client_async.beta.threads.create()
@@ -746,7 +746,7 @@ async def test_assistants_stream_event_handler(self, client_async, api_type, api
             name="Math Tutor",
             instructions="You are a personal math tutor. Write and run code to answer math questions.",
             tools=[{"type": "code_interpreter"}],
-            **kwargs
+            model="gpt-4-1106-preview"
         )
 
         try:
diff --git a/sdk/openai/azure-openai/tests/test_chat_completions.py b/sdk/openai/azure-openai/tests/test_chat_completions.py
@@ -6,6 +6,8 @@
 import os
 import pytest
 import json
+from typing import List
+from pydantic import BaseModel
 import openai
 from devtools_testutils import AzureRecordedTestCase
 from conftest import (
@@ -843,7 +845,7 @@ def test_chat_completion_block_list_term(self, client, api_type, api_version, **
             {"role": "user", "content": "What is the best time of year to pick pineapple?"}
         ]
         with pytest.raises(openai.BadRequestError) as e:
-            client.chat.completions.create(messages=messages, **kwargs)
+            client.chat.completions.create(messages=messages, model="gpt-4-1106-preview")
         err = e.value.body
         assert err["code"] == "content_filter"
         content_filter_result = err["innererror"]["content_filter_result"]
@@ -1159,3 +1161,43 @@ def test_chat_completion_logprobs(self, client, api_type, api_version, **kwargs)
             assert logprob.token is not None
             assert logprob.logprob is not None
             assert logprob.bytes is not None
+
+    @configure
+    @pytest.mark.parametrize("api_type, api_version", [(GPT_4_AZURE, PREVIEW), (GPT_4_OPENAI, "v1")])
+    def test_chat_completion_structured_outputs(self, client, api_type, api_version, **kwargs):
+
+        class Step(BaseModel):
+            explanation: str
+            output: str
+
+        class MathResponse(BaseModel):
+            steps: List[Step]
+            final_answer: str
+
+        completion = client.beta.chat.completions.parse(
+            messages=[
+                {"role": "system", "content": "You are a helpful math tutor."},
+                {"role": "user", "content": "solve 8x + 31 = 2"},
+            ],
+            response_format=MathResponse,
+            **kwargs,
+        )
+
+        assert completion.id
+        assert completion.object == "chat.completion"
+        assert completion.model
+        assert completion.created
+        assert completion.usage.completion_tokens is not None
+        assert completion.usage.prompt_tokens is not None
+        assert completion.usage.total_tokens == completion.usage.completion_tokens + completion.usage.prompt_tokens
+        assert len(completion.choices) == 1
+        assert completion.choices[0].finish_reason
+        assert completion.choices[0].index is not None
+        assert completion.choices[0].message.content is not None
+        assert completion.choices[0].message.role
+        if completion.choices[0].message.parsed:
+            assert completion.choices[0].message.parsed.steps
+            for step in completion.choices[0].message.parsed.steps:
+                assert step.explanation
+                assert step.output
+            assert completion.choices[0].message.parsed.final_answer
diff --git a/sdk/openai/azure-openai/tests/test_chat_completions_async.py b/sdk/openai/azure-openai/tests/test_chat_completions_async.py
@@ -6,6 +6,8 @@
 import os
 import pytest
 import json
+from typing import List
+from pydantic import BaseModel
 import openai
 from devtools_testutils import AzureRecordedTestCase
 from conftest import (
@@ -864,7 +866,7 @@ async def test_chat_completion_block_list_term(self, client_async, api_type, api
             {"role": "user", "content": "What is the best time of year to pick pineapple?"}
         ]
         with pytest.raises(openai.BadRequestError) as e:
-            await client_async.chat.completions.create(messages=messages, **kwargs)
+            await client_async.chat.completions.create(messages=messages, model="gpt-4-1106-preview")
         err = e.value.body
         assert err["code"] == "content_filter"
         content_filter_result = err["innererror"]["content_filter_result"]
@@ -1185,3 +1187,43 @@ async def test_chat_completion_logprobs(self, client_async, api_type, api_versio
             assert logprob.token is not None
             assert logprob.logprob is not None
             assert logprob.bytes is not None
+
+    @configure_async
+    @pytest.mark.asyncio
+    @pytest.mark.parametrize("api_type, api_version", [(GPT_4_AZURE, PREVIEW), (GPT_4_OPENAI, "v1")])
+    async def test_chat_completion_structured_outputs(self, client_async, api_type, api_version, **kwargs):
+
+        class Step(BaseModel):
+            explanation: str
+            output: str
+
+        class MathResponse(BaseModel):
+            steps: List[Step]
+            final_answer: str
+
+        completion = await client_async.beta.chat.completions.parse(
+            messages=[
+                {"role": "system", "content": "You are a helpful math tutor. You only answer about math. Refuse to answer any other question."},
+                {"role": "user", "content": "solve 8x + 31 = 2"},
+            ],
+            response_format=MathResponse,
+            **kwargs,
+        )
+        assert completion.id
+        assert completion.object == "chat.completion"
+        assert completion.model
+        assert completion.created
+        assert completion.usage.completion_tokens is not None
+        assert completion.usage.prompt_tokens is not None
+        assert completion.usage.total_tokens == completion.usage.completion_tokens + completion.usage.prompt_tokens
+        assert len(completion.choices) == 1
+        assert completion.choices[0].finish_reason
+        assert completion.choices[0].index is not None
+        assert completion.choices[0].message.content is not None
+        assert completion.choices[0].message.role
+        if completion.choices[0].message.parsed:
+            assert completion.choices[0].message.parsed.steps
+            for step in completion.choices[0].message.parsed.steps:
+                assert step.explanation
+                assert step.output
+            assert completion.choices[0].message.parsed.final_answer

Original file line number	Diff line number	Diff line change
`@@ -3,3 +3,4 @@`
`3`	`3`	`aiohttp`
`4`	`4`	`openai`
`5`	`5`	`pillow`
	`6`	`+ pydantic`
Original file line number	Diff line number	Diff line change
`@@ -201,7 +201,7 @@ def test_assistants_crud(self, client, api_type, api_version, **kwargs):`
`201`	`201`	`name="python test",`
`202`	`202`	`instructions="You are a personal math tutor. Write and run code to answer math questions.",`
`203`	`203`	`tools=[{"type": "code_interpreter"}],`
`204`		`- **kwargs,`
	`204`	`+ model="gpt-4-1106-preview",`
`205`	`205`	`)`
`206`	`206`	`retrieved_assistant = client.beta.assistants.retrieve(`
`207`	`207`	`assistant_id=assistant.id,`
`@@ -489,7 +489,7 @@ def test_assistants_runs_code(self, client, api_type, api_version, **kwargs):`
`489`	`489`	`name="python test",`
`490`	`490`	`instructions="You are a personal math tutor. Write and run code to answer math questions.",`
`491`	`491`	`tools=[{"type": "code_interpreter"}],`
`492`		`- **kwargs,`
	`492`	`+ model="gpt-4-1106-preview",`
`493`	`493`	`)`
`494`	`494`
`495`	`495`	`thread = client.beta.threads.create()`
`@@ -561,7 +561,7 @@ def test_assistants_runs_file_search(self, client, api_type, api_version, **kwar`
`561`	`561`	`"vector_store_ids": [vector_store.id]`
`562`	`562`	`}`
`563`	`563`	`},`
`564`		`- **kwargs`
	`564`	`+ model="gpt-4-1106-preview"`
`565`	`565`	`)`
`566`	`566`
`567`	`567`	`run = client.beta.threads.create_and_run_poll(`
`@@ -629,7 +629,7 @@ def test_assistants_runs_functions(self, client, api_type, api_version, **kwargs`
`629`	`629`	`}`
`630`	`630`	`}`
`631`	`631`	`],`
`632`		`- **kwargs,`
	`632`	`+ model="gpt-4-1106-preview",`
`633`	`633`	`)`
`634`	`634`
`635`	`635`	`run = client.beta.threads.create_and_run_poll(`
`@@ -710,7 +710,7 @@ def test_assistants_streaming(self, client, api_type, api_version, **kwargs):`
`710`	`710`	`name="Math Tutor",`
`711`	`711`	`instructions="You are a personal math tutor. Write and run code to answer math questions.",`
`712`	`712`	`tools=[{"type": "code_interpreter"}],`
`713`		`- **kwargs,`
	`713`	`+ model="gpt-4-1106-preview",`
`714`	`714`	`)`
`715`	`715`	`try:`
`716`	`716`	`thread = client.beta.threads.create()`
`@@ -738,7 +738,7 @@ def test_assistants_stream_event_handler(self, client, api_type, api_version, **`
`738`	`738`	`name="Math Tutor",`
`739`	`739`	`instructions="You are a personal math tutor. Write and run code to answer math questions.",`
`740`	`740`	`tools=[{"type": "code_interpreter"}],`
`741`		`- **kwargs`
	`741`	`+ model="gpt-4-1106-preview"`
`742`	`742`	`)`
`743`	`743`
`744`	`744`	`try:`
Original file line number	Diff line number	Diff line change
`@@ -200,7 +200,7 @@ async def test_assistants_crud(self, client_async, api_type, api_version, **kwar`
`200`	`200`	`name="python test",`
`201`	`201`	`instructions="You are a personal math tutor. Write and run code to answer math questions.",`
`202`	`202`	`tools=[{"type": "code_interpreter"}],`
`203`		`- **kwargs,`
	`203`	`+ model="gpt-4-1106-preview",`
`204`	`204`	`)`
`205`	`205`	`retrieved_assistant = await client_async.beta.assistants.retrieve(`
`206`	`206`	`assistant_id=assistant.id,`
`@@ -493,7 +493,7 @@ async def test_assistants_runs_code(self, client_async, api_type, api_version, *`
`493`	`493`	`name="python test",`
`494`	`494`	`instructions="You are a personal math tutor. Write and run code to answer math questions.",`
`495`	`495`	`tools=[{"type": "code_interpreter"}],`
`496`		`- **kwargs,`
	`496`	`+ model="gpt-4-1106-preview",`
`497`	`497`	`)`
`498`	`498`	`thread = await client_async.beta.threads.create()`
`499`	`499`
`@@ -565,7 +565,7 @@ async def test_assistants_runs_file_search(self, client_async, api_type, api_ver`
`565`	`565`	`"vector_store_ids": [vector_store.id]`
`566`	`566`	`}`
`567`	`567`	`},`
`568`		`- **kwargs`
	`568`	`+ model="gpt-4-1106-preview"`
`569`	`569`	`)`
`570`	`570`
`571`	`571`	`run = await client_async.beta.threads.create_and_run_poll(`
`@@ -634,7 +634,7 @@ async def test_assistants_runs_functions(self, client_async, api_type, api_versi`
`634`	`634`	`}`
`635`	`635`	`}`
`636`	`636`	`],`
`637`		`- **kwargs,`
	`637`	`+ model="gpt-4-1106-preview",`
`638`	`638`	`)`
`639`	`639`
`640`	`640`	`run = await client_async.beta.threads.create_and_run_poll(`
`@@ -717,7 +717,7 @@ async def test_assistants_streaming(self, client_async, api_type, api_version, *`
`717`	`717`	`name="Math Tutor",`
`718`	`718`	`instructions="You are a personal math tutor. Write and run code to answer math questions.",`
`719`	`719`	`tools=[{"type": "code_interpreter"}],`
`720`		`- **kwargs,`
	`720`	`+ model="gpt-4-1106-preview",`
`721`	`721`	`)`
`722`	`722`	`try:`
`723`	`723`	`thread = await client_async.beta.threads.create()`
`@@ -746,7 +746,7 @@ async def test_assistants_stream_event_handler(self, client_async, api_type, api`
`746`	`746`	`name="Math Tutor",`
`747`	`747`	`instructions="You are a personal math tutor. Write and run code to answer math questions.",`
`748`	`748`	`tools=[{"type": "code_interpreter"}],`
`749`		`- **kwargs`
	`749`	`+ model="gpt-4-1106-preview"`
`750`	`750`	`)`
`751`	`751`
`752`	`752`	`try:`