-import azure.ai.inference.models
+import openai
 import pytest
 import pytest_asyncio
 
@@ -13,54 +13,70 @@ class AsyncChatCompletionIterator:
     def __init__(self, answer: str):
         self.chunk_index = 0
         self.chunks = [
-            azure.ai.inference.models.StreamingChatCompletionsUpdate(
-                id="test-123",
-                created=1703462735,
-                model="DeepSeek-R1",
-                choices=[
-                    azure.ai.inference.models.StreamingChatChoiceUpdate(
-                        delta=azure.ai.inference.models.StreamingChatResponseMessageUpdate(
-                            content=None, role="assistant"
-                        ),
-                        index=0,
-                        finish_reason=None,
-                    )
+            openai.types.chat.ChatCompletionChunk(
+                object="chat.completion.chunk",
+                choices=[],
+                id="",
+                created=0,
+                model="",
+                prompt_filter_results=[
+                    {
+                        "prompt_index": 0,
+                        "content_filter_results": {
+                            "hate": {"filtered": False, "severity": "safe"},
+                            "self_harm": {"filtered": False, "severity": "safe"},
+                            "sexual": {"filtered": False, "severity": "safe"},
+                            "violence": {"filtered": False, "severity": "safe"},
+                        },
+                    }
                 ],
-            ),
+            )
         ]
         answer_deltas = answer.split(" ")
         for answer_index, answer_delta in enumerate(answer_deltas):
-            # Completion chunks include whitespace, so we need to add it back in
-            if answer_index > 0:
+            # Text completion chunks include whitespace, so we need to add it back in
+            if answer_index > 0 and answer_delta != "</think>":
                 answer_delta = " " + answer_delta
             self.chunks.append(
-                azure.ai.inference.models.StreamingChatCompletionsUpdate(
+                openai.types.chat.ChatCompletionChunk(
                     id="test-123",
-                    created=1703462735,
-                    model="DeepSeek-R1",
+                    object="chat.completion.chunk",
                     choices=[
-                        azure.ai.inference.models.StreamingChatChoiceUpdate(
-                            delta=azure.ai.inference.models.StreamingChatResponseMessageUpdate(
-                                content=answer_delta, role=None
+                        openai.types.chat.chat_completion_chunk.Choice(
+                            delta=openai.types.chat.chat_completion_chunk.ChoiceDelta(
+                                role=None, content=answer_delta
                             ),
-                            index=0,
                             finish_reason=None,
+                            index=0,
+                            logprobs=None,
+                            # Only Azure includes content_filter_results
+                            content_filter_results={
+                                "hate": {"filtered": False, "severity": "safe"},
+                                "self_harm": {"filtered": False, "severity": "safe"},
+                                "sexual": {"filtered": False, "severity": "safe"},
+                                "violence": {"filtered": False, "severity": "safe"},
+                            },
                         )
                     ],
+                    created=1703462735,
+                    model="DeepSeek-R1",
                 )
             )
         self.chunks.append(
-            azure.ai.inference.models.StreamingChatCompletionsUpdate(
+            openai.types.chat.ChatCompletionChunk(
                 id="test-123",
-                created=1703462735,
-                model="DeepSeek-R1",
+                object="chat.completion.chunk",
                 choices=[
-                    azure.ai.inference.models.StreamingChatChoiceUpdate(
-                        delta=azure.ai.inference.models.StreamingChatResponseMessageUpdate(content=None, role=None),
+                    openai.types.chat.chat_completion_chunk.Choice(
+                        delta=openai.types.chat.chat_completion_chunk.ChoiceDelta(content=None, role=None),
                         index=0,
                         finish_reason="stop",
+                        # Only Azure includes content_filter_results
+                        content_filter_results={},
                     )
                 ],
+                created=1703462735,
+                model="DeepSeek-R1",
             )
         )
 
@@ -75,28 +91,29 @@ async def __anext__(self):
         else:
             raise StopAsyncIteration
 
-    async def mock_complete(*args, **kwargs):
+    async def mock_acreate(*args, **kwargs):
         # Only mock a stream=True completion
         last_message = kwargs.get("messages")[-1]["content"]
         if last_message == "What is the capital of France?":
-            return AsyncChatCompletionIterator("The capital of France is Paris.")
+            return AsyncChatCompletionIterator("<think> hmm </think> The capital of France is Paris.")
         elif last_message == "What is the capital of Germany?":
-            return AsyncChatCompletionIterator("The capital of Germany is Berlin.")
+            return AsyncChatCompletionIterator("<think> hmm </think> The capital of Germany is Berlin.")
         else:
             raise ValueError(f"Unexpected message: {last_message}")
 
-    monkeypatch.setattr("azure.ai.inference.aio.ChatCompletionsClient.complete", mock_complete)
+    monkeypatch.setattr("openai.resources.chat.AsyncCompletions.create", mock_acreate)
 
 
 @pytest.fixture
 def mock_defaultazurecredential(monkeypatch):
-    monkeypatch.setattr("azure.identity.aio.DefaultAzureCredential", mock_cred.MockAzureCredential)
+    monkeypatch.setattr("azure.identity.aio.AzureDeveloperCliCredential", mock_cred.MockAzureCredential)
     monkeypatch.setattr("azure.identity.aio.ManagedIdentityCredential", mock_cred.MockAzureCredential)
 
 
 @pytest_asyncio.fixture
 async def client(monkeypatch, mock_openai_chatcompletion, mock_defaultazurecredential):
     monkeypatch.setenv("AZURE_INFERENCE_ENDPOINT", "test-deepseek-service.ai.azure.com")
+    monkeypatch.setenv("AZURE_TENANT_ID", "test-tenant-id")
 
     quart_app = quartapp.create_app(testing=True)
 