fix: deduplicate tests/test_tools.py and point tests/test_doc.py at the hosted gateway

jackalcooper · jackalcooper · commit cac9ef771f57 · 2026-01-15T18:18:34.000+08:00
diff --git a/tests/test_doc.py b/tests/test_doc.py
@@ -6,6 +6,7 @@
 
 # --- CONFIGURATION ---
 BASE_URL_PREFIX = "http://localhost:8000/siliconflow/models"
+BASE_URL_PREFIX = "https://api-bailian.siliconflow.cn/siliconflow/models"
 API_KEY = os.getenv("SILICONFLOW_API_KEY", "test_api_key")
 
 HEADERS = {
diff --git a/tests/test_tools.py b/tests/test_tools.py
@@ -1,19 +1,16 @@
 import pytest
 import json
 import requests
-from typing import Generator, List, Dict, Any
-from dataclasses import dataclass
 import os
+from typing import Generator, List, Dict, Any, Optional
+from dataclasses import dataclass
+
+# --- 1. CONFIGURATION & CONSTANTS ---
 
-# --- CONSTANTS & CONFIGURATION ---
-# Note: Ensure your MockServer/Proxy is running on this port
 # GATEWAY_URL = "https://api-bailian.siliconflow.cn/api/v1/services/aigc/text-generation/generation"
 GATEWAY_URL = "http://localhost:8000/api/v1/services/aigc/text-generation/generation"
-# GATEWAY_URL = "http://localhost:8000/siliconflow/models/deepseek-ai/DeepSeek-R1"
-# GATEWAY_URL = "https://api-bailian.siliconflow.cn/siliconflow/models/deepseek-ai/DeepSeek-R1"
 API_KEY = os.getenv("SILICONFLOW_API_KEY", "test_api_key")
 
-# Define the Tool Schema Vector
 TOOL_VECTOR_WEATHER = [
     {
         "type": "function",
@@ -35,16 +32,31 @@
     }
 ]
 
+# --- 2. CORE UTILITIES & DATA STRUCTURES ---
 
 @dataclass
 class SSEFrame:
     """Formal representation of a Server-Sent Event frame for validation."""
-
     id: str
     output: Dict[str, Any]
     usage: Dict[str, Any]
     request_id: str
 
+    @property
+    def text_content(self) -> str:
+        """Helper to safely extract standard content."""
+        choices = self.output.get("choices", [])
+        if not choices:
+            return ""
+        return choices[0].get("message", {}).get("content", "")
+
+    @property
+    def reasoning_content(self) -> str:
+        """Helper to safely extract reasoning content (for R1 models)."""
+        choices = self.output.get("choices", [])
+        if not choices:
+            return ""
+        return choices[0].get("message", {}).get("reasoning_content", "")
 
 def parse_sse_stream(response: requests.Response) -> Generator[SSEFrame, None, None]:
     """
@@ -58,27 +70,25 @@ def parse_sse_stream(response: requests.Response) -> Generator[SSEFrame, None, N
                 json_str = decoded_line[5:].strip()
                 try:
                     data = json.loads(json_str)
+                    # Fall back to an empty dict when a frame carries no "usage" field
+                    usage_data = data.get("usage", {})
+
                     yield SSEFrame(
-                        id=data.get("output", {})
-                        .get("choices", [{}])[0]
-                        .get("id", "unknown"),
+                        id=data.get("output", {}).get("choices", [{}])[0].get("id", "unknown"),
                         output=data.get("output", {}),
-                        usage=data.get("usage", {}),
+                        usage=usage_data,
                         request_id=data.get("request_id", ""),
                     )
                 except json.JSONDecodeError:
                     continue
 
-
 # --- SUITE A: INVARIANT & PREDICATE VERIFICATION ---
 
-
 def test_invariant_format_constraint():
     """
     Predicate A: If P_tools is not empty, P_result_format must be 'message'.
     """
     headers = {"Authorization": f"Bearer {API_KEY}", "Content-Type": "application/json"}
-
     payload = {
         "model": "deepseek-v3",
         "input": {"messages": [{"role": "user", "content": "What's the weather?"}]},
@@ -87,26 +97,21 @@ def test_invariant_format_constraint():
             "result_format": "text",  # <--- INTENTIONAL VIOLATION
         },
     }
-
     response = requests.post(GATEWAY_URL, headers=headers, json=payload)
 
     assert response.status_code == 400
     error_data = response.json()
     assert "code" in error_data
     assert "result_format" in str(error_data).lower()
 
-
 def test_invariant_r1_orthogonality():
     """
     Predicate B: DeepSeek R1 'Thinking Mode' is orthogonal to 'Forced Tool Choice (Dict)'.
     """
     headers = {"Authorization": f"Bearer {API_KEY}", "Content-Type": "application/json"}
-
     payload = {
         "model": "deepseek-r1",
-        "input": {
-            "messages": [{"role": "user", "content": "Analyze the weather logic."}]
-        },
+        "input": {"messages": [{"role": "user", "content": "Analyze the weather logic."}]},
         "parameters": {
             "enable_thinking": True,
             "tools": TOOL_VECTOR_WEATHER,
@@ -116,16 +121,13 @@ def test_invariant_r1_orthogonality():
             },
         },
     }
-
     response = requests.post(GATEWAY_URL, headers=headers, json=payload)
 
     assert response.status_code == 400
     assert "InvalidParameter" in response.json().get("code", "")
 
-
 # --- SUITE B: PROTOCOL ISOMORPHISM (SSE TELEMETRY) ---
 
-
 def test_telemetry_continuity_sse():
     """
     Theorem: The 'usage' object must be persisted in EVERY SSE frame.
@@ -135,7 +137,6 @@ def test_telemetry_continuity_sse():
         "Content-Type": "application/json",
         "X-DashScope-SSE": "enable",
     }
-
     payload = {
         "model": "deepseek-v3",
         "input": {"messages": [{"role": "user", "content": "Call the tool."}]},
@@ -157,14 +158,11 @@ def test_telemetry_continuity_sse():
 
     assert frame_count > 0
 
-
 # --- SUITE C: TOOL INVOCATION & CONFIGURATION TESTS ---
 
-
 def test_unary_tool_invocation_structure():
     """
-    Validates that standard unary (non-streaming) responses maintain proper tool structures
-    when tools are enabled but not necessarily forced.
+    Validates standard unary responses maintain tool structures when tools enabled.
     """
     headers = {"Authorization": f"Bearer {API_KEY}", "Content-Type": "application/json"}
     payload = {
@@ -185,16 +183,13 @@ def test_unary_tool_invocation_structure():
     assert "choices" in data["output"]
     assert len(data["output"]["choices"]) > 0
 
-    # Check structure integrity
     choice = data["output"]["choices"][0]
     assert "message" in choice
     assert "usage" in data
 
-
 def test_tool_choice_none_suppression():
     """
-    Validates that tool_choice='none' is accepted by the gateway and processed without error.
-    This ensures the explicit suppression logic path is valid.
+    Validates that tool_choice='none' is accepted and processes without error.
     """
     headers = {"Authorization": f"Bearer {API_KEY}", "Content-Type": "application/json"}
     payload = {
@@ -209,120 +204,31 @@ def test_tool_choice_none_suppression():
     response = requests.post(GATEWAY_URL, headers=headers, json=payload)
     assert response.status_code == 200
 
-    # Even if mocked, the structure must be valid
     data = response.json()
     assert data["output"]["choices"][0]["finish_reason"] is not None
 
-
-import pytest
-import json
-import requests
-from typing import Generator, List, Dict, Any, Optional
-from dataclasses import dataclass
-import os
-
-# --- CONSTANTS & CONFIGURATION ---
-GATEWAY_URL = "http://localhost:8000/api/v1/services/aigc/text-generation/generation"
-API_KEY = os.getenv("SILICONFLOW_API_KEY", "test_api_key")
-
-TOOL_VECTOR_WEATHER = [
-    {
-        "type": "function",
-        "function": {
-            "name": "get_current_weather",
-            "description": "Get the current weather in a given location",
-            "parameters": {
-                "type": "object",
-                "properties": {
-                    "location": {"type": "string"},
-                    "unit": {"type": "string", "enum": ["celsius", "fahrenheit"]},
-                },
-                "required": ["location"],
-            },
-        },
-    }
-]
-
-
-@dataclass
-class SSEFrame:
-    id: str
-    output: Dict[str, Any]
-    usage: Dict[str, Any]
-    request_id: str
-
-    @property
-    def text_content(self) -> str:
-        """Helper to safely extract standard content."""
-        choices = self.output.get("choices", [])
-        if not choices:
-            return ""
-        return choices[0].get("message", {}).get("content", "")
-
-    @property
-    def reasoning_content(self) -> str:
-        """Helper to safely extract reasoning content (for R1 models)."""
-        choices = self.output.get("choices", [])
-        if not choices:
-            return ""
-        return choices[0].get("message", {}).get("reasoning_content", "")
-
-
-def parse_sse_stream(response: requests.Response) -> Generator[SSEFrame, None, None]:
-    for line in response.iter_lines():
-        if line:
-            decoded_line = line.decode("utf-8")
-            if decoded_line.startswith("data:"):
-                json_str = decoded_line[5:].strip()
-                try:
-                    data = json.loads(json_str)
-                    yield SSEFrame(
-                        id=data.get("output", {})
-                        .get("choices", [{}])[0]
-                        .get("id", "unknown"),
-                        output=data.get("output", {}),
-                        usage=data.get("usage", {}),
-                        request_id=data.get("request_id", ""),
-                    )
-                except json.JSONDecodeError:
-                    continue
-
-
-# --- EXISTING SUITES (A, B, C) OMITTED FOR BREVITY ---
-# (Assume Suite A, B, and C from your original code are here)
-
 # --- SUITE D: INCREMENTAL OUTPUT BEHAVIOR ---
 
-
 def assert_stream_accumulation(frames: List[SSEFrame], check_reasoning: bool = False):
     """
     Validates 'Accumulated' behavior (incremental_output=False).
     Theorem: For any frame N > 0, Content(N) must start with Content(N-1).
     """
     previous_content = ""
-
-    # Filter out empty initial frames if necessary, though accumulation should start immediately
     for i, frame in enumerate(frames):
-        # Select content type based on what the model is outputting (Reasoning vs Standard)
-        current_content = (
-            frame.reasoning_content if check_reasoning else frame.text_content
-        )
+        current_content = frame.reasoning_content if check_reasoning else frame.text_content
 
-        # Skip empty frames (sometimes initial frames are just metadata)
+        # Skip leading empty frames (nothing has accumulated yet)
         if not current_content and not previous_content:
             continue
 
-        # Assertion: The new content must contain the previous content as a prefix
-        # This proves the server is sending the full history every time.
         assert current_content.startswith(previous_content), (
             f"Frame {i} violation: Output is not accumulated.\n"
             f"Previous: {previous_content!r}\n"
             f"Current:  {current_content!r}"
         )
-
         previous_content = current_content
 
-
 def assert_stream_deltas(frames: List[SSEFrame], check_reasoning: bool = False):
     """
     Validates 'Delta' behavior (incremental_output=True).
@@ -332,31 +238,20 @@ def assert_stream_deltas(frames: List[SSEFrame], check_reasoning: bool = False):
     previous_content = ""
 
     for i, frame in enumerate(frames):
-        current_content = (
-            frame.reasoning_content if check_reasoning else frame.text_content
-        )
-
+        current_content = frame.reasoning_content if check_reasoning else frame.text_content
         if not current_content:
             continue
 
-        # If current content strictly starts with previous content AND adds to it,
-        # we might be in accumulation mode.
-        # Note: We need a heuristic because "The" -> "The cat" is technically accumulation,
-        # but in Delta mode it should be "The" -> " cat".
-        if (
-            previous_content
-            and current_content.startswith(previous_content)
-            and len(current_content) > len(previous_content)
-        ):
+        # Heuristic: if content is strictly longer and starts with the previous content, it's likely accumulation
+        if (previous_content and
+            current_content.startswith(previous_content) and
+            len(current_content) > len(previous_content)):
             accumulation_detected = True
             break
 
         previous_content = current_content
 
-    assert (
-        not accumulation_detected
-    ), "Stream appears to be accumulating full text, expected Deltas (chunks) only."
-
+    assert not accumulation_detected, "Stream appears to be accumulating full text, expected Deltas."
 
 def test_incremental_output_false_explicit():
     """
@@ -369,7 +264,7 @@ def test_incremental_output_false_explicit():
         "X-DashScope-SSE": "enable",
     }
     payload = {
-        "model": "deepseek-r1",  # Using R1 to check reasoning accumulation
+        "model": "deepseek-r1",
         "input": {"messages": [{"role": "user", "content": "Count to 5"}]},
         "parameters": {
             "result_format": "message",
@@ -379,14 +274,10 @@ def test_incremental_output_false_explicit():
 
     response = requests.post(GATEWAY_URL, headers=headers, json=payload, stream=True)
     assert response.status_code == 200
-
     frames = list(parse_sse_stream(response))
     assert len(frames) > 0
-
-    # Verify accumulation on reasoning_content (since R1 outputs reasoning first)
     assert_stream_accumulation(frames, check_reasoning=True)
 
-
 def test_incremental_output_default_behavior():
     """
     Case 2: incremental_output param is MISSING.
@@ -408,19 +299,14 @@ def test_incremental_output_default_behavior():
 
     response = requests.post(GATEWAY_URL, headers=headers, json=payload, stream=True)
     assert response.status_code == 200
-
     frames = list(parse_sse_stream(response))
     assert len(frames) > 0
-
-    # Verify the default behavior matches accumulation
     assert_stream_accumulation(frames, check_reasoning=True)
 
-
 def test_incremental_output_true_contrast():
     """
     Case 3: Explicitly set incremental_output=True.
     Expectation: The response contains only DELTAS (chunks).
-    Used to ensure the switch actually works.
     """
     headers = {
         "Authorization": f"Bearer {API_KEY}",
@@ -438,9 +324,6 @@ def test_incremental_output_true_contrast():
 
     response = requests.post(GATEWAY_URL, headers=headers, json=payload, stream=True)
     assert response.status_code == 200
-
     frames = list(parse_sse_stream(response))
     assert len(frames) > 0
-
-    # Verify we are receiving deltas, not full text
     assert_stream_deltas(frames, check_reasoning=True)