Update test_doc.py

jackalcooper · jackalcooper · commit 2d71f5e620f7 · 2026-01-15T15:46:31.000+08:00
diff --git a/tests/test_doc.py b/tests/test_doc.py
@@ -1,14 +1,15 @@
 import pytest
 import json
 import requests
-from typing import Generator, List, Dict, Any
-from dataclasses import dataclass
 import os
+from typing import Generator, List, Dict, Any, Optional
+from dataclasses import dataclass
 
 # --- CONSTANTS & CONFIGURATION ---
 
-# 修改为动态 URL 的基础路径
-GATEWAY_BASE_URL = "http://localhost:8000/siliconflow/models"
+# 基础 URL 修改为适配动态路径的前缀
+# 最终请求 URL 将拼接为: BASE_URL + "/" + {model_path}
+BASE_URL_PREFIX = "http://localhost:8000/siliconflow/models"
 
 API_KEY = os.getenv("SILICONFLOW_API_KEY", "test_api_key")
 
@@ -43,19 +44,16 @@
 
 # --- HELPERS ---
 
-
 @dataclass
 class SSEFrame:
     """Formal representation of a Server-Sent Event frame for validation."""
-
     id: str
     output: Dict[str, Any]
     usage: Dict[str, Any]
     request_id: str
 
-
 def parse_sse_stream(response: requests.Response) -> Generator[SSEFrame, None, None]:
-    """Parses the raw SSE stream."""
+    """Parses the raw SSE stream line by line."""
     for line in response.iter_lines():
         if line:
             decoded_line = line.decode("utf-8")
@@ -64,41 +62,68 @@ def parse_sse_stream(response: requests.Response) -> Generator[SSEFrame, None, N
                 try:
                     data = json.loads(json_str)
                     yield SSEFrame(
-                        id=data.get("output", {})
-                        .get("choices", [{}])[0]
-                        .get("id", "unknown"),
+                        id=data.get("output", {}).get("choices", [{}])[0].get("id", "unknown"),
                         output=data.get("output", {}),
                         usage=data.get("usage", {}),
                         request_id=data.get("request_id", ""),
                     )
                 except json.JSONDecodeError:
                     continue
 
-
-def make_request(payload: Dict[str, Any]):
+def make_request(payload: Dict[str, Any]) -> requests.Response:
     """
-    Helper to send POST request using the Dynamic Path URL.
-    Extracts 'model' from payload to construct the URL:
-    POST /siliconflow/models/{model_path}
+    Helper to send POST request using the Dynamic Path URL structure.
+
+    Format: POST /siliconflow/models/{model_path}
+
+    It extracts the 'model' from the payload to construct the URL.
     """
-    # 提取模型名称用于构建 URL
     model_path = payload.get("model")
 
     if not model_path:
-        raise ValueError(
-            "Payload must contain 'model' field for dynamic URL construction"
-        )
+        raise ValueError("Test payload must contain 'model' field for dynamic URL construction")
 
-    # 构建动态 URL
-    # 例如: http://localhost:8000/siliconflow/models/pre-siliconflow/deepseek-v3
-    url = f"{GATEWAY_BASE_URL}/{model_path}"
+    # Construct the dynamic URL, e.g.:
+    # http://localhost:8000/siliconflow/models/deepseek-ai/DeepSeek-V3
+    url = f"{BASE_URL_PREFIX}/{model_path}"
 
-    # 发送请求 (Payload 中保留 model 字段通常没问题，服务器端代码会再次处理或忽略)
+    # Send the request. Note: We keep 'model' in the json body as well,
+    # though the server mainly relies on the path parameter now.
     return requests.post(url, headers=HEADERS, json=payload, stream=True)
 
-
 # --- TEST SUITE ---
 
+class TestDynamicPathRouting:
+    """
+    测试动态 URL 路由本身的正确性
+    """
+
+    def test_routing_basic_success(self):
+        """
+        测试标准的 URL 格式是否能通
+        URL: .../deepseek-ai/DeepSeek-V3
+        """
+        payload = {
+            "model": "deepseek-ai/DeepSeek-V3",
+            "input": {"messages": [{"role": "user", "content": "Hello"}]},
+            "parameters": {"max_tokens": 10}
+        }
+        response = make_request(payload)
+        assert response.status_code == 200
+
+    def test_routing_with_mapping(self):
+        """
+        测试服务端 ModelResolver 是否依然工作
+        URL: .../pre-siliconflow/deepseek-v3 (会被映射到 upstream 的 deepseek-ai/DeepSeek-V3)
+        """
+        payload = {
+            "model": "pre-siliconflow/deepseek-v3",
+            "input": {"messages": [{"role": "user", "content": "Test"}]},
+            "parameters": {"max_tokens": 10}
+        }
+        response = make_request(payload)
+        assert response.status_code == 200
+
 
 class TestParameterValidation:
     """
@@ -108,51 +133,40 @@ class TestParameterValidation:
     def test_invalid_parameter_type_top_p(self):
         """
         Case: parameters.top_p 输入字符串 'a'，预期返回 400 InvalidParameter。
-        URL: /siliconflow/models/pre-siliconflow/deepseek-v3
         """
         payload = {
-            "model": "pre-siliconflow/deepseek-v3",
+            "model": "deepseek-ai/DeepSeek-V3",
             "input": {"messages": [{"role": "user", "content": "你好"}]},
             "parameters": {"top_p": "a"},  # Invalid type
         }
         response = make_request(payload)
 
-        # 验证状态码不应为 500
-        assert (
-            response.status_code != 500
-        ), "Should not return 500 for invalid parameter type"
         assert response.status_code == 400
-
         data = response.json()
-        assert "InvalidParameter" in data.get(
-            "code", ""
-        ) or "InvalidParameter" in data.get("message", "")
+        assert "InvalidParameter" in data.get("code", "") or "InvalidParameter" in data.get("message", "")
 
     @pytest.mark.parametrize("top_p_value", [0, 0.0])
     def test_invalid_parameter_range_top_p(self, top_p_value):
         """
-        Case: pre-siliconflow-deepseek-v3.1 top_p取值范围 (0, 1.0]。
-        测试边界值 0，预期报错。
-        URL: /siliconflow/models/pre-siliconflow/deepseek-v3.1
+        Case: top_p取值范围 (0, 1.0]。测试边界值 0。
         """
         payload = {
-            "model": "pre-siliconflow/deepseek-v3.1",
+            "model": "deepseek-ai/DeepSeek-V3.1",
             "input": {"messages": [{"role": "user", "content": "你好"}]},
             "parameters": {"top_p": top_p_value},
         }
         response = make_request(payload)
 
-        assert response.status_code == 400, f"top_p={top_p_value} should be invalid"
+        assert response.status_code == 400
         data = response.json()
         assert "Range of top_p should be" in data.get("message", "")
 
     def test_invalid_parameter_range_temperature(self):
         """
-        Case: pre-siliconflow-deepseek-v3.1 temperature 取值范围 [0, 2]。
-        测试值 2.1，预期报错。
+        Case: temperature 取值范围 [0, 2]。测试值 2.1。
         """
         payload = {
-            "model": "pre-siliconflow/deepseek-v3.1",
+            "model": "deepseek-ai/DeepSeek-V3.1",
             "input": {"messages": [{"role": "user", "content": "你好"}]},
             "parameters": {"temperature": 2.1},
         }
@@ -165,17 +179,16 @@ def test_invalid_parameter_range_temperature(self):
 
 class TestDeepSeekR1Specifics:
     """
-    针对 R1 模型的特定测试用例
+    针对 R1 模型的特定测试用例 (Reasoning Models)
     """
 
     def test_r1_usage_structure(self):
         """
-        Case: .usage.output_tokens_details 该路径下不应该返回 text_tokens 字段。
-        R1 模型推理侧可能没有 text_tokens。
-        URL: /siliconflow/models/pre-siliconflow/deepseek-r1
+        Case: R1 模型不应该返回 text_tokens，应该返回 reasoning_tokens。
+        URL: .../deepseek-ai/DeepSeek-R1
         """
         payload = {
-            "model": "pre-siliconflow/deepseek-r1",
+            "model": "deepseek-ai/DeepSeek-R1",
             "input": {"messages": [{"role": "user", "content": "你好"}]},
             "parameters": {},
         }
@@ -188,22 +201,19 @@ def test_r1_usage_structure(self):
         final_usage = frames[-1].usage
 
         output_details = final_usage.get("output_tokens_details", {})
-        # 验证 output_tokens_details 存在
         assert output_details, "output_tokens_details missing"
-        # 验证不包含 text_tokens (根据表格描述这是预期行为)
-        assert (
-            "text_tokens" not in output_details
-        ), "R1 usage should not contain text_tokens"
+
+        # 验证不包含 text_tokens (R1 特性)
+        assert "text_tokens" not in output_details, "R1 usage should not contain text_tokens"
         # 验证包含 reasoning_tokens
         assert "reasoning_tokens" in output_details
 
     def test_r1_enable_thinking_parameter_error(self):
         """
-        Case: r1传了 enable_thinking 报错。
-        预期: 400 Value error, current model does not support parameter `enable_thinking`.
+        Case: R1 原生支持思考，显式传递 enable_thinking=True 应报错。
         """
         payload = {
-            "model": "pre-siliconflow/deepseek-r1",
+            "model": "deepseek-ai/DeepSeek-R1",
             "input": {"messages": [{"role": "user", "content": "你好"}]},
             "parameters": {"enable_thinking": True},
         }
@@ -216,17 +226,15 @@ def test_r1_enable_thinking_parameter_error(self):
 
 class TestAdvancedFeatures:
     """
-    复杂场景：前缀续写、历史消息包含 ToolCall 等
+    复杂场景：前缀续写、ToolCall 格式校验等
     """
 
     def test_prefix_completion_thinking_conflict(self):
         """
         Case: 思考模式下(enable_thinking=true)，不支持前缀续写(partial=true)。
-        预期返回: 400 InvalidParameter.
-        URL: /siliconflow/models/pre-siliconflow/deepseek-v3.2
         """
         payload = {
-            "model": "pre-siliconflow/deepseek-v3.2",
+            "model": "deepseek-ai/DeepSeek-V3.2",
             "input": {
                 "messages": [
                     {"role": "user", "content": "你好"},
@@ -239,69 +247,22 @@ def test_prefix_completion_thinking_conflict(self):
 
         assert response.status_code == 400
         data = response.json()
-        assert "Partial mode is not supported when enable_thinking is true" in data.get(
-            "message", ""
-        )
-
-    def test_history_with_tool_calls(self):
-        """
-        Case: 3.1和3.2 message中包含历史 tool_call 调用信息曾报 5xx。
-        预期: 200 OK。
-        """
-        payload = {
-            "model": "pre-siliconflow/deepseek-v3.2",
-            "input": {
-                "messages": [
-                    {
-                        "role": "system",
-                        "content": "你是一个为智能助手。请使用简洁、自然、适合朗读的中文回答",
-                    },
-                    {"role": "user", "content": "外部轴设置"},
-                    {
-                        "role": "assistant",
-                        "tool_calls": [
-                            {
-                                "function": {
-                                    "arguments": '{"input_text": "外部轴设置"}',
-                                    "name": "KB20250625001",
-                                },
-                                "id": "call_6478091069c2448b83f38e",
-                                "type": "function",
-                            }
-                        ],
-                    },
-                    {
-                        "role": "tool",
-                        "content": "界面用于用户进行快速配置。",
-                        "tool_call_id": "call_6478091069c2448b83f38e",
-                    },
-                ]
-            },
-            "parameters": {"enable_thinking": True},
-        }
-        response = make_request(payload)
+        assert "Partial mode is not supported when enable_thinking is true" in data.get("message", "")
 
-        # 核心验证：不能崩 (500)
-        assert (
-            response.status_code != 500
-        ), "Server returned 500 for history with tool calls"
-        assert response.status_code == 200
-
-    def test_r1_tool_call_format_wrapping(self):
+    def test_r1_tool_choice_conflict(self):
         """
-        Case: Error code: 400, _sse_http_status: 500 (Wrappping error).
-        Input should be 'none', 'auto' or 'required'.
-        验证 R1 对 result_format='message' 和 tool_choice 的组合处理。
+        Case: R1 模型下，enable_thinking (或原生 R1) 开启时，不支持具体的 tool_choice 字典绑定。
         """
         payload = {
-            "model": "pre-siliconflow/deepseek-r1",
+            "model": "deepseek-ai/DeepSeek-R1",
             "input": {
                 "messages": [
                     {"role": "user", "content": "What is the weather like in Boston?"}
                 ]
             },
             "parameters": {
                 "result_format": "message",
+                # R1 logic usually prevents enforcing a specific tool via dict when thinking is active
                 "tool_choice": {
                     "type": "function",
                     "function": {"name": "get_current_weather"},
@@ -312,7 +273,12 @@ def test_r1_tool_call_format_wrapping(self):
 
         response = make_request(payload)
 
+        # Expecting 400 because R1 + Specific Tool Choice is often restricted in this proxy logic
         if response.status_code != 200:
+            assert response.status_code == 400
             error_data = response.json()
-            assert response.status_code != 500
-            assert error_data.get("code") != "InternalError"
+            assert "DeepSeek R1 does not support specific tool_choice" in error_data.get("message", "")
+
+if __name__ == "__main__":
+    # 如果直接运行此脚本，可以使用 pytest 调起
+    pytest.main(["-v", __file__])