fix: send thought signatures back to Vertex AI with function calls

fatelei · fatelei · commit 7da3afa18304 · 2026-01-08T18:07:33.000+08:00
diff --git a/models/vertex_ai/manifest.yaml b/models/vertex_ai/manifest.yaml
@@ -32,4 +32,4 @@ resource:
     tool:
       enabled: true
 type: plugin
-version: 0.0.34
+version: 0.0.35
diff --git a/models/vertex_ai/models/llm/llm.py b/models/vertex_ai/models/llm/llm.py
@@ -1,6 +1,7 @@
 import base64
 import io
 import json
+import logging
 import time
 from collections.abc import Generator, Sequence
 from typing import Optional, Union, cast
@@ -52,6 +53,8 @@
 # For more information about the models, please refer to https://ai.google.dev/gemini-api/docs/thinking
 DEFAULT_NO_THINKING_MODELS = ["gemini-2.5-flash-lite"]
 
+logger = logging.getLogger(__name__)
+
 
 class VertexAiLargeLanguageModel(LargeLanguageModel):
     def _invoke(
@@ -634,6 +637,12 @@ def _handle_generate_response(
                             ),
                         )
                         assistant_prompt_message.tool_calls.append(tool_call)
+                        # Capture thought_signature if the SDK surfaced it on the same part
+                        sig = self._extract_thought_signature(part)
+                        if sig:
+                            if not hasattr(self, "_last_function_call_signatures"):
+                                self._last_function_call_signatures = []
+                            self._last_function_call_signatures.append(sig)
                     # Check for text
                     elif hasattr(part, 'text') and part.text:
                         if part.thought is True and not is_thinking:
@@ -698,6 +707,12 @@ def _handle_generate_stream_response(
                             ),
                         )
                     )
+                    # Capture thought_signature if present on the streaming part
+                    sig = self._extract_thought_signature(part)
+                    if sig:
+                        if not hasattr(self, "_last_function_call_signatures"):
+                            self._last_function_call_signatures = []
+                        self._last_function_call_signatures.append(sig)
                 # Check for text
                 elif hasattr(part, 'text') and part.text:
                     if part.thought is True and not is_thinking:
@@ -774,6 +789,32 @@ def _handle_generate_stream_response(
                         ),
                     )
 
+    def _extract_thought_signature(self, part) -> Optional[str]:
+        """
+        Best-effort lookup of a thought signature on ``part``; returns it only when it is a
+        non-empty str, otherwise None. Errors in the dict fallback are logged and swallowed.
+        """
+        # Step 1: direct attributes, snake_case first, then camelCase
+        sig = getattr(part, "thought_signature", None) or getattr(part, "thoughtSignature", None)
+        if isinstance(sig, str) and sig:
+            return sig
+        # Step 2: fall back to a dict view: to_dict() when available, else the instance __dict__
+        try:
+            d = part.to_dict() if hasattr(part, "to_dict") else (getattr(part, "__dict__", {}) or {})
+            if isinstance(d, dict):
+                sig = d.get("thoughtSignature") or d.get("thought_signature")
+                if not sig:  # Step 3: nested extraContent/extra_content -> "google" -> "thought_signature"
+                    extra = d.get("extraContent") or d.get("extra_content") or {}
+                    if isinstance(extra, dict):
+                        g = extra.get("google")
+                        if isinstance(g, dict):
+                            sig = g.get("thought_signature")
+                if isinstance(sig, str) and sig:  # NOTE(review): non-str values (e.g. bytes) are dropped; confirm SDK type
+                    return sig
+        except Exception as e:  # best effort: log a warning with traceback and fall through to None
+            logger.warning(e, exc_info=True)
+        return None
+
     def _convert_one_message_to_text(self, message: PromptMessage) -> str:
         """
         Convert a single message to a string.
@@ -830,15 +871,20 @@ def _format_message_to_genai_content(self, message: PromptMessage) -> dict:
             return {"role": "user", "parts": parts}
         elif isinstance(message, AssistantPromptMessage):
             if message.tool_calls:
-                parts = [
-                    {
+                parts = []
+                for tool_call in message.tool_calls:
+                    part_dict = {
                         "function_call": {
                             "name": tool_call.function.name,
                             "args": json.loads(tool_call.function.arguments),
                         }
                     }
-                    for tool_call in message.tool_calls
-                ]
+                    # Attach thought_signature if we captured one from the previous model output
+                    if hasattr(self, "_last_function_call_signatures") and self._last_function_call_signatures:
+                        sig = self._last_function_call_signatures.pop(0)
+                        if sig:
+                            part_dict["thought_signature"] = sig
+                    parts.append(part_dict)
             else:
                 parts = [{"text": message.content}]
             return {"role": "model", "parts": parts}