Skip to content

Commit ad00198

Browse files
committed
WIP vertex tool calls
1 parent bf60da4 commit ad00198

File tree

6 files changed

+489
-9
lines changed

6 files changed

+489
-9
lines changed

instrumentation-genai/opentelemetry-instrumentation-vertexai/CHANGELOG.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,5 +15,5 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
1515
([#3208](https://github.com/open-telemetry/opentelemetry-python-contrib/pull/3208))
1616
- VertexAI emit user, system, and assistant events
1717
([#3203](https://github.com/open-telemetry/opentelemetry-python-contrib/pull/3203))
18-
- Add Vertex gen AI response span attributes
18+
- Add Vertex gen AI response attributes and `gen_ai.choice` events
1919
([#3227](https://github.com/open-telemetry/opentelemetry-python-contrib/pull/3227))

instrumentation-genai/opentelemetry-instrumentation-vertexai/src/opentelemetry/instrumentation/vertexai/events.py

Lines changed: 30 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -23,7 +23,7 @@
2323
from __future__ import annotations
2424

2525
from dataclasses import asdict, dataclass
26-
from typing import Literal
26+
from typing import Any, Iterable, Literal
2727

2828
from opentelemetry._events import Event
2929
from opentelemetry.semconv._incubating.attributes import gen_ai_attributes
@@ -104,36 +104,58 @@ class ChoiceMessage:
104104
role: str = "assistant"
105105

106106

107+
@dataclass
class ChoiceToolCall:
    """The tool_calls field for a gen_ai.choice event

    Each tool call carries an ``id``, a ``type`` (always ``"function"``),
    and a nested ``function`` describing the call itself.
    """

    @dataclass
    class Function:
        """The function field of a tool call: the function's name and arguments."""

        name: str
        # May be left as None; None-valued fields are dropped when the
        # event body is serialized (see _asdict_filter_nulls).
        arguments: AnyValue = None

    function: Function
    id: str
    type: Literal["function"] = "function"
119+
120+
107121
FinishReason = Literal[
    "content_filter", "error", "length", "stop", "tool_calls"
]


def choice_event(
    *,
    finish_reason: FinishReason | str,
    index: int,
    message: ChoiceMessage,
    tool_calls: Iterable[ChoiceToolCall] = (),
) -> Event:
    """Creates a choice event, which describes the Gen AI response message.

    https://github.com/open-telemetry/semantic-conventions/blob/v1.28.0/docs/gen-ai/gen-ai-events.md#event-gen_aichoice
    """
    # Serialize tool calls first; when there are none, the tool_calls key
    # is omitted from the body entirely rather than sent as an empty list.
    rendered_calls = [_asdict_filter_nulls(call) for call in tool_calls]

    body: dict[str, AnyValue] = {
        "finish_reason": finish_reason,
        "index": index,
        "message": _asdict_filter_nulls(message),
    }
    if rendered_calls:
        body["tool_calls"] = rendered_calls

    return Event(
        name="gen_ai.choice",
        attributes={
            gen_ai_attributes.GEN_AI_SYSTEM: gen_ai_attributes.GenAiSystemValues.VERTEX_AI.value,
        },
        body=body,
    )
155+
156+
157+
def _asdict_filter_nulls(instance: Any) -> dict[str, AnyValue]:
158+
return asdict(
159+
instance,
160+
dict_factory=lambda kvs: {k: v for (k, v) in kvs if v is not None},
161+
)

instrumentation-genai/opentelemetry-instrumentation-vertexai/src/opentelemetry/instrumentation/vertexai/utils.py

Lines changed: 34 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -26,9 +26,12 @@
2626
)
2727
from urllib.parse import urlparse
2828

29+
from google.protobuf import json_format
30+
2931
from opentelemetry._events import Event
3032
from opentelemetry.instrumentation.vertexai.events import (
3133
ChoiceMessage,
34+
ChoiceToolCall,
3235
FinishReason,
3336
assistant_event,
3437
choice_event,
@@ -231,6 +234,17 @@ def response_to_events(
231234
capture_content: bool,
232235
) -> Iterable[Event]:
233236
for candidate in response.candidates:
237+
# NOTE: since function_call appears in content.parts, it will also be in the choice
238+
# event. This is different from OpenAI where the tool calls are outside of content:
239+
# https://platform.openai.com/docs/api-reference/chat/object. I would prefer not to
240+
# filter from choice event to keep indexing obvious.
241+
#
242+
# There is similarly a pair of executable_code and
243+
# code_execution_result which are similar to tool call in that the model is asking for
244+
# you to do something rather than generating content:
245+
# https://github.com/googleapis/googleapis/blob/ae87dc8a3830f37d575e2cff577c9b5a4737176b/google/cloud/aiplatform/v1beta1/content.proto#L123-L128
246+
tool_calls = _extract_tool_calls(candidate)
247+
234248
yield choice_event(
235249
finish_reason=_map_finish_reason(candidate.finish_reason),
236250
index=candidate.index,
@@ -242,6 +256,26 @@ def response_to_events(
242256
parts=candidate.content.parts,
243257
),
244258
),
259+
tool_calls=tool_calls,
260+
)
261+
262+
263+
def _extract_tool_calls(
    candidate: content.Candidate | content_v1beta1.Candidate,
) -> Iterable[ChoiceToolCall]:
    """Yield a ChoiceToolCall for each function_call part in the candidate.

    Parts that do not contain a function_call (e.g. plain text parts) are
    skipped.
    """
    for part in candidate.content.parts:
        if "function_call" not in part:
            continue

        yield ChoiceToolCall(
            # NOTE: Vertex does not return a tool call id, but the field is
            # required, so send an empty string.
            id="",
            function=ChoiceToolCall.Function(
                name=part.function_call.name,
                # Convert the protobuf Struct of arguments into a plain
                # JSON-compatible dict for the event body.
                arguments=json_format.MessageToDict(
                    part.function_call._pb.args  # type: ignore[reportUnknownMemberType]
                ),
            ),
        )
246280

247281

Lines changed: 119 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,119 @@
1+
interactions:
2+
- request:
3+
body: |-
4+
{
5+
"contents": [
6+
{
7+
"role": "user",
8+
"parts": [
9+
{
10+
"text": "Get weather details in New Delhi and San Francisco?"
11+
}
12+
]
13+
}
14+
],
15+
"tools": [
16+
{
17+
"functionDeclarations": [
18+
{
19+
"name": "get_current_weather",
20+
"description": "Get the current weather in a given location",
21+
"parameters": {
22+
"type": 6,
23+
"properties": {
24+
"location": {
25+
"type": 1,
26+
"description": "The location for which to get the weather. It can be a city name, a city name and state, or a zip code. Examples: 'San Francisco', 'San Francisco, CA', '95616', etc."
27+
}
28+
},
29+
"propertyOrdering": [
30+
"location"
31+
]
32+
}
33+
}
34+
]
35+
}
36+
]
37+
}
38+
headers:
39+
Accept:
40+
- '*/*'
41+
Accept-Encoding:
42+
- gzip, deflate
43+
Connection:
44+
- keep-alive
45+
Content-Length:
46+
- '824'
47+
Content-Type:
48+
- application/json
49+
User-Agent:
50+
- python-requests/2.32.3
51+
method: POST
52+
uri: https://us-central1-aiplatform.googleapis.com/v1/projects/fake-project/locations/us-central1/publishers/google/models/gemini-1.5-flash-002:generateContent?%24alt=json%3Benum-encoding%3Dint
53+
response:
54+
body:
55+
string: |-
56+
{
57+
"candidates": [
58+
{
59+
"content": {
60+
"role": "model",
61+
"parts": [
62+
{
63+
"functionCall": {
64+
"name": "get_current_weather",
65+
"args": {
66+
"location": "New Delhi"
67+
}
68+
}
69+
},
70+
{
71+
"functionCall": {
72+
"name": "get_current_weather",
73+
"args": {
74+
"location": "San Francisco"
75+
}
76+
}
77+
}
78+
]
79+
},
80+
"finishReason": 1,
81+
"avgLogprobs": -0.00018195244774688035
82+
}
83+
],
84+
"usageMetadata": {
85+
"promptTokenCount": 72,
86+
"candidatesTokenCount": 16,
87+
"totalTokenCount": 88,
88+
"promptTokensDetails": [
89+
{
90+
"modality": 1,
91+
"tokenCount": 72
92+
}
93+
],
94+
"candidatesTokensDetails": [
95+
{
96+
"modality": 1,
97+
"tokenCount": 16
98+
}
99+
]
100+
},
101+
"modelVersion": "gemini-1.5-flash-002",
102+
"createTime": "2025-02-04T03:52:01.562155Z",
103+
"responseId": "4Y6hZ-unIrfQnvgPr73XgA0"
104+
}
105+
headers:
106+
Content-Type:
107+
- application/json; charset=UTF-8
108+
Transfer-Encoding:
109+
- chunked
110+
Vary:
111+
- Origin
112+
- X-Origin
113+
- Referer
114+
content-length:
115+
- '1029'
116+
status:
117+
code: 200
118+
message: OK
119+
version: 1
Lines changed: 119 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,119 @@
1+
interactions:
2+
- request:
3+
body: |-
4+
{
5+
"contents": [
6+
{
7+
"role": "user",
8+
"parts": [
9+
{
10+
"text": "Get weather details in New Delhi and San Francisco?"
11+
}
12+
]
13+
}
14+
],
15+
"tools": [
16+
{
17+
"functionDeclarations": [
18+
{
19+
"name": "get_current_weather",
20+
"description": "Get the current weather in a given location",
21+
"parameters": {
22+
"type": 6,
23+
"properties": {
24+
"location": {
25+
"type": 1,
26+
"description": "The location for which to get the weather. It can be a city name, a city name and state, or a zip code. Examples: 'San Francisco', 'San Francisco, CA', '95616', etc."
27+
}
28+
},
29+
"propertyOrdering": [
30+
"location"
31+
]
32+
}
33+
}
34+
]
35+
}
36+
]
37+
}
38+
headers:
39+
Accept:
40+
- '*/*'
41+
Accept-Encoding:
42+
- gzip, deflate
43+
Connection:
44+
- keep-alive
45+
Content-Length:
46+
- '824'
47+
Content-Type:
48+
- application/json
49+
User-Agent:
50+
- python-requests/2.32.3
51+
method: POST
52+
uri: https://us-central1-aiplatform.googleapis.com/v1/projects/fake-project/locations/us-central1/publishers/google/models/gemini-1.5-flash-002:generateContent?%24alt=json%3Benum-encoding%3Dint
53+
response:
54+
body:
55+
string: |-
56+
{
57+
"candidates": [
58+
{
59+
"content": {
60+
"role": "model",
61+
"parts": [
62+
{
63+
"functionCall": {
64+
"name": "get_current_weather",
65+
"args": {
66+
"location": "New Delhi"
67+
}
68+
}
69+
},
70+
{
71+
"functionCall": {
72+
"name": "get_current_weather",
73+
"args": {
74+
"location": "San Francisco"
75+
}
76+
}
77+
}
78+
]
79+
},
80+
"finishReason": 1,
81+
"avgLogprobs": -0.00018187805835623294
82+
}
83+
],
84+
"usageMetadata": {
85+
"promptTokenCount": 72,
86+
"candidatesTokenCount": 16,
87+
"totalTokenCount": 88,
88+
"promptTokensDetails": [
89+
{
90+
"modality": 1,
91+
"tokenCount": 72
92+
}
93+
],
94+
"candidatesTokensDetails": [
95+
{
96+
"modality": 1,
97+
"tokenCount": 16
98+
}
99+
]
100+
},
101+
"modelVersion": "gemini-1.5-flash-002",
102+
"createTime": "2025-02-04T22:05:24.282269Z",
103+
"responseId": "JI-iZ52dEeWI3NoP39Od0Qg"
104+
}
105+
headers:
106+
Content-Type:
107+
- application/json; charset=UTF-8
108+
Transfer-Encoding:
109+
- chunked
110+
Vary:
111+
- Origin
112+
- X-Origin
113+
- Referer
114+
content-length:
115+
- '1029'
116+
status:
117+
code: 200
118+
message: OK
119+
version: 1

0 commit comments

Comments
 (0)