open-telemetry
diff --git a/cassettes/test_tool_events_no_content b/cassettes/test_tool_events_no_content
Lines changed: 83 additions & 0 deletions
diff --git a/cassettes/test_tool_events_no_content.yaml b/cassettes/test_tool_events_no_content.yaml
Lines changed: 83 additions & 0 deletions
diff --git a/instrumentation-genai/opentelemetry-instrumentation-vertexai/src/opentelemetry/instrumentation/vertexai/__init__.py b/instrumentation-genai/opentelemetry-instrumentation-vertexai/src/opentelemetry/instrumentation/vertexai/__init__.py
Lines changed: 6 additions & 0 deletions
diff --git a/instrumentation-genai/opentelemetry-instrumentation-vertexai/src/opentelemetry/instrumentation/vertexai/patch.py b/instrumentation-genai/opentelemetry-instrumentation-vertexai/src/opentelemetry/instrumentation/vertexai/patch.py
Lines changed: 77 additions & 29 deletions
@@ -0,0 +1,83 @@
+interactions:
+- request:
+    body: "{\n  \"contents\": [\n    {\n      \"role\": \"user\",\n      \"parts\":
+      [\n        {\n          \"text\": \"Get weather details in New Delhi and San
+      Francisco?\"\n        }\n      ]\n    },\n    {\n      \"role\": \"model\",\n
+      \     \"parts\": [\n        {\n          \"functionCall\": {\n            \"name\":
+      \"get_current_weather\",\n            \"args\": {\n              \"location\":
+      \"New Delhi\"\n            }\n          }\n        },\n        {\n          \"functionCall\":
+      {\n            \"name\": \"get_current_weather\",\n            \"args\": {\n
+      \             \"location\": \"San Francisco\"\n            }\n          }\n
+      \       }\n      ]\n    },\n    {\n      \"role\": \"user\",\n      \"parts\":
+      [\n        {\n          \"functionResponse\": {\n            \"name\": \"get_current_weather\",\n
+      \           \"response\": {\n              \"content\": \"{\\\"temperature\\\":
+      35, \\\"unit\\\": \\\"C\\\"}\"\n            }\n          }\n        },\n        {\n
+      \         \"functionResponse\": {\n            \"name\": \"get_current_weather\",\n
+      \           \"response\": {\n              \"content\": \"{\\\"temperature\\\":
+      25, \\\"unit\\\": \\\"C\\\"}\"\n            }\n          }\n        }\n      ]\n
+      \   }\n  ],\n  \"tools\": [\n    {\n      \"functionDeclarations\": [\n        {\n
+      \         \"name\": \"get_current_weather\",\n          \"description\": \"Get
+      the current weather in a given location\",\n          \"parameters\": {\n            \"type\":
+      6,\n            \"properties\": {\n              \"location\": {\n                \"type\":
+      1,\n                \"description\": \"The location for which to get the weather.
+      It can be a city name, a city name and state, or a zip code. Examples: 'San
+      Francisco', 'San Francisco, CA', '95616', etc.\"\n              }\n            },\n
+      \           \"propertyOrdering\": [\n              \"location\"\n            ]\n
+      \         }\n        }\n      ]\n    }\n  ]\n}"
+    headers:
+      Accept:
+      - '*/*'
+      Accept-Encoding:
+      - gzip, deflate
+      Connection:
+      - keep-alive
+      Content-Length:
+      - '1731'
+      Content-Type:
+      - application/json
+      User-Agent:
+      - python-requests/2.32.3
+      x-goog-api-client:
+      - model-builder/1.79.0+top_google_constructor_method+vertexai.generative_models.GenerativeModel.generate_content
+        gl-python/3.11.9 grpc/1.68.1 gax/2.23.0 gapic/1.79.0+top_google_constructor_method+vertexai.generative_models.GenerativeModel.generate_content
+      x-goog-request-params:
+      - model=projects/fake-project/locations/us-central1/publishers/google/models/gemini-2.5-pro
+    method: POST
+    uri: https://us-central1-aiplatform.googleapis.com/v1/projects/fake-project/locations/us-central1/publishers/google/models/gemini-2.5-pro:generateContent?%24alt=json%3Benum-encoding%3Dint
+  response:
+    body:
+      string: !!binary |
+        H4sIAAAAAAAC/91TwU7rMBC89ytWPRcHECdOVG3EqwQFkXJCCBlnSRccb7A3BYT679ghQODAgeM7
+        OTueHc+OndcRwBi9Zz8+hNdYxNJwibE62N2bvAM1hqCrhI0v8LHFIEABagqBXAU+QuSxBN3KGp2Q
+        0ULswEQsldoqyJ8bNBI5Z9NIgn3QxkRREH5ANwHLFcUG5gdCYA8chTxstKVfVQtEWIs04TDLStyg
+        5QZ9UBVzZVEZrjPquPKSBarcDrnsCW8T1bALbHGn8XwfjalxP2kQLW1Ig14up5erf/lytZhNV/n8
+        g1CiaLKJcdUB0IfWbR7JS9OllNbehm4odFZ6V74xao63bbVwd9yrDpT/54z7WbeTvyeXp5f6MzmP
+        OrBL3bOLfJ6ubHpS3JwuimKxPP4WMdeaOuL3E4acOl5DqUV//g5f+JrLr15lLLel0tRYLXfsa7XZ
+        U+cxODIpwwL9hgyqY3ToteCMncSYBiel1/ZOSqIDnR/ePhu2o+F6PUpf29EbabJOVcEDAAA=
+    headers:
+      Content-Encoding:
+      - gzip
+      Content-Type:
+      - application/json; charset=UTF-8
+      Date:
+      - Tue, 30 Sep 2025 15:26:53 GMT
+      Server:
+      - scaffolding on HTTPServer2
+      Transfer-Encoding:
+      - chunked
+      Vary:
+      - Origin
+      - X-Origin
+      - Referer
+      WWW-Authenticate:
+      - Bearer realm="https://accounts.google.com/"
+      X-Content-Type-Options:
+      - nosniff
+      X-Frame-Options:
+      - SAMEORIGIN
+      X-XSS-Protection:
+      - '0'
+    status:
+      code: 401
+      message: Unauthorized
+version: 1
@@ -0,0 +1,83 @@
+interactions:
+- request:
+    body: "{\n  \"contents\": [\n    {\n      \"role\": \"user\",\n      \"parts\":
+      [\n        {\n          \"text\": \"Get weather details in New Delhi and San
+      Francisco?\"\n        }\n      ]\n    },\n    {\n      \"role\": \"model\",\n
+      \     \"parts\": [\n        {\n          \"functionCall\": {\n            \"name\":
+      \"get_current_weather\",\n            \"args\": {\n              \"location\":
+      \"New Delhi\"\n            }\n          }\n        },\n        {\n          \"functionCall\":
+      {\n            \"name\": \"get_current_weather\",\n            \"args\": {\n
+      \             \"location\": \"San Francisco\"\n            }\n          }\n
+      \       }\n      ]\n    },\n    {\n      \"role\": \"user\",\n      \"parts\":
+      [\n        {\n          \"functionResponse\": {\n            \"name\": \"get_current_weather\",\n
+      \           \"response\": {\n              \"content\": \"{\\\"temperature\\\":
+      35, \\\"unit\\\": \\\"C\\\"}\"\n            }\n          }\n        },\n        {\n
+      \         \"functionResponse\": {\n            \"name\": \"get_current_weather\",\n
+      \           \"response\": {\n              \"content\": \"{\\\"temperature\\\":
+      25, \\\"unit\\\": \\\"C\\\"}\"\n            }\n          }\n        }\n      ]\n
+      \   }\n  ],\n  \"tools\": [\n    {\n      \"functionDeclarations\": [\n        {\n
+      \         \"name\": \"get_current_weather\",\n          \"description\": \"Get
+      the current weather in a given location\",\n          \"parameters\": {\n            \"type\":
+      6,\n            \"properties\": {\n              \"location\": {\n                \"type\":
+      1,\n                \"description\": \"The location for which to get the weather.
+      It can be a city name, a city name and state, or a zip code. Examples: 'San
+      Francisco', 'San Francisco, CA', '95616', etc.\"\n              }\n            },\n
+      \           \"propertyOrdering\": [\n              \"location\"\n            ]\n
+      \         }\n        }\n      ]\n    }\n  ]\n}"
+    headers:
+      Accept:
+      - '*/*'
+      Accept-Encoding:
+      - gzip, deflate
+      Connection:
+      - keep-alive
+      Content-Length:
+      - '1731'
+      Content-Type:
+      - application/json
+      User-Agent:
+      - python-requests/2.32.3
+      x-goog-api-client:
+      - model-builder/1.79.0+top_google_constructor_method+vertexai.generative_models.GenerativeModel.generate_content
+        gl-python/3.11.9 grpc/1.68.1 gax/2.23.0 gapic/1.79.0+top_google_constructor_method+vertexai.generative_models.GenerativeModel.generate_content
+      x-goog-request-params:
+      - model=projects/fake-project/locations/us-central1/publishers/google/models/gemini-2.5-pro
+    method: POST
+    uri: https://us-central1-aiplatform.googleapis.com/v1/projects/fake-project/locations/us-central1/publishers/google/models/gemini-2.5-pro:generateContent?%24alt=json%3Benum-encoding%3Dint
+  response:
+    body:
+      string: !!binary |
+        H4sIAAAAAAAC/91TwU7rMBC89ytWPRcHECdOVG3EqwQFkXJCCBlnSRccb7A3BYT679ghQODAgeM7
+        OTueHc+OndcRwBi9Zz8+hNdYxNJwibE62N2bvAM1hqCrhI0v8LHFIEABagqBXAU+QuSxBN3KGp2Q
+        0ULswEQsldoqyJ8bNBI5Z9NIgn3QxkRREH5ANwHLFcUG5gdCYA8chTxstKVfVQtEWIs04TDLStyg
+        5QZ9UBVzZVEZrjPquPKSBarcDrnsCW8T1bALbHGn8XwfjalxP2kQLW1Ig14up5erf/lytZhNV/n8
+        g1CiaLKJcdUB0IfWbR7JS9OllNbehm4odFZ6V74xao63bbVwd9yrDpT/54z7WbeTvyeXp5f6MzmP
+        OrBL3bOLfJ6ubHpS3JwuimKxPP4WMdeaOuL3E4acOl5DqUV//g5f+JrLr15lLLel0tRYLXfsa7XZ
+        U+cxODIpwwL9hgyqY3ToteCMncSYBiel1/ZOSqIDnR/ePhu2o+F6PUpf29EbabJOVcEDAAA=
+    headers:
+      Content-Encoding:
+      - gzip
+      Content-Type:
+      - application/json; charset=UTF-8
+      Date:
+      - Tue, 30 Sep 2025 15:27:34 GMT
+      Server:
+      - scaffolding on HTTPServer2
+      Transfer-Encoding:
+      - chunked
+      Vary:
+      - Origin
+      - X-Origin
+      - Referer
+      WWW-Authenticate:
+      - Bearer realm="https://accounts.google.com/"
+      X-Content-Type-Options:
+      - nosniff
+      X-Frame-Options:
+      - SAMEORIGIN
+      X-XSS-Protection:
+      - '0'
+    status:
+      code: 401
+      message: Unauthorized
+version: 1
@@ -60,6 +60,7 @@
 from opentelemetry.instrumentation.vertexai.utils import is_content_enabled
 from opentelemetry.semconv.schemas import Schemas
 from opentelemetry.trace import get_tracer
+from opentelemetry.util.genai.completion_hook import load_completion_hook
 
 
 def _methods_to_wrap(
@@ -109,6 +110,9 @@ def instrumentation_dependencies(self) -> Collection[str]:
 
     def _instrument(self, **kwargs: Any):
         """Enable VertexAI instrumentation."""
+        completion_hook = (
+            kwargs.get("completion_hook") or load_completion_hook()
+        )
         sem_conv_opt_in_mode = _OpenTelemetrySemanticConventionStability._get_opentelemetry_stability_opt_in_mode(
             _OpenTelemetryStabilitySignalType.GEN_AI,
         )
@@ -141,6 +145,7 @@ def _instrument(self, **kwargs: Any):
                 event_logger,
                 is_content_enabled(sem_conv_opt_in_mode),
                 sem_conv_opt_in_mode,
+                completion_hook,
             )
         elif sem_conv_opt_in_mode == _StabilityMode.GEN_AI_LATEST_EXPERIMENTAL:
             # Type checker now knows it's the other literal
@@ -149,6 +154,7 @@ def _instrument(self, **kwargs: Any):
                 event_logger,
                 is_content_enabled(sem_conv_opt_in_mode),
                 sem_conv_opt_in_mode,
+                completion_hook,
             )
         else:
             raise RuntimeError(f"{sem_conv_opt_in_mode} mode not supported")
 
@@ -14,7 +14,9 @@
 
 from __future__ import annotations
 
+import json
 from contextlib import contextmanager
+from dataclasses import asdict
 from typing import (
     TYPE_CHECKING,
     Any,
@@ -27,13 +29,14 @@
     overload,
 )
 
-from opentelemetry._events import EventLogger
+from opentelemetry._events import Event, EventLogger
 from opentelemetry.instrumentation._semconv import (
     _StabilityMode,
 )
 from opentelemetry.instrumentation.vertexai.utils import (
     GenerateContentParams,
-    create_operation_details_event,
+    convert_content_to_message,
+    convert_response_to_output_messages,
     get_genai_request_attributes,
     get_genai_response_attributes,
     get_server_attributes,
@@ -45,7 +48,11 @@
     gen_ai_attributes as GenAI,
 )
 from opentelemetry.trace import SpanKind, Tracer
-from opentelemetry.util.genai.types import ContentCapturingMode
+from opentelemetry.util.genai.completion_hook import CompletionHook
+from opentelemetry.util.genai.types import (
+    ContentCapturingMode,
+    Text,
+)
 
 if TYPE_CHECKING:
     from google.cloud.aiplatform_v1.services.prediction_service import client
@@ -113,6 +120,7 @@ def __init__(
         sem_conv_opt_in_mode: Literal[
             _StabilityMode.GEN_AI_LATEST_EXPERIMENTAL
         ],
+        completion_hook: CompletionHook,
     ) -> None: ...
 
     @overload
@@ -122,6 +130,7 @@ def __init__(
         event_logger: EventLogger,
         capture_content: bool,
         sem_conv_opt_in_mode: Literal[_StabilityMode.DEFAULT],
+        completion_hook: CompletionHook,
     ) -> None: ...
 
     def __init__(
@@ -133,11 +142,13 @@ def __init__(
             Literal[_StabilityMode.DEFAULT],
             Literal[_StabilityMode.GEN_AI_LATEST_EXPERIMENTAL],
         ],
+        completion_hook: CompletionHook,
     ) -> None:
         self.tracer = tracer
         self.event_logger = event_logger
         self.capture_content = capture_content
         self.sem_conv_opt_in_mode = sem_conv_opt_in_mode
+        self.completion_hook = completion_hook
 
     @contextmanager
     def _with_new_instrumentation(
@@ -149,11 +160,9 @@ def _with_new_instrumentation(
         kwargs: Any,
     ):
         params = _extract_params(*args, **kwargs)
-        api_endpoint: str = instance.api_endpoint  # type: ignore[reportUnknownMemberType]
         request_attributes = get_genai_request_attributes(True, params)
-        server_attributes = get_server_attributes(api_endpoint)
         with self.tracer.start_as_current_span(
-            name=f"{GenAI.GenAiOperationNameValues.CHAT.value} {request_attributes.get(GenAI.GEN_AI_REQUEST_MODEL, '')}",
+            name=f"{GenAI.GenAiOperationNameValues.CHAT.value} {request_attributes.get(GenAI.GEN_AI_REQUEST_MODEL, '')}".strip(),
             kind=SpanKind.CLIENT,
         ) as span:
 
@@ -162,30 +171,69 @@ def handle_response(
                 | prediction_service_v1beta1.GenerateContentResponse
                 | None,
             ) -> None:
-                response_attributes = (
-                    {}
-                    if not response
-                    else get_genai_response_attributes(response)
+                attributes = (
+                    get_server_attributes(instance.api_endpoint)  # type: ignore[reportUnknownMemberType]
+                    | request_attributes
+                    | get_genai_response_attributes(response)
                 )
-                if span.is_recording() and response:
-                    # When streaming, this is called multiple times so attributes would be
-                    # overwritten. In practice, it looks the API only returns the interesting
-                    # attributes on the last streamed response. However, I couldn't find
-                    # documentation for this and setting attributes shouldn't be too expensive.
-                    span.set_attributes(
-                        **response_attributes,
-                        **server_attributes,
-                        **request_attributes,
-                    )
-                # event = Event(name="gen_ai.client.inference.operation.details")
-
-                self.event_logger.emit(
-                    create_operation_details_event(
-                        api_endpoint=api_endpoint,
-                        params=params,
-                        capture_content=capture_content,
-                        response=response,
-                    )
+                system_instructions, inputs, outputs = [], [], []
+                if params.system_instruction:
+                    system_instructions = [
+                        Text(
+                            content="\n".join(
+                                part.text
+                                for part in params.system_instruction.parts
+                            )
+                        )
+                    ]
+                if params.contents:
+                    inputs = [
+                        convert_content_to_message(content)
+                        for content in params.contents
+                    ]
+                if response:
+                    outputs = convert_response_to_output_messages(response)
+                content = {
+                    k: [asdict(x) for x in v]
+                    for k, v in [
+                        (
+                            GenAI.GEN_AI_SYSTEM_INSTRUCTIONS,
+                            system_instructions,
+                        ),
+                        (GenAI.GEN_AI_INPUT_MESSAGES, inputs),
+                        (GenAI.GEN_AI_OUTPUT_MESSAGES, outputs),
+                    ]
+                    if v
+                }
+                if span.is_recording():
+                    span.set_attributes(attributes)
+                    if capture_content in frozenset(
+                        [
+                            ContentCapturingMode.SPAN_AND_EVENT,
+                            ContentCapturingMode.SPAN_ONLY,
+                        ]
+                    ):
+                        span.set_attributes(
+                            {k: json.dumps(v) for k, v in content.items()}
+                        )
+                event = Event(
+                    name="gen_ai.client.inference.operation.details",
+                )
+                event.attributes = attributes
+                if capture_content in frozenset(
+                    [
+                        ContentCapturingMode.SPAN_AND_EVENT,
+                        ContentCapturingMode.EVENT_ONLY,
+                    ]
+                ):
+                    event.attributes |= content
+                self.event_logger.emit(event)
+                self.completion_hook.on_completion(
+                    inputs=inputs,
+                    outputs=outputs,
+                    system_instruction=system_instructions,
+                    span=span,
+                    log_record=event,
                 )
 
             yield handle_response