Skip to content

Commit a7b4add

Browse files
committed
Working OK patching the generate_content() method
1 parent 8fa6dda commit a7b4add

File tree

4 files changed

+250
-4
lines changed

4 files changed

+250
-4
lines changed

instrumentation-genai/opentelemetry-instrumentation-vertexai/examples/zero-code/main.py

Lines changed: 5 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,12 +1,15 @@
11
import vertexai
2-
from vertexai.generative_models import GenerativeModel
2+
from vertexai.generative_models import GenerationConfig, GenerativeModel
33

44

55
def main():
    """Send one prompt to Gemini and print the reply (zero-code example)."""
    vertexai.init()
    model = GenerativeModel("gemini-1.5-flash-002")
    # Explicit generation options so the instrumentation has request
    # attributes (top_k, top_p, temperature, stop sequences) to record.
    config = GenerationConfig(
        top_k=2, top_p=0.95, temperature=0.2, stop_sequences=["\n\n\n"]
    )
    response = model.generate_content(
        "Write a short poem on OpenTelemetry.",
        generation_config=config,
    )
    print(response.text)
1215

instrumentation-genai/opentelemetry-instrumentation-vertexai/src/opentelemetry/instrumentation/vertexai/__init__.py

Lines changed: 18 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -41,9 +41,17 @@
4141

4242
from typing import Any, Collection
4343

44+
from wrapt import (
45+
wrap_function_wrapper, # type: ignore[reportUnknownVariableType]
46+
)
47+
4448
from opentelemetry._events import get_event_logger
49+
from opentelemetry.instrumentation.genai_utils import is_content_enabled
4550
from opentelemetry.instrumentation.instrumentor import BaseInstrumentor
4651
from opentelemetry.instrumentation.vertexai.package import _instruments
52+
from opentelemetry.instrumentation.vertexai.patch import (
53+
generate_content_create,
54+
)
4755
from opentelemetry.semconv.schemas import Schemas
4856
from opentelemetry.trace import get_tracer
4957

@@ -55,20 +63,28 @@ def instrumentation_dependencies(self) -> Collection[str]:
5563
def _instrument(self, **kwargs: Any):
    """Enable VertexAI instrumentation.

    Patches `_GenerativeModel.generate_content` with a tracing wrapper
    built from the configured tracer and event logger.
    """
    event_logger = get_event_logger(
        __name__,
        "",
        schema_url=Schemas.V1_28_0.value,
        event_logger_provider=kwargs.get("event_logger_provider"),
    )
    tracer = get_tracer(
        __name__,
        "",
        kwargs.get("tracer_provider"),
        schema_url=Schemas.V1_28_0.value,
    )
    wrap_function_wrapper(
        module="vertexai.generative_models._generative_models",
        name="_GenerativeModel.generate_content",
        wrapper=generate_content_create(
            tracer, event_logger, is_content_enabled()
        ),
    )
7389
def _uninstrument(self, **kwargs: Any) -> None:
    """Remove VertexAI instrumentation (TODO: implemented in later PR)."""

instrumentation-genai/opentelemetry-instrumentation-vertexai/src/opentelemetry/instrumentation/vertexai/patch.py

Lines changed: 99 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -11,3 +11,102 @@
1111
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
1212
# See the License for the specific language governing permissions and
1313
# limitations under the License.
14+
15+
from __future__ import annotations
16+
17+
from typing import (
18+
TYPE_CHECKING,
19+
Any,
20+
Callable,
21+
Optional,
22+
)
23+
24+
from opentelemetry._events import EventLogger
25+
from opentelemetry.instrumentation.genai_utils import (
26+
get_span_name, # type: ignore[reportUnknownVariableType]
27+
handle_span_exception, # type: ignore[reportUnknownVariableType]
28+
)
29+
from opentelemetry.instrumentation.vertexai.utils import (
30+
GenerateContentParams,
31+
get_genai_request_attributes,
32+
)
33+
from opentelemetry.trace import SpanKind, Tracer
34+
35+
if TYPE_CHECKING:
36+
from vertexai.generative_models import Tool, ToolConfig
37+
from vertexai.generative_models._generative_models import (
38+
ContentsType,
39+
GenerationConfigType,
40+
SafetySettingsType,
41+
_GenerativeModel,
42+
)
43+
44+
45+
def generate_content_create(
    tracer: Tracer, event_logger: EventLogger, capture_content: bool
):
    """Wrap the `generate_content` method of the `GenerativeModel` class to trace it.

    Args:
        tracer: used to open one CLIENT span per call.
        event_logger: prompt/response event emission (wired up in a later PR).
        capture_content: whether message content may be recorded (later PR).
    """

    def traced_method(
        wrapped: Callable[..., Any],
        instance: _GenerativeModel,
        args: Any,
        kwargs: Any,
    ):
        # Mirror generate_content's exact signature so positional and
        # keyword arguments are normalized the same way the real API does.
        def extract_params(
            contents: ContentsType,
            *,
            generation_config: Optional[GenerationConfigType] = None,
            safety_settings: Optional[SafetySettingsType] = None,
            tools: Optional[list[Tool]] = None,
            tool_config: Optional[ToolConfig] = None,
            labels: Optional[dict[str, str]] = None,
            stream: bool = False,
        ) -> GenerateContentParams:
            return GenerateContentParams(
                contents=contents,
                generation_config=generation_config,
                safety_settings=safety_settings,
                tools=tools,
                tool_config=tool_config,
                labels=labels,
                stream=stream,
            )

        params = extract_params(*args, **kwargs)
        attributes = get_genai_request_attributes(instance, params)

        with tracer.start_as_current_span(
            name=get_span_name(attributes),
            kind=SpanKind.CLIENT,
            attributes=attributes,
            # Ended manually so a future streaming wrapper can keep the span
            # open until the stream is fully consumed.
            end_on_exit=False,
        ) as span:
            # TODO(later PR): emit prompt message events, set response
            # attributes, and wrap streaming results before ending the span.
            try:
                result = wrapped(*args, **kwargs)
                span.end()
                return result
            except Exception as error:
                handle_span_exception(span, error)
                raise

    return traced_method
Lines changed: 128 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,128 @@
1+
# Copyright The OpenTelemetry Authors
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
14+
15+
from __future__ import annotations
16+
17+
from dataclasses import dataclass
18+
from typing import (
19+
TYPE_CHECKING,
20+
Dict,
21+
List,
22+
Optional,
23+
TypedDict,
24+
cast,
25+
)
26+
27+
if TYPE_CHECKING:
28+
from vertexai.generative_models import Tool, ToolConfig
29+
from vertexai.generative_models._generative_models import (
30+
ContentsType,
31+
GenerationConfigType,
32+
SafetySettingsType,
33+
_GenerativeModel,
34+
)
35+
from opentelemetry.semconv._incubating.attributes import (
36+
gen_ai_attributes as GenAIAttributes,
37+
)
38+
39+
40+
@dataclass(frozen=True)
class GenerateContentParams:
    """Normalized arguments of a `_GenerativeModel.generate_content` call.

    Defaults mirror the `generate_content` signature, so callers only need
    to supply the arguments that were actually passed; previously every
    field was required, forcing all seven to be spelled out.
    """

    contents: ContentsType
    generation_config: Optional[GenerationConfigType] = None
    safety_settings: Optional[SafetySettingsType] = None
    tools: Optional[List[Tool]] = None
    tool_config: Optional[ToolConfig] = None
    labels: Optional[Dict[str, str]] = None
    stream: bool = False
49+
50+
51+
class GenerationConfigDict(TypedDict, total=False):
    """Subset of `GenerationConfig.to_dict()` keys read for span attributes."""

    temperature: Optional[float]
    top_p: Optional[float]
    top_k: Optional[int]
    max_output_tokens: Optional[int]
    stop_sequences: Optional[List[str]]
    presence_penalty: Optional[float]
    frequency_penalty: Optional[float]
    seed: Optional[int]
    # GenerationConfig has more fields; they aren't needed yet.
61+
62+
63+
def get_genai_request_attributes(
    instance: _GenerativeModel,
    params: GenerateContentParams,
    operation_name: GenAIAttributes.GenAiOperationNameValues = GenAIAttributes.GenAiOperationNameValues.CHAT,
):
    """Return the gen_ai.* request attributes for one generate_content call.

    Only attributes whose value is not None are included in the result.
    """
    # TODO: per-call generation_config is coalesced with
    # instance._generation_config in _get_generation_config, but other
    # constructor-level options (e.g. tools, safety settings) are not covered;
    # consider wrapping the underlying PredictionClient instead of duplicating
    # the SDK's coalescing logic.
    config = _get_generation_config(instance, params)

    attributes = {
        GenAIAttributes.GEN_AI_OPERATION_NAME: operation_name.value,
        GenAIAttributes.GEN_AI_SYSTEM: GenAIAttributes.GenAiSystemValues.VERTEX_AI.value,
        GenAIAttributes.GEN_AI_REQUEST_MODEL: _get_model_name(instance),
        GenAIAttributes.GEN_AI_REQUEST_TEMPERATURE: config.get("temperature"),
        GenAIAttributes.GEN_AI_REQUEST_TOP_P: config.get("top_p"),
        GenAIAttributes.GEN_AI_REQUEST_MAX_TOKENS: config.get(
            "max_output_tokens"
        ),
        GenAIAttributes.GEN_AI_REQUEST_PRESENCE_PENALTY: config.get(
            "presence_penalty"
        ),
        GenAIAttributes.GEN_AI_REQUEST_FREQUENCY_PENALTY: config.get(
            "frequency_penalty"
        ),
        GenAIAttributes.GEN_AI_OPENAI_REQUEST_SEED: config.get("seed"),
        GenAIAttributes.GEN_AI_REQUEST_STOP_SEQUENCES: config.get(
            "stop_sequences"
        ),
    }

    # Drop attributes that were not set on the request.
    return {key: value for key, value in attributes.items() if value is not None}
102+
103+
104+
def _get_generation_config(
    instance: _GenerativeModel,
    params: GenerateContentParams,
) -> GenerationConfigDict:
    """Coalesce per-call and constructor generation config into a plain dict."""
    # The per-call config wins over the one the model was constructed with.
    config = params.generation_config or instance._generation_config
    if config is None:
        return {}
    # The SDK accepts either a plain dict or a GenerationConfig object here.
    if isinstance(config, dict):
        return cast(GenerationConfigDict, config)
    return cast(GenerationConfigDict, config.to_dict())
114+
115+
116+
_RESOURCE_PREFIX = "publishers/google/models/"
117+
118+
119+
def _get_model_name(instance: _GenerativeModel) -> str:
120+
try:
121+
model_name = instance._model_name
122+
except AttributeError:
123+
model_name = "unknown"
124+
125+
# Can use str.removeprefix() once 3.8 is dropped
126+
if model_name.startswith(_RESOURCE_PREFIX):
127+
model_name = model_name[len(_RESOURCE_PREFIX) :]
128+
return model_name

0 commit comments

Comments
 (0)