From 27432ae04da365750a2990497cc5b572414da076 Mon Sep 17 00:00:00 2001
From: Anuraag Agrawal
Date: Fri, 14 Mar 2025 16:27:27 +0900
Subject: [PATCH 1/5] openai: apply instrumentation to beta.chat.Completions.parse

---
 .../instrumentation/openai/__init__.py  |   14 +-
 .../tests/cassettes/test_chat_beta.yaml |  140 ++
 .../tests/test_beta_chat_completions.py | 1544 +++++++++++++++++
 3 files changed, 1697 insertions(+), 1 deletion(-)
 create mode 100644 instrumentation/elastic-opentelemetry-instrumentation-openai/tests/cassettes/test_chat_beta.yaml
 create mode 100644 instrumentation/elastic-opentelemetry-instrumentation-openai/tests/test_beta_chat_completions.py

diff --git a/instrumentation/elastic-opentelemetry-instrumentation-openai/src/opentelemetry/instrumentation/openai/__init__.py b/instrumentation/elastic-opentelemetry-instrumentation-openai/src/opentelemetry/instrumentation/openai/__init__.py
index d5c179b..0289823 100644
--- a/instrumentation/elastic-opentelemetry-instrumentation-openai/src/opentelemetry/instrumentation/openai/__init__.py
+++ b/instrumentation/elastic-opentelemetry-instrumentation-openai/src/opentelemetry/instrumentation/openai/__init__.py
@@ -105,11 +105,21 @@ def _patch(self, _module):
             "Completions.create",
             self._chat_completion_wrapper,
         )
+        wrap_function_wrapper(
+            "openai.resources.beta.chat.completions",
+            "Completions.parse",
+            self._chat_completion_wrapper,
+        )
         wrap_function_wrapper(
             "openai.resources.chat.completions",
             "AsyncCompletions.create",
             self._async_chat_completion_wrapper,
         )
+        wrap_function_wrapper(
+            "openai.resources.beta.chat.completions",
+            "AsyncCompletions.parse",
+            self._async_chat_completion_wrapper,
+        )
         wrap_function_wrapper(
             "openai.resources.embeddings",
             "Embeddings.create",
@@ -127,12 +137,14 @@ def _uninstrument(self, **kwargs):
         import openai
 
         unwrap(openai.resources.chat.completions.Completions, "create")
+        unwrap(openai.resources.beta.chat.completions.Completions, "parse")
         unwrap(openai.resources.chat.completions.AsyncCompletions, "create")
+        unwrap(openai.resources.beta.chat.completions.AsyncCompletions, "parse")
         unwrap(openai.resources.embeddings.Embeddings, "create")
         unwrap(openai.resources.embeddings.AsyncEmbeddings, "create")
 
     def _chat_completion_wrapper(self, wrapped, instance, args, kwargs):
-        logger.debug(f"openai.resources.chat.completions.Completions.create kwargs: {kwargs}")
+        logger.debug(f"{wrapped} kwargs: {kwargs}")
 
         span_attributes = _get_attributes_from_wrapper(instance, kwargs)
         event_attributes = _get_event_attributes()
diff --git a/instrumentation/elastic-opentelemetry-instrumentation-openai/tests/cassettes/test_chat_beta.yaml b/instrumentation/elastic-opentelemetry-instrumentation-openai/tests/cassettes/test_chat_beta.yaml
new file mode 100644
index 0000000..d359dbf
--- /dev/null
+++ b/instrumentation/elastic-opentelemetry-instrumentation-openai/tests/cassettes/test_chat_beta.yaml
@@ -0,0 +1,140 @@
+interactions:
+- request:
+    body: |-
+      {
+        "messages": [
+          {
+            "role": "user",
+            "content": "Answer in up to 3 words: Which ocean contains Bouvet Island?"
+          }
+        ],
+        "model": "gpt-4o-mini",
+        "stream": false
+      }
+    headers:
+      accept:
+      - application/json
+      accept-encoding:
+      - gzip, deflate
+      authorization:
+      - Bearer test_openai_api_key
+      connection:
+      - keep-alive
+      content-length:
+      - '140'
+      content-type:
+      - application/json
+      host:
+      - api.openai.com
+      user-agent:
+      - OpenAI/Python 1.66.3
+      x-stainless-arch:
+      - arm64
+      x-stainless-async:
+      - 'false'
+      x-stainless-helper-method:
+      - beta.chat.completions.parse
+      x-stainless-lang:
+      - python
+      x-stainless-os:
+      - MacOS
+      x-stainless-package-version:
+      - 1.66.3
+      x-stainless-read-timeout:
+      - '600'
+      x-stainless-retry-count:
+      - '0'
+      x-stainless-runtime:
+      - CPython
+      x-stainless-runtime-version:
+      - 3.13.2
+    method: POST
+    uri: https://api.openai.com/v1/chat/completions
+  response:
+    body:
+      string: |-
+        {
+          "id": "chatcmpl-BAtHlTExnZD4baw8rCAETtH5zmgD9",
+          "object": "chat.completion",
+          "created": 1741935497,
+          "model": "gpt-4o-mini-2024-07-18",
+          "choices": [
+            {
+              "index": 0,
+              "message": {
+                "role": "assistant",
+                "content": "Atlantic Ocean",
+                "refusal": null,
+                "annotations": []
+              },
+              "logprobs": null,
+              "finish_reason": "stop"
+            }
+          ],
+          "usage": {
+            "prompt_tokens": 22,
+            "completion_tokens": 3,
+            "total_tokens": 25,
+            "prompt_tokens_details": {
+              "cached_tokens": 0,
+              "audio_tokens": 0
+            },
+            "completion_tokens_details": {
+              "reasoning_tokens": 0,
+              "audio_tokens": 0,
+              "accepted_prediction_tokens": 0,
+              "rejected_prediction_tokens": 0
+            }
+          },
+          "service_tier": "default",
+          "system_fingerprint": "fp_06737a9306"
+        }
+    headers:
+      CF-RAY:
+      - 9201e1b838715eb9-NRT
+      Connection:
+      - keep-alive
+      Content-Type:
+      - application/json
+      Date:
+      - Fri, 14 Mar 2025 06:58:17 GMT
+      Server:
+      - cloudflare
+      Set-Cookie: test_set_cookie
+      Transfer-Encoding:
+      - chunked
+      X-Content-Type-Options:
+      - nosniff
+      access-control-expose-headers:
+      - X-Request-ID
+      alt-svc:
+      - h3=":443"; ma=86400
+      cf-cache-status:
+      - DYNAMIC
+      content-length:
+      - '820'
+      openai-organization: test_openai_org_id
+      openai-processing-ms:
+      - '253'
+      openai-version:
+      - '2020-10-01'
+      strict-transport-security:
+      - max-age=31536000; includeSubDomains; preload
+      x-ratelimit-limit-requests:
+      - '10000'
+      x-ratelimit-limit-tokens:
+      - '200000'
+      x-ratelimit-remaining-requests:
+      - '9999'
+      x-ratelimit-remaining-tokens:
+      - '199968'
+      x-ratelimit-reset-requests:
+      - 8.64s
+      x-ratelimit-reset-tokens:
+      - 9ms
+      x-request-id:
+      - req_381ebd7d156c172900193e7a98982e79
+    status:
+      code: 200
+      message: OK
+version: 1
diff --git a/instrumentation/elastic-opentelemetry-instrumentation-openai/tests/test_beta_chat_completions.py b/instrumentation/elastic-opentelemetry-instrumentation-openai/tests/test_beta_chat_completions.py
new file mode 100644
index 0000000..76cabe0
--- /dev/null
+++ b/instrumentation/elastic-opentelemetry-instrumentation-openai/tests/test_beta_chat_completions.py
@@ -0,0 +1,1544 @@
+# Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+# or more contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright
+# ownership. Elasticsearch B.V. licenses this file to you under
+# the Apache License, Version 2.0 (the "License"); you may
+# not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import json
+import os
+import re
+from copy import deepcopy
+from dataclasses import dataclass
+from typing import List, Optional
+from unittest import mock
+
+import openai
+import pytest
+from opentelemetry._events import Event
+from opentelemetry._logs import LogRecord
+from opentelemetry.instrumentation.openai import OpenAIInstrumentor
+from opentelemetry.semconv._incubating.attributes.gen_ai_attributes import (
+    GEN_AI_OPENAI_REQUEST_RESPONSE_FORMAT,
+    GEN_AI_OPENAI_REQUEST_SEED,
+    GEN_AI_OPENAI_REQUEST_SERVICE_TIER,
+    GEN_AI_OPENAI_RESPONSE_SERVICE_TIER,
+    GEN_AI_OPERATION_NAME,
+    GEN_AI_REQUEST_FREQUENCY_PENALTY,
+    GEN_AI_REQUEST_MAX_TOKENS,
+    GEN_AI_REQUEST_MODEL,
+    GEN_AI_REQUEST_PRESENCE_PENALTY,
+    GEN_AI_REQUEST_STOP_SEQUENCES,
+    GEN_AI_REQUEST_TEMPERATURE,
+    GEN_AI_REQUEST_TOP_P,
+    GEN_AI_RESPONSE_FINISH_REASONS,
+    GEN_AI_RESPONSE_ID,
+    GEN_AI_RESPONSE_MODEL,
+    GEN_AI_SYSTEM,
+    GEN_AI_USAGE_INPUT_TOKENS,
+    GEN_AI_USAGE_OUTPUT_TOKENS,
+)
+from opentelemetry.semconv.attributes.error_attributes import ERROR_TYPE
+from opentelemetry.semconv.attributes.server_attributes import SERVER_ADDRESS, SERVER_PORT
+from opentelemetry.trace import SpanKind, StatusCode
+
+from .conftest import (
+    address_and_port,
+    assert_error_operation_duration_metric,
+    assert_operation_duration_metric,
+    assert_token_usage_metric,
+    get_integration_async_client,
+    get_integration_client,
+)
+from .utils import MOCK_POSITIVE_FLOAT, get_sorted_metrics, logrecords_from_logs
+
+OPENAI_VERSION = tuple([int(x) for x in openai.version.VERSION.split(".")])
+TEST_CHAT_MODEL = "gpt-4o-mini"
+TEST_CHAT_RESPONSE_MODEL = "gpt-4o-mini-2024-07-18"
+TEST_CHAT_INPUT = "Answer in up to 3 words: Which ocean contains Bouvet Island?"
+
+
+@pytest.mark.vcr()
+def test_chat(default_openai_env, trace_exporter, metrics_reader, logs_exporter):
+    client = openai.OpenAI()
+
+    messages = [
+        {
+            "role": "user",
+            "content": TEST_CHAT_INPUT,
+        }
+    ]
+
+    chat_completion = client.beta.chat.completions.parse(model=TEST_CHAT_MODEL, messages=messages)
+
+    assert chat_completion.choices[0].message.content == "Atlantic Ocean."
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 1
+
+    span = spans[0]
+    assert span.name == f"chat {TEST_CHAT_MODEL}"
+    assert span.kind == SpanKind.CLIENT
+    assert span.status.status_code == StatusCode.UNSET
+
+    address, port = address_and_port(client)
+    assert dict(span.attributes) == {
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_SYSTEM: "openai",
+        GEN_AI_RESPONSE_ID: "chatcmpl-AfhuGVpfQzbsboUTm9uUCSEUWwEbU",
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+        GEN_AI_RESPONSE_FINISH_REASONS: ("stop",),
+        GEN_AI_USAGE_INPUT_TOKENS: 22,
+        GEN_AI_USAGE_OUTPUT_TOKENS: 3,
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+
+    logs = logs_exporter.get_finished_logs()
+    assert len(logs) == 2
+    log_records = logrecords_from_logs(logs)
+    user_message, choice = log_records
+    assert dict(user_message.attributes) == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert dict(user_message.body) == {}
+
+    assert_stop_log_record(choice)
+
+    operation_duration_metric, token_usage_metric = get_sorted_metrics(metrics_reader)
+    attributes = {
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_RESPONSE_MODEL: "gpt-4o-mini-2024-07-18",
+    }
+    assert_operation_duration_metric(
+        client, "chat", operation_duration_metric, attributes=attributes, min_data_point=0.006761051714420319
+    )
+    assert_token_usage_metric(
+        client,
+        "chat",
+        token_usage_metric,
+        attributes=attributes,
+        input_data_point=span.attributes[GEN_AI_USAGE_INPUT_TOKENS],
+        output_data_point=span.attributes[GEN_AI_USAGE_OUTPUT_TOKENS],
+    )
+
+
+@pytest.mark.vcr()
+def test_chat_with_developer_role_message(default_openai_env, trace_exporter, metrics_reader, logs_exporter):
+    client = openai.OpenAI()
+
+    messages = [
+        {
+            "role": "developer",
+            "content": "You are a friendly assistant",
+        },
+        {
+            "role": "user",
+            "content": TEST_CHAT_INPUT,
+        },
+    ]
+
+    chat_completion = client.beta.chat.completions.parse(model=TEST_CHAT_MODEL, messages=messages)
+
+    assert chat_completion.choices[0].message.content == "Atlantic Ocean."
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 1
+
+    span = spans[0]
+    assert span.name == f"chat {TEST_CHAT_MODEL}"
+    assert span.kind == SpanKind.CLIENT
+    assert span.status.status_code == StatusCode.UNSET
+
+    address, port = address_and_port(client)
+    assert dict(span.attributes) == {
+        GEN_AI_OPENAI_RESPONSE_SERVICE_TIER: "default",
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_SYSTEM: "openai",
+        GEN_AI_RESPONSE_ID: "chatcmpl-B6vdHtqgT6rj4cj7itn9bNlaUlqHg",
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+        GEN_AI_RESPONSE_FINISH_REASONS: ("stop",),
+        GEN_AI_USAGE_INPUT_TOKENS: 31,
+        GEN_AI_USAGE_OUTPUT_TOKENS: 4,
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+
+    logs = logs_exporter.get_finished_logs()
+    assert len(logs) == 3
+    log_records = logrecords_from_logs(logs)
+    system_message, user_message, choice = log_records
+    assert dict(system_message.attributes) == {"gen_ai.system": "openai", "event.name": "gen_ai.system.message"}
+    assert dict(system_message.body) == {"role": "developer"}
+
+    assert dict(user_message.attributes) == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert dict(user_message.body) == {}
+
+    assert_stop_log_record(choice)
+
+    operation_duration_metric, token_usage_metric = get_sorted_metrics(metrics_reader)
+    attributes = {
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_RESPONSE_MODEL: "gpt-4o-mini-2024-07-18",
+    }
+    assert_operation_duration_metric(
+        client, "chat", operation_duration_metric, attributes=attributes, min_data_point=0.006761051714420319
+    )
+    assert_token_usage_metric(
+        client,
+        "chat",
+        token_usage_metric,
+        attributes=attributes,
+        input_data_point=span.attributes[GEN_AI_USAGE_INPUT_TOKENS],
+        output_data_point=span.attributes[GEN_AI_USAGE_OUTPUT_TOKENS],
+    )
+
+
+@pytest.mark.skipif(OPENAI_VERSION < (1, 35, 0), reason="service tier added in 1.35.0")
+@pytest.mark.vcr()
+def test_chat_all_the_client_options(default_openai_env, trace_exporter, metrics_reader, logs_exporter):
+    client = openai.OpenAI()
+
+    messages = [
+        {
+            "role": "user",
+            "content": TEST_CHAT_INPUT,
+        }
+    ]
+
+    params = {
+        "model": TEST_CHAT_MODEL,
+        "messages": messages,
+        "frequency_penalty": 0,
+        "max_completion_tokens": 100,
+        "presence_penalty": 0,
+        "temperature": 1,
+        "top_p": 1,
+        "stop": "foo",
+        "seed": 100,
+        "service_tier": "default",
+        "response_format": {"type": "text"},
+    }
+    chat_completion = client.beta.chat.completions.parse(**params)
+
+    assert chat_completion.choices[0].message.content == "Southern Ocean."
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 1
+
+    span = spans[0]
+    assert span.name == f"chat {TEST_CHAT_MODEL}"
+    assert span.kind == SpanKind.CLIENT
+    assert span.status.status_code == StatusCode.UNSET
+
+    address, port = address_and_port(client)
+    expected_attrs = {
+        GEN_AI_OPENAI_REQUEST_SEED: 100,
+        GEN_AI_OPENAI_REQUEST_SERVICE_TIER: "default",
+        GEN_AI_OPENAI_REQUEST_RESPONSE_FORMAT: "text",
+        GEN_AI_OPENAI_RESPONSE_SERVICE_TIER: "default",
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_FREQUENCY_PENALTY: 0,
+        GEN_AI_REQUEST_MAX_TOKENS: 100,
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_REQUEST_PRESENCE_PENALTY: 0,
+        GEN_AI_REQUEST_STOP_SEQUENCES: ("foo",),
+        GEN_AI_REQUEST_TEMPERATURE: 1,
+        GEN_AI_REQUEST_TOP_P: 1,
+        GEN_AI_SYSTEM: "openai",
+        GEN_AI_RESPONSE_ID: "chatcmpl-AfhvFSrCe0B1E6Prdwn9U7V2Lq8XH",
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+        GEN_AI_RESPONSE_FINISH_REASONS: ("stop",),
+        GEN_AI_USAGE_INPUT_TOKENS: 22,
+        GEN_AI_USAGE_OUTPUT_TOKENS: 3,
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+    assert dict(span.attributes) == expected_attrs
+
+    logs = logs_exporter.get_finished_logs()
+    assert len(logs) == 2
+    log_records = logrecords_from_logs(logs)
+    user_message, choice = log_records
+    assert dict(user_message.attributes) == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert dict(user_message.body) == {}
+
+    assert_stop_log_record(choice)
+
+    operation_duration_metric, token_usage_metric = get_sorted_metrics(metrics_reader)
+    attributes = {
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+    }
+    assert_operation_duration_metric(
+        client, "chat", operation_duration_metric, attributes=attributes, min_data_point=0.006761051714420319
+    )
+    assert_token_usage_metric(
+        client,
+        "chat",
+        token_usage_metric,
+        attributes=attributes,
+        input_data_point=span.attributes[GEN_AI_USAGE_INPUT_TOKENS],
+        output_data_point=span.attributes[GEN_AI_USAGE_OUTPUT_TOKENS],
+    )
+
+
+@pytest.mark.vcr()
+def test_chat_multiple_choices_with_capture_message_content(
+    default_openai_env, trace_exporter, metrics_reader, logs_exporter
+):
+    # Redo the instrumentation dance to be affected by the environment variable
+    OpenAIInstrumentor().uninstrument()
+    with mock.patch.dict("os.environ", {"OTEL_INSTRUMENTATION_GENAI_CAPTURE_MESSAGE_CONTENT": "true"}):
+        OpenAIInstrumentor().instrument()
+
+    client = openai.OpenAI()
+
+    messages = [
+        {
+            "role": "user",
+            "content": TEST_CHAT_INPUT,
+        }
+    ]
+
+    chat_completion = client.beta.chat.completions.parse(model=TEST_CHAT_MODEL, messages=messages, n=2)
+
+    content = "Atlantic Ocean."
+    assert chat_completion.choices[0].message.content == content
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 1
+
+    span = spans[0]
+    assert span.name == f"chat {TEST_CHAT_MODEL}"
+    assert span.kind == SpanKind.CLIENT
+    assert span.status.status_code == StatusCode.UNSET
+
+    address, port = address_and_port(client)
+    assert dict(span.attributes) == {
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_SYSTEM: "openai",
+        GEN_AI_RESPONSE_ID: "chatcmpl-AfhuHpVEbcYGlsFuHOP60MtU4tIq9",
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+        GEN_AI_RESPONSE_FINISH_REASONS: ("stop", "stop"),
+        GEN_AI_USAGE_INPUT_TOKENS: 22,
+        GEN_AI_USAGE_OUTPUT_TOKENS: 6,
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+
+    logs = logs_exporter.get_finished_logs()
+    assert len(logs) == 3
+    log_records = logrecords_from_logs(logs)
+    user_message, choice, second_choice = log_records
+    assert user_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert user_message.body == {"content": TEST_CHAT_INPUT}
+
+    assert_stop_log_record(choice, content)
+    assert_stop_log_record(second_choice, "Southern Ocean.", 1)
+
+    operation_duration_metric, token_usage_metric = get_sorted_metrics(metrics_reader)
+    attributes = {
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+    }
+    assert_operation_duration_metric(
+        client, "chat", operation_duration_metric, attributes=attributes, min_data_point=0.006761051714420319
+    )
+    assert_token_usage_metric(
+        client,
+        "chat",
+        token_usage_metric,
+        attributes=attributes,
+        input_data_point=span.attributes[GEN_AI_USAGE_INPUT_TOKENS],
+        output_data_point=span.attributes[GEN_AI_USAGE_OUTPUT_TOKENS],
+    )
+
+
+@pytest.mark.vcr()
+def test_chat_function_calling_with_tools(default_openai_env, trace_exporter, metrics_reader, logs_exporter):
+    client = openai.OpenAI()
+
+    tools = [
+        {
+            "type": "function",
+            "function": {
+                "name": "get_delivery_date",
+                "strict": True,
+                "description": "Get the delivery date for a customer's order. Call this whenever you need to know the delivery date, for example when a customer asks 'Where is my package'",
+                "parameters": {
+                    "type": "object",
+                    "properties": {
+                        "order_id": {
+                            "type": "string",
+                            "description": "The customer's order ID.",
+                        },
+                    },
+                    "required": ["order_id"],
+                    "additionalProperties": False,
+                },
+            },
+        }
+    ]
+
+    messages = [
+        {
+            "role": "system",
+            "content": "You are a helpful customer support assistant. Use the supplied tools to assist the user.",
+        },
+        {"role": "user", "content": "Hi, can you tell me the delivery date for my order?"},
+        {
+            "role": "assistant",
+            "content": "Hi there! I can help with that. Can you please provide your order ID?",
+        },
+        {"role": "user", "content": "i think it is order_12345"},
+    ]
+
+    response = client.beta.chat.completions.parse(model=TEST_CHAT_MODEL, messages=messages, tools=tools)
+    tool_call = response.choices[0].message.tool_calls[0]
+    assert tool_call.function.name == "get_delivery_date"
+    # FIXME: add to test data
+    assert json.loads(tool_call.function.arguments) == {"order_id": "order_12345"}
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 1
+
+    span = spans[0]
+    assert span.name == f"chat {TEST_CHAT_MODEL}"
+    assert span.kind == SpanKind.CLIENT
+    assert span.status.status_code == StatusCode.UNSET
+
+    address, port = address_and_port(client)
+    assert dict(span.attributes) == {
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_SYSTEM: "openai",
+        GEN_AI_RESPONSE_ID: "chatcmpl-AfhuIeTQU1AlqGqx3cfvtbNyJ2Q8p",
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+        GEN_AI_RESPONSE_FINISH_REASONS: ("tool_calls",),
+        GEN_AI_USAGE_INPUT_TOKENS: 140,
+        GEN_AI_USAGE_OUTPUT_TOKENS: 19,
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+
+    logs = logs_exporter.get_finished_logs()
+    assert len(logs) == 5
+    log_records = logrecords_from_logs(logs)
+    system_message, user_message, assistant_message, second_user_message, choice = log_records
+    assert system_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.system.message"}
+    assert system_message.body == {}
+    assert user_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert user_message.body == {}
+    assert assistant_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.assistant.message"}
+    assert assistant_message.body == {}
+    assert second_user_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert second_user_message.body == {}
+
+    assert_tool_call_log_record(
+        choice, [ToolCall("call_BAohHzhtwXBSM13jKADbwgQH", "get_delivery_date", '{"order_id": "order_12345"}')]
+    )
+
+    operation_duration_metric, token_usage_metric = get_sorted_metrics(metrics_reader)
+    attributes = {
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+    }
+    assert_operation_duration_metric(
+        client, "chat", operation_duration_metric, attributes=attributes, min_data_point=0.006761051714420319
+    )
+    assert_token_usage_metric(
+        client,
+        "chat",
+        token_usage_metric,
+        attributes=attributes,
+        input_data_point=span.attributes[GEN_AI_USAGE_INPUT_TOKENS],
+        output_data_point=span.attributes[GEN_AI_USAGE_OUTPUT_TOKENS],
+    )
+
+
+@pytest.mark.vcr()
+def test_chat_tools_with_capture_message_content(default_openai_env, trace_exporter, logs_exporter, metrics_reader):
+    # Redo the instrumentation dance to be affected by the environment variable
+    OpenAIInstrumentor().uninstrument()
+    with mock.patch.dict("os.environ", {"OTEL_INSTRUMENTATION_GENAI_CAPTURE_MESSAGE_CONTENT": "true"}):
+        OpenAIInstrumentor().instrument()
+
+    client = openai.OpenAI()
+
+    tools = [
+        {
+            "type": "function",
+            "function": {
+                "name": "get_delivery_date",
+                "strict": True,
+                "description": "Get the delivery date for a customer's order. Call this whenever you need to know the delivery date, for example when a customer asks 'Where is my package'",
+                "parameters": {
+                    "type": "object",
+                    "properties": {
+                        "order_id": {
+                            "type": "string",
+                            "description": "The customer's order ID.",
+                        },
+                    },
+                    "required": ["order_id"],
+                    "additionalProperties": False,
+                },
+            },
+        }
+    ]
+
+    messages = [
+        {
+            "role": "system",
+            "content": "You are a helpful customer support assistant. Use the supplied tools to assist the user.",
+        },
+        {"role": "user", "content": "Hi, can you tell me the delivery date for my order?"},
+        {
+            "role": "assistant",
+            "content": "Hi there! I can help with that. Can you please provide your order ID?",
+        },
+        {"role": "user", "content": "i think it is order_12345"},
+    ]
+
+    response = client.beta.chat.completions.parse(model=TEST_CHAT_MODEL, messages=messages, tools=tools)
+    tool_call = response.choices[0].message.tool_calls[0]
+    assert tool_call.function.name == "get_delivery_date"
+    assert json.loads(tool_call.function.arguments) == {"order_id": "order_12345"}
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 1
+
+    span = spans[0]
+    assert span.name == f"chat {TEST_CHAT_MODEL}"
+    assert span.kind == SpanKind.CLIENT
+    assert span.status.status_code == StatusCode.UNSET
+
+    address, port = address_and_port(client)
+    assert dict(span.attributes) == {
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_SYSTEM: "openai",
+        GEN_AI_RESPONSE_ID: "chatcmpl-AfhuJxYuidCW2KvkwBy6VMnWtdiwb",
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+        GEN_AI_RESPONSE_FINISH_REASONS: ("tool_calls",),
+        GEN_AI_USAGE_INPUT_TOKENS: 140,
+        GEN_AI_USAGE_OUTPUT_TOKENS: 19,
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+
+    logs = logs_exporter.get_finished_logs()
+    assert len(logs) == 5
+    log_records = logrecords_from_logs(logs)
+    system_message, user_message, assistant_message, second_user_message, choice = log_records
+    assert system_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.system.message"}
+    assert system_message.body == {
+        "content": "You are a helpful customer support assistant. Use the supplied tools to assist the user."
+    }
+    assert user_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert user_message.body == {"content": "Hi, can you tell me the delivery date for my order?"}
+    assert assistant_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.assistant.message"}
+    assert assistant_message.body == {
+        "content": "Hi there! I can help with that. Can you please provide your order ID?"
+    }
+    assert second_user_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert second_user_message.body == {"content": "i think it is order_12345"}
+
+    assert_tool_call_log_record(
+        choice, [ToolCall("call_TD1k1LOj7QC0uQPRihIY9Bml", "get_delivery_date", '{"order_id": "order_12345"}')]
+    )
+
+    operation_duration_metric, token_usage_metric = get_sorted_metrics(metrics_reader)
+    attributes = {
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+    }
+    assert_operation_duration_metric(
+        client, "chat", operation_duration_metric, attributes=attributes, min_data_point=0.006761051714420319
+    )
+    assert_token_usage_metric(
+        client,
+        "chat",
+        token_usage_metric,
+        attributes=attributes,
+        input_data_point=span.attributes[GEN_AI_USAGE_INPUT_TOKENS],
+        output_data_point=span.attributes[GEN_AI_USAGE_OUTPUT_TOKENS],
+    )
+
+
+@pytest.mark.integration
+def test_chat_tools_with_capture_message_content_integration(trace_exporter, logs_exporter, metrics_reader):
+    client = get_integration_client()
+    model = os.getenv("TEST_CHAT_MODEL", TEST_CHAT_MODEL)
+
+    # Redo the instrumentation dance to be affected by the environment variable
+    OpenAIInstrumentor().uninstrument()
+    with mock.patch.dict("os.environ", {"OTEL_INSTRUMENTATION_GENAI_CAPTURE_MESSAGE_CONTENT": "true"}):
+        OpenAIInstrumentor().instrument()
+
+    tools = [
+        {
+            "type": "function",
+            "function": {
+                "name": "get_delivery_date",
+                "strict": True,
+                "description": "Get the delivery date for a customer's order. Call this whenever you need to know the delivery date, for example when a customer asks 'Where is my package'",
+                "parameters": {
+                    "type": "object",
+                    "properties": {
+                        "order_id": {
+                            "type": "string",
+                            "description": "The customer's order ID.",
+                        },
+                    },
+                    "required": ["order_id"],
+                    "additionalProperties": False,
+                },
+            },
+        }
+    ]
+
+    messages = [
+        {
+            "role": "system",
+            "content": "You are a helpful customer support assistant. Use the supplied tools to assist the user.",
+        },
+        {"role": "user", "content": "Hi, can you tell me the delivery date for my order?"},
+        {
+            "role": "assistant",
+            "content": "Hi there! I can help with that. Can you please provide your order ID?",
+        },
+        {"role": "user", "content": "i think it is order_12345"},
+    ]
+
+    response = client.beta.chat.completions.parse(model=model, messages=messages, tools=tools)
+    tool_call = response.choices[0].message.tool_calls[0]
+    assert tool_call.function.name == "get_delivery_date"
+    assert json.loads(tool_call.function.arguments) == {"order_id": "order_12345"}
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 1
+
+    span = spans[0]
+    assert span.name == f"chat {model}"
+    assert span.kind == SpanKind.CLIENT
+    assert span.status.status_code == StatusCode.UNSET
+
+    address, port = address_and_port(client)
+    assert dict(span.attributes) == {
+        GEN_AI_OPENAI_RESPONSE_SERVICE_TIER: "default",
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_MODEL: model,
+        GEN_AI_SYSTEM: "openai",
+        GEN_AI_RESPONSE_ID: response.id,
+        GEN_AI_RESPONSE_MODEL: response.model,
+        GEN_AI_RESPONSE_FINISH_REASONS: ("tool_calls",),
+        GEN_AI_USAGE_INPUT_TOKENS: response.usage.prompt_tokens,
+        GEN_AI_USAGE_OUTPUT_TOKENS: response.usage.completion_tokens,
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+
+    logs = logs_exporter.get_finished_logs()
+    assert len(logs) == 5
+    log_records = logrecords_from_logs(logs)
+    system_message, user_message, assistant_message, second_user_message, choice = log_records
+    assert system_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.system.message"}
+    assert system_message.body == {
+        "content": "You are a helpful customer support assistant. Use the supplied tools to assist the user."
+    }
+    assert user_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert user_message.body == {"content": "Hi, can you tell me the delivery date for my order?"}
+    assert assistant_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.assistant.message"}
+    assert assistant_message.body == {
+        "content": "Hi there! I can help with that. Can you please provide your order ID?"
+    }
+    assert second_user_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert second_user_message.body == {"content": "i think it is order_12345"}
+
+    assert_tool_call_log_record(choice, [ToolCall(tool_call.id, "get_delivery_date", '{"order_id": "order_12345"}')])
+
+    operation_duration_metric, token_usage_metric = get_sorted_metrics(metrics_reader)
+    attributes = {
+        GEN_AI_REQUEST_MODEL: model,
+        GEN_AI_RESPONSE_MODEL: response.model,
+    }
+    assert_operation_duration_metric(
+        client, "chat", operation_duration_metric, attributes=attributes, min_data_point=MOCK_POSITIVE_FLOAT
+    )
+    assert_token_usage_metric(
+        client,
+        "chat",
+        token_usage_metric,
+        attributes=attributes,
+        input_data_point=span.attributes[GEN_AI_USAGE_INPUT_TOKENS],
+        output_data_point=span.attributes[GEN_AI_USAGE_OUTPUT_TOKENS],
+    )
+
+
+def test_chat_connection_error(default_openai_env, trace_exporter, metrics_reader, logs_exporter):
+    client = openai.Client(base_url="http://localhost:9999/v5", api_key="not-read", max_retries=1)
+    messages = [
+        {
+            "role": "user",
+            "content": TEST_CHAT_INPUT,
+        }
+    ]
+
+    with pytest.raises(Exception):
+        client.beta.chat.completions.parse(model=TEST_CHAT_MODEL, messages=messages)
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 1
+
+    span = spans[0]
+    assert span.name == f"chat {TEST_CHAT_MODEL}"
+    assert span.kind == SpanKind.CLIENT
+    assert span.status.status_code == StatusCode.ERROR
+
+    assert dict(span.attributes) == {
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_SYSTEM: "openai",
+        ERROR_TYPE: "APIConnectionError",
+        SERVER_ADDRESS: "localhost",
+        SERVER_PORT: 9999,
+    }
+
+    logs = logs_exporter.get_finished_logs()
+    assert len(logs) == 1
+    log_records = logrecords_from_logs(logs)
+    (user_message,) = log_records
+    assert dict(user_message.attributes) == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert dict(user_message.body) == {}
+
+    (operation_duration_metric,) = get_sorted_metrics(metrics_reader)
+    attributes = {
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        ERROR_TYPE: "APIConnectionError",
+    }
+    assert_error_operation_duration_metric(
+        "chat",
+        operation_duration_metric,
+        attributes=attributes,
+        data_point=1.026234219999992,
+        value_delta=1.0,
+    )
+
+
+@pytest.mark.integration
+def test_chat_with_capture_message_content_integration(trace_exporter, logs_exporter, metrics_reader):
+    model = os.getenv("TEST_CHAT_MODEL", TEST_CHAT_MODEL)
+
+    # Redo the instrumentation dance to be affected by the environment variable
+    OpenAIInstrumentor().uninstrument()
+    with mock.patch.dict(
+        "os.environ",
+        {"OTEL_INSTRUMENTATION_GENAI_CAPTURE_MESSAGE_CONTENT": "true"},
+    ):
+        OpenAIInstrumentor().instrument()
+
+    client = get_integration_client()
+
+    messages = [
+        {
+            "role": "user",
+            "content": TEST_CHAT_INPUT,
+        }
+    ]
+
+    response = client.beta.chat.completions.parse(model=model, messages=messages)
+    content = response.choices[0].message.content
+    assert content
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 1
+
+    span = spans[0]
+    assert span.name == f"chat {model}"
+    assert span.kind == SpanKind.CLIENT
+    assert span.status.status_code == StatusCode.UNSET
+
+    address, port = address_and_port(client)
+    assert dict(span.attributes) == {
+        GEN_AI_OPENAI_RESPONSE_SERVICE_TIER: "default",
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_MODEL: model,
+        GEN_AI_SYSTEM: "openai",
+        GEN_AI_RESPONSE_ID: response.id,
+        GEN_AI_RESPONSE_MODEL: response.model,
+        GEN_AI_RESPONSE_FINISH_REASONS: ("stop",),
+        GEN_AI_USAGE_INPUT_TOKENS: response.usage.prompt_tokens,
+        GEN_AI_USAGE_OUTPUT_TOKENS: response.usage.completion_tokens,
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+
+    logs = logs_exporter.get_finished_logs()
+    assert len(logs) == 2
+    log_records = logrecords_from_logs(logs)
+    user_message, choice = log_records
+    assert dict(user_message.attributes) == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert dict(user_message.body) == {"content": TEST_CHAT_INPUT}
+
+    assert_stop_log_record(choice, content)
+
+    operation_duration_metric, token_usage_metric = get_sorted_metrics(metrics_reader)
+    attributes = {
+        GEN_AI_REQUEST_MODEL: model,
+        GEN_AI_RESPONSE_MODEL: response.model,
+    }
+    assert_operation_duration_metric(
+        client, "chat", operation_duration_metric, attributes=attributes, min_data_point=MOCK_POSITIVE_FLOAT
+    )
+    assert_token_usage_metric(
+        client,
+        "chat",
+        token_usage_metric,
+        attributes=attributes,
+        input_data_point=span.attributes[GEN_AI_USAGE_INPUT_TOKENS],
+        output_data_point=span.attributes[GEN_AI_USAGE_OUTPUT_TOKENS],
+    )
+
+
+@pytest.mark.vcr()
+def test_chat_with_capture_message_content(default_openai_env, trace_exporter, logs_exporter, metrics_reader):
+    client = openai.OpenAI()
+
+    # Redo the instrumentation dance to be affected by the environment variable
+    OpenAIInstrumentor().uninstrument()
+    with mock.patch.dict("os.environ", {"OTEL_INSTRUMENTATION_GENAI_CAPTURE_MESSAGE_CONTENT": "true"}):
+        OpenAIInstrumentor().instrument()
+
+    messages = [
+        {
+            "role": "user",
+            "content": TEST_CHAT_INPUT,
+        }
+    ]
+
+    chat_completion = client.beta.chat.completions.parse(model=TEST_CHAT_MODEL, messages=messages)
+
+    content = "South Atlantic Ocean."
+    assert chat_completion.choices[0].message.content == content
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 1
+
+    span = spans[0]
+    assert span.name == f"chat {TEST_CHAT_MODEL}"
+    assert span.kind == SpanKind.CLIENT
+    assert span.status.status_code == StatusCode.UNSET
+
+    address, port = address_and_port(client)
+    assert dict(span.attributes) == {
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_SYSTEM: "openai",
+        GEN_AI_RESPONSE_ID: "chatcmpl-AfhuKQOLh8rjzshDoq35O7wceMSEK",
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+        GEN_AI_RESPONSE_FINISH_REASONS: ("stop",),
+        GEN_AI_USAGE_INPUT_TOKENS: 22,
+        GEN_AI_USAGE_OUTPUT_TOKENS: 4,
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+
+    logs = logs_exporter.get_finished_logs()
+    assert len(logs) == 2
+    log_records = logrecords_from_logs(logs)
+    user_message, choice = log_records
+    assert dict(user_message.attributes) == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert dict(user_message.body) == {"content": TEST_CHAT_INPUT}
+
+    assert_stop_log_record(choice, content)
+
+    operation_duration_metric, token_usage_metric = get_sorted_metrics(metrics_reader)
+    attributes = {
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+    }
+    assert_operation_duration_metric(
+        client, "chat", operation_duration_metric, attributes=attributes, min_data_point=0.006761051714420319
+    )
+    assert_token_usage_metric(
+        client,
+        "chat",
+        token_usage_metric,
+        attributes=attributes,
+        input_data_point=span.attributes[GEN_AI_USAGE_INPUT_TOKENS],
+        output_data_point=span.attributes[GEN_AI_USAGE_OUTPUT_TOKENS],
+    )
+
+
+@pytest.mark.vcr()
+def test_chat_tools_with_followup_and_capture_message_content(
+    default_openai_env, trace_exporter, metrics_reader, logs_exporter
+):
+    # Redo the instrumentation dance to be affected by the environment variable
+    OpenAIInstrumentor().uninstrument()
+    with mock.patch.dict("os.environ", {"OTEL_INSTRUMENTATION_GENAI_CAPTURE_MESSAGE_CONTENT": "true"}):
+        OpenAIInstrumentor().instrument()
+
+    client = openai.OpenAI()
+
+    tools = [
+        {
+            "type": "function",
+            "function": {
+                "name": "get_weather",
+                "strict": True,
+                "parameters": {
+                    "type": "object",
+                    "properties": {
+                        "location": {"type": "string"},
+                    },
+                    "required": ["location"],
+                    "additionalProperties": False,
+                },
+            },
+        }
+    ]
+
+    messages = [
+        {
+            "role": "system",
+            "content": "You are a helpful assistant providing weather updates.",
+        },
+        {"role": "user", "content": "What is the weather in New York City and London?"},
+    ]
+
+    first_response = client.beta.chat.completions.parse(model=TEST_CHAT_MODEL, messages=messages, tools=tools)
+
+    assert first_response.choices[0].message.content is None
+
+    first_response_message = first_response.choices[0].message
+    if hasattr(first_response_message, "to_dict"):
+        previous_message = first_response.choices[0].message.to_dict()
+    else:
+        # old pydantic from old openai client
+        previous_message = first_response.choices[0].message.model_dump()
+    followup_messages = [
+        {
+            "role": "assistant",
+            "tool_calls": previous_message["tool_calls"],
+        },
+        {
+            "role": "tool",
+            "content": "25 degrees and sunny",
+            "tool_call_id": previous_message["tool_calls"][0]["id"],
+        },
+        {
+            "role": "tool",
+            "content": "15 degrees and raining",
+            "tool_call_id": previous_message["tool_calls"][1]["id"],
+        },
+    ]
+
+    second_response = client.beta.chat.completions.parse(model=TEST_CHAT_MODEL, messages=messages + followup_messages)
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 2
+
+    first_span, second_span = spans
+    assert first_span.name == f"chat {TEST_CHAT_MODEL}"
+    assert first_span.kind == SpanKind.CLIENT
+    assert first_span.status.status_code == StatusCode.UNSET
+
+    address, port = address_and_port(client)
+    assert dict(first_span.attributes) == {
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_SYSTEM: "openai",
+        GEN_AI_RESPONSE_ID: first_response.id,
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+        GEN_AI_RESPONSE_FINISH_REASONS: ("tool_calls",),
+        GEN_AI_USAGE_INPUT_TOKENS: first_response.usage.prompt_tokens,
+        GEN_AI_USAGE_OUTPUT_TOKENS: first_response.usage.completion_tokens,
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+
+    assert second_span.name == f"chat {TEST_CHAT_MODEL}"
+    assert second_span.kind == SpanKind.CLIENT
+    assert second_span.status.status_code == StatusCode.UNSET
+
+    assert dict(second_span.attributes) == {
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_SYSTEM: "openai",
+        GEN_AI_RESPONSE_ID: second_response.id,
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+        GEN_AI_RESPONSE_FINISH_REASONS: ("stop",),
+        GEN_AI_USAGE_INPUT_TOKENS: second_response.usage.prompt_tokens,
+        GEN_AI_USAGE_OUTPUT_TOKENS: second_response.usage.completion_tokens,
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+
+    logs = logs_exporter.get_finished_logs()
+    assert len(logs) == 9
+    log_records = logrecords_from_logs(logs)
+
+    # first call events
+    system_message, user_message, choice = log_records[:3]
+    assert system_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.system.message"}
+    assert system_message.body == {"content": "You are a helpful assistant providing weather updates."}
+    assert user_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert user_message.body == {"content": "What is the weather in New York City and London?"}
+
+    assert_tool_call_log_record(
+        choice,
+        [
+            ToolCall(
+                id=previous_message["tool_calls"][0]["id"],
+                name="get_weather",
+                arguments_json='{"location": "New York City"}',
+            ),
+            ToolCall(
+                id=previous_message["tool_calls"][1]["id"], name="get_weather", arguments_json='{"location": "London"}'
+            ),
+        ],
+    )
+
+    # second call events
+    tool_call_telemetry = previous_message["tool_calls"]
+    for i in range(len(tool_call_telemetry)):
+        tool_call = deepcopy(tool_call_telemetry[i])
+        tool_call["function"].pop("parsed_arguments")
+        tool_call_telemetry[i] = tool_call
+    system_message, user_message, assistant_message, first_tool, second_tool, choice = log_records[3:]
+    assert system_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.system.message"}
+    assert system_message.body == {"content": "You are a helpful assistant providing weather updates."}
+    assert user_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert user_message.body == {"content": "What is the weather in New York City and London?"}
+    assert assistant_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.assistant.message"}
+    assert assistant_message.body == {"tool_calls": tool_call_telemetry}
+    assert first_tool.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.tool.message"}
+    first_tool_response = tool_call_telemetry[0]
+    assert first_tool.body == {"content": "25 degrees and sunny", "id": first_tool_response["id"]}
+    assert second_tool.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.tool.message"}
+    second_tool_response = tool_call_telemetry[1]
+    assert second_tool.body == {"content": "15 degrees and raining", "id": second_tool_response["id"]}
+
+    assert_stop_log_record(choice, second_response.choices[0].message.content)
+
+    operation_duration_metric, token_usage_metric = get_sorted_metrics(metrics_reader)
+    attributes = {
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+    }
+    assert_operation_duration_metric(
+        client, "chat", operation_duration_metric, attributes=attributes, min_data_point=0.007433261722326279, count=2
+    )
+    assert_token_usage_metric(
+        client,
+        "chat",
+        token_usage_metric,
+        attributes=attributes,
+        input_data_point=[first_response.usage.prompt_tokens, second_response.usage.prompt_tokens],
+        output_data_point=[first_response.usage.completion_tokens, second_response.usage.completion_tokens],
+        count=2,
+    )
+
+
+@pytest.mark.asyncio
+@pytest.mark.vcr()
+async def test_chat_async(default_openai_env, trace_exporter, metrics_reader, logs_exporter):
+    client = openai.AsyncOpenAI()
+
+    messages = [
+        {
+            "role": "user",
+            "content": TEST_CHAT_INPUT,
+        }
+    ]
+
+    chat_completion = await client.beta.chat.completions.parse(model=TEST_CHAT_MODEL, messages=messages)
+
+    assert chat_completion.choices[0].message.content == "Atlantic Ocean."
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 1
+
+    span = spans[0]
+    assert span.name == f"chat {TEST_CHAT_MODEL}"
+    assert span.kind == SpanKind.CLIENT
+    assert span.status.status_code == StatusCode.UNSET
+
+    address, port = address_and_port(client)
+    assert dict(span.attributes) == {
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_SYSTEM: "openai",
+        GEN_AI_RESPONSE_ID: "chatcmpl-AfhuGVpfQzbsboUTm9uUCSEUWwEbU",
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+        GEN_AI_RESPONSE_FINISH_REASONS: ("stop",),
+        GEN_AI_USAGE_INPUT_TOKENS: 22,
+        GEN_AI_USAGE_OUTPUT_TOKENS: 3,
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+
+    logs = logs_exporter.get_finished_logs()
+    assert len(logs) == 2
+    log_records = logrecords_from_logs(logs)
+    user_message, choice = log_records
+    assert dict(user_message.attributes) == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert dict(user_message.body) == {}
+
+    assert_stop_log_record(choice)
+
+    operation_duration_metric, token_usage_metric = get_sorted_metrics(metrics_reader)
+    attributes = {
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+    }
+    assert_operation_duration_metric(
+        client, "chat", operation_duration_metric, attributes=attributes, min_data_point=0.006761051714420319
+    )
+    assert_token_usage_metric(
+        client,
+        "chat",
+        token_usage_metric,
+        attributes=attributes,
+        input_data_point=span.attributes[GEN_AI_USAGE_INPUT_TOKENS],
+        output_data_point=span.attributes[GEN_AI_USAGE_OUTPUT_TOKENS],
+    )
+
+
+@pytest.mark.asyncio
+@pytest.mark.vcr()
+async def test_chat_async_with_capture_message_content(
+    default_openai_env, trace_exporter, metrics_reader, logs_exporter
+):
+    # Redo the instrumentation dance to be affected by the environment variable
+    OpenAIInstrumentor().uninstrument()
+    with mock.patch.dict("os.environ", {"OTEL_INSTRUMENTATION_GENAI_CAPTURE_MESSAGE_CONTENT": "true"}):
+        OpenAIInstrumentor().instrument()
+
+    client = openai.AsyncOpenAI()
+
+    messages = [
+        {
+            "role": "user",
+            "content": TEST_CHAT_INPUT,
+        }
+    ]
+
+    chat_completion = await client.beta.chat.completions.parse(model=TEST_CHAT_MODEL, messages=messages)
+
+    content = "South Atlantic Ocean."
+    assert chat_completion.choices[0].message.content == content
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 1
+
+    span = spans[0]
+    assert span.name == f"chat {TEST_CHAT_MODEL}"
+    assert span.kind == SpanKind.CLIENT
+    assert span.status.status_code == StatusCode.UNSET
+
+    address, port = address_and_port(client)
+    assert dict(span.attributes) == {
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_SYSTEM: "openai",
+        GEN_AI_RESPONSE_ID: "chatcmpl-AfhuKQOLh8rjzshDoq35O7wceMSEK",
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+        GEN_AI_RESPONSE_FINISH_REASONS: ("stop",),
+        GEN_AI_USAGE_INPUT_TOKENS: 22,
+        GEN_AI_USAGE_OUTPUT_TOKENS: 4,
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+
+    logs = logs_exporter.get_finished_logs()
+    assert len(logs) == 2
+    log_records = logrecords_from_logs(logs)
+    user_message, choice = log_records
+    assert dict(user_message.attributes) == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert dict(user_message.body) == {"content": TEST_CHAT_INPUT}
+
+    assert_stop_log_record(choice, content)
+
+    operation_duration_metric, token_usage_metric = get_sorted_metrics(metrics_reader)
+    attributes = {
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+    }
+    assert_operation_duration_metric(
+        client, "chat", operation_duration_metric, attributes=attributes, min_data_point=0.006761051714420319
+    )
+    assert_token_usage_metric(
+        client,
+        "chat",
+        token_usage_metric,
+        attributes=attributes,
+        input_data_point=span.attributes[GEN_AI_USAGE_INPUT_TOKENS],
+        output_data_point=span.attributes[GEN_AI_USAGE_OUTPUT_TOKENS],
+    )
+
+
+@pytest.mark.integration
+@pytest.mark.asyncio
+async def test_chat_async_with_capture_message_content_integration(trace_exporter, logs_exporter, metrics_reader):
+    model = os.getenv("TEST_CHAT_MODEL", TEST_CHAT_MODEL)
+
+    # Redo the instrumentation dance to be affected by the environment variable
+    OpenAIInstrumentor().uninstrument()
+    with mock.patch.dict("os.environ", {"OTEL_INSTRUMENTATION_GENAI_CAPTURE_MESSAGE_CONTENT": "true"}):
+        OpenAIInstrumentor().instrument()
+
+    messages = [
+        {
+            "role": "user",
+            "content": TEST_CHAT_INPUT,
+        }
+    ]
+
+    client = get_integration_async_client()
+
+    response = await client.beta.chat.completions.parse(model=model, messages=messages)
+    content = response.choices[0].message.content
+    assert content
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 1
+
+    span = spans[0]
+    assert span.name == f"chat {model}"
+    assert span.kind == SpanKind.CLIENT
+    assert span.status.status_code == StatusCode.UNSET
+
+    address, port = address_and_port(client)
+    assert dict(span.attributes) == {
+        GEN_AI_OPENAI_RESPONSE_SERVICE_TIER: "default",
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_MODEL: model,
+        GEN_AI_SYSTEM: "openai",
+        GEN_AI_RESPONSE_ID: response.id,
+        GEN_AI_RESPONSE_MODEL: response.model,
+        GEN_AI_RESPONSE_FINISH_REASONS: ("stop",),
+        GEN_AI_USAGE_INPUT_TOKENS: response.usage.prompt_tokens,
+        GEN_AI_USAGE_OUTPUT_TOKENS: response.usage.completion_tokens,
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+
+    logs = logs_exporter.get_finished_logs()
+    assert len(logs) == 2
+    log_records = logrecords_from_logs(logs)
+    user_message, choice = log_records
+    assert user_message.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert user_message.body == {"content": TEST_CHAT_INPUT}
+
+    assert_stop_log_record(choice, content)
+
+    operation_duration_metric, token_usage_metric = get_sorted_metrics(metrics_reader)
+    attributes = {
+        GEN_AI_REQUEST_MODEL: model,
+        GEN_AI_RESPONSE_MODEL: response.model,
+    }
+    assert_operation_duration_metric(
+        client, "chat", operation_duration_metric, attributes=attributes, min_data_point=MOCK_POSITIVE_FLOAT
+    )
+    assert_token_usage_metric(
+        client,
+        "chat",
+        token_usage_metric,
+        attributes=attributes,
+        input_data_point=response.usage.prompt_tokens,
+        output_data_point=response.usage.completion_tokens,
+    )
+
+
+@pytest.mark.vcr()
+@pytest.mark.asyncio
+async def test_chat_async_tools_with_capture_message_content(
+    default_openai_env, trace_exporter, metrics_reader, logs_exporter
+):
+    # Redo the instrumentation dance to be affected by the environment variable
+    OpenAIInstrumentor().uninstrument()
+    with mock.patch.dict("os.environ", {"OTEL_INSTRUMENTATION_GENAI_CAPTURE_MESSAGE_CONTENT": "true"}):
+        OpenAIInstrumentor().instrument()
+
+    client = openai.AsyncOpenAI()
+
+    tools = [
+        {
+            "type": "function",
+            "function": {
+                "name": "get_delivery_date",
+                "strict": True,
+                "description": "Get the delivery date for a customer's order. Call this whenever you need to know the delivery date, for example when a customer asks 'Where is my package'",
+                "parameters": {
+                    "type": "object",
+                    "properties": {
+                        "order_id": {
+                            "type": "string",
+                            "description": "The customer's order ID.",
+                        },
+                    },
+                    "required": ["order_id"],
+                    "additionalProperties": False,
+                },
+            },
+        }
+    ]
+
+    messages = [
+        {
+            "role": "system",
+            "content": "You are a helpful customer support assistant. Use the supplied tools to assist the user.",
+        },
+        {"role": "user", "content": "Hi, can you tell me the delivery date for my order?"},
+        {
+            "role": "assistant",
+            "content": "Hi there! I can help with that. Can you please provide your order ID?",
+        },
+        {"role": "user", "content": "i think it is order_12345"},
+    ]
+
+    response = await client.beta.chat.completions.parse(model=TEST_CHAT_MODEL, messages=messages, tools=tools)
+    tool_call = response.choices[0].message.tool_calls[0]
+    assert tool_call.function.name == "get_delivery_date"
+    assert json.loads(tool_call.function.arguments) == {"order_id": "order_12345"}
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 1
+
+    span = spans[0]
+    assert span.name == f"chat {TEST_CHAT_MODEL}"
+    assert span.kind == SpanKind.CLIENT
+    assert span.status.status_code == StatusCode.UNSET
+
+    address, port = address_and_port(client)
+    assert dict(span.attributes) == {
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_SYSTEM: "openai",
+        GEN_AI_RESPONSE_ID: "chatcmpl-AfhuJxYuidCW2KvkwBy6VMnWtdiwb",
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+        GEN_AI_RESPONSE_FINISH_REASONS: ("tool_calls",),
+        GEN_AI_USAGE_INPUT_TOKENS: 140,
+        GEN_AI_USAGE_OUTPUT_TOKENS: 19,
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+
+    logs = logs_exporter.get_finished_logs()
+    assert len(logs) == 5
+    log_records = logrecords_from_logs(logs)
+    system_message, user_message, assistant_message, second_user_message, choice = log_records
+    assert dict(system_message.attributes) == {"gen_ai.system": "openai", "event.name": "gen_ai.system.message"}
+    assert dict(system_message.body) == {
+        "content": "You are a helpful customer support assistant. Use the supplied tools to assist the user."
+    }
+    assert dict(user_message.attributes) == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert dict(user_message.body) == {"content": "Hi, can you tell me the delivery date for my order?"}
+    assert dict(assistant_message.attributes) == {"gen_ai.system": "openai", "event.name": "gen_ai.assistant.message"}
+    assert dict(assistant_message.body) == {
+        "content": "Hi there! I can help with that. Can you please provide your order ID?"
+    }
+    assert dict(second_user_message.attributes) == {"gen_ai.system": "openai", "event.name": "gen_ai.user.message"}
+    assert dict(second_user_message.body) == {"content": "i think it is order_12345"}
+
+    assert_tool_call_log_record(
+        choice, [ToolCall("call_TD1k1LOj7QC0uQPRihIY9Bml", "get_delivery_date", '{"order_id": "order_12345"}')]
+    )
+
+    operation_duration_metric, token_usage_metric = get_sorted_metrics(metrics_reader)
+    attributes = {
+        GEN_AI_REQUEST_MODEL: TEST_CHAT_MODEL,
+        GEN_AI_RESPONSE_MODEL: TEST_CHAT_RESPONSE_MODEL,
+    }
+    assert_operation_duration_metric(
+        client, "chat", operation_duration_metric, attributes=attributes, min_data_point=0.006761051714420319
+    )
+    assert_token_usage_metric(
+        client,
+        "chat",
+        token_usage_metric,
+        attributes=attributes,
+        input_data_point=span.attributes[GEN_AI_USAGE_INPUT_TOKENS],
+        output_data_point=span.attributes[GEN_AI_USAGE_OUTPUT_TOKENS],
+    )
+
+
+@pytest.mark.vcr()
+def test_chat_without_model_parameter(default_openai_env, trace_exporter, metrics_reader):
+    client = openai.OpenAI()
+
+    messages = [
+        {
+            "role": "user",
+            "content": TEST_CHAT_INPUT,
+        }
+    ]
+
+    with pytest.raises(
+        TypeError,
+        match=re.escape("missing 1 required keyword-only argument: 'model'"),
+    ):
+        client.beta.chat.completions.parse(messages=messages)
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 1
+
+    span = spans[0]
+    assert span.name == "chat"
+    assert span.kind == SpanKind.CLIENT
+    assert span.status.status_code == StatusCode.ERROR
+
+    address, port = address_and_port(client)
+    assert dict(span.attributes) == {
+        ERROR_TYPE: "TypeError",
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_SYSTEM: "openai",
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+
+    (operation_duration_metric,) = get_sorted_metrics(metrics_reader)
+    attributes = {
+        "error.type": "TypeError",
+        "server.address": address,
+        "server.port": port,
+    }
+    assert_error_operation_duration_metric(
+        "chat", operation_duration_metric, attributes=attributes, data_point=5, value_delta=5
+    )
+
+
+@pytest.mark.vcr()
+def test_chat_with_model_not_found(default_openai_env, trace_exporter, metrics_reader):
+    client = openai.OpenAI()
+
+    messages = [
+        {
+            "role": "user",
+            "content": TEST_CHAT_INPUT,
+        }
+    ]
+
+    exception = "The model `not-found-TEST_CHAT_MODEL` does not exist or you do not have access to it."
+    with pytest.raises(openai.NotFoundError, match="Error code: 404.*" + re.escape(exception)):
+        client.beta.chat.completions.parse(model="not-found-TEST_CHAT_MODEL", messages=messages)
+
+    spans = trace_exporter.get_finished_spans()
+    assert len(spans) == 1
+
+    span = spans[0]
+    assert span.name == "chat not-found-TEST_CHAT_MODEL"
+    assert span.kind == SpanKind.CLIENT
+    assert span.status.status_code == StatusCode.ERROR
+
+    address, port = address_and_port(client)
+    assert dict(span.attributes) == {
+        ERROR_TYPE: "NotFoundError",
+        GEN_AI_OPERATION_NAME: "chat",
+        GEN_AI_REQUEST_MODEL: "not-found-TEST_CHAT_MODEL",
+        GEN_AI_SYSTEM: "openai",
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+
+    (operation_duration_metric,) = get_sorted_metrics(metrics_reader)
+    attributes = {
+        GEN_AI_REQUEST_MODEL: "not-found-TEST_CHAT_MODEL",
+        "error.type": "NotFoundError",
+        SERVER_ADDRESS: address,
+        SERVER_PORT: port,
+    }
+    assert_error_operation_duration_metric(
+        "chat", operation_duration_metric, attributes=attributes, data_point=0.00230291485786438
+    )
+
+
+@pytest.mark.vcr()
+def test_chat_exported_schema_version(default_openai_env, trace_exporter, metrics_reader):
+    client = openai.OpenAI()
+
+    messages = [
+        {
+            "role": "user",
+            "content": TEST_CHAT_INPUT,
+        }
+    ]
+
+    client.beta.chat.completions.parse(model=TEST_CHAT_MODEL, messages=messages)
+
+    spans = trace_exporter.get_finished_spans()
+    (span,) = spans
+    assert span.instrumentation_scope.schema_url == "https://opentelemetry.io/schemas/1.28.0"
+
+    metrics_data = metrics_reader.get_metrics_data()
+    resource_metrics = metrics_data.resource_metrics
+
+    for metrics in resource_metrics:
+        for scope_metrics in metrics.scope_metrics:
+            assert scope_metrics.schema_url == "https://opentelemetry.io/schemas/1.28.0"
+
+
+@dataclass
+class ToolCall:
+    id: str
+    name: str
+    arguments_json: str
+
+
+def assert_stop_log_record(log_record: LogRecord, expected_content: Optional[str] = None, expected_index=0):
+    assert log_record.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.choice"}
+    assert log_record.body["index"] == expected_index
+    assert log_record.body["finish_reason"] == "stop"
+    message = log_record.body["message"]
+    if expected_content is None:
+        assert "content" not in message
+    else:
+        assert message["content"] == expected_content
+
+
+def assert_tool_call_log_record(log_record: LogRecord, expected_tool_calls: List[ToolCall], expected_index=0):
+    assert log_record.attributes == {"gen_ai.system": "openai", "event.name": "gen_ai.choice"}
+    assert log_record.body["index"] == expected_index
+    assert log_record.body["finish_reason"] == "tool_calls"
+    message = log_record.body["message"]
+    assert_tool_calls(message["tool_calls"], expected_tool_calls)
+
+
+def assert_tool_call_event(event: Event, expected_tool_calls: List[ToolCall]):
+    assert event.name == "gen_ai.content.completion"
+    # The 'gen_ai.completion' attribute is a JSON string, so parse it first.
+    gen_ai_completions = json.loads(event.attributes["gen_ai.completion"])
+
+    gen_ai_completion = gen_ai_completions[0]
+    assert gen_ai_completion["role"] == "assistant"
+    assert gen_ai_completion["content"] == ""
+    assert_tool_calls(gen_ai_completion["tool_calls"], expected_tool_calls)
+
+
+def assert_tool_calls(tool_calls, expected_tool_calls: List[ToolCall]):
+    for i, tool_call in enumerate(tool_calls):
+        expected_call = expected_tool_calls[i]
+        args = tool_call["function"]["arguments"]
+        # The function arguments are also a string, which has different whitespace
+        # in Azure. Assert in a whitespace agnostic way first.
+        assert json.dumps(json.loads(args), sort_keys=True) == expected_call.arguments_json
+
+        assert tool_call == {
+            "id": expected_call.id,
+            "type": "function",
+            "function": {"name": expected_call.name, "arguments": args},
+        }, f"Unexpected tool_call at index {i}: {tool_call} != {expected_call}"

From 576a1237335bcc5241d7fe8c8493bad6516b3644 Mon Sep 17 00:00:00 2001
From: Anuraag Agrawal
Date: Fri, 14 Mar 2025 16:30:44 +0900
Subject: [PATCH 2/5] Accidental

---
 .../tests/cassettes/test_chat_beta.yaml | 140 ------------------
 1 file changed, 140 deletions(-)
 delete mode 100644 instrumentation/elastic-opentelemetry-instrumentation-openai/tests/cassettes/test_chat_beta.yaml

diff --git a/instrumentation/elastic-opentelemetry-instrumentation-openai/tests/cassettes/test_chat_beta.yaml b/instrumentation/elastic-opentelemetry-instrumentation-openai/tests/cassettes/test_chat_beta.yaml
deleted file mode 100644
index d359dbf..0000000
--- a/instrumentation/elastic-opentelemetry-instrumentation-openai/tests/cassettes/test_chat_beta.yaml
+++ /dev/null
@@ -1,140 +0,0 @@
-interactions:
-- request:
-    body: |-
-      {
-        "messages": [
-          {
-            "role": "user",
-            "content": "Answer in up to 3 words: Which ocean contains Bouvet Island?"
-          }
-        ],
-        "model": "gpt-4o-mini",
-        "stream": false
-      }
-    headers:
-      accept:
-      - application/json
-      accept-encoding:
-      - gzip, deflate
-      authorization:
-      - Bearer test_openai_api_key
-      connection:
-      - keep-alive
-      content-length:
-      - '140'
-      content-type:
-      - application/json
-      host:
-      - api.openai.com
-      user-agent:
-      - OpenAI/Python 1.66.3
-      x-stainless-arch:
-      - arm64
-      x-stainless-async:
-      - 'false'
-      x-stainless-helper-method:
-      - beta.chat.completions.parse
-      x-stainless-lang:
-      - python
-      x-stainless-os:
-      - MacOS
-      x-stainless-package-version:
-      - 1.66.3
-      x-stainless-read-timeout:
-      - '600'
-      x-stainless-retry-count:
-      - '0'
-      x-stainless-runtime:
-      - CPython
-      x-stainless-runtime-version:
-      - 3.13.2
-    method: POST
-    uri: https://api.openai.com/v1/chat/completions
-  response:
-    body:
-      string: |-
-        {
-          "id": "chatcmpl-BAtHlTExnZD4baw8rCAETtH5zmgD9",
-          "object": "chat.completion",
-          "created": 1741935497,
-          "model": "gpt-4o-mini-2024-07-18",
-          "choices": [
-            {
-              "index": 0,
-              "message": {
-                "role": "assistant",
-                "content": "Atlantic Ocean",
-                "refusal": null,
-                "annotations": []
-              },
-              "logprobs": null,
-              "finish_reason": "stop"
-            }
-          ],
-          "usage": {
-            "prompt_tokens": 22,
-            "completion_tokens": 3,
-            "total_tokens": 25,
-            "prompt_tokens_details": {
-              "cached_tokens": 0,
-              "audio_tokens": 0
-            },
-            "completion_tokens_details": {
-              "reasoning_tokens": 0,
-              "audio_tokens": 0,
-              "accepted_prediction_tokens": 0,
-              "rejected_prediction_tokens": 0
-            }
-          },
-          "service_tier": "default",
-          "system_fingerprint": "fp_06737a9306"
-        }
-    headers:
-      CF-RAY:
-      - 9201e1b838715eb9-NRT
-      Connection:
-      - keep-alive
-      Content-Type:
-      - application/json
-      Date:
-      - Fri, 14 Mar 2025 06:58:17 GMT
-      Server:
-      - cloudflare
-      Set-Cookie: test_set_cookie
-      Transfer-Encoding:
-      - chunked
-      X-Content-Type-Options:
-      - nosniff
-      access-control-expose-headers:
-      - X-Request-ID
-      alt-svc:
-      - h3=":443"; ma=86400
-      cf-cache-status:
-      - DYNAMIC
-      content-length:
-      - '820'
-      openai-organization: test_openai_org_id
-      openai-processing-ms:
-      - '253'
-      openai-version:
-      - '2020-10-01'
-      strict-transport-security:
-      - max-age=31536000; includeSubDomains; preload
-      x-ratelimit-limit-requests:
-      - '10000'
-      x-ratelimit-limit-tokens:
-      - '200000'
-      x-ratelimit-remaining-requests:
- - '9999' - x-ratelimit-remaining-tokens: - - '199968' - x-ratelimit-reset-requests: - - 8.64s - x-ratelimit-reset-tokens: - - 9ms - x-request-id: - - req_381ebd7d156c172900193e7a98982e79 - status: - code: 200 - message: OK -version: 1 From 4e7d9947af7c866f4c59d59d036e205db1a45801 Mon Sep 17 00:00:00 2001 From: Anuraag Agrawal Date: Fri, 14 Mar 2025 16:36:03 +0900 Subject: [PATCH 3/5] Set min version --- .../tests/test_beta_chat_completions.py | 19 ++++++++++++++++++- 1 file changed, 18 insertions(+), 1 deletion(-) diff --git a/instrumentation/elastic-opentelemetry-instrumentation-openai/tests/test_beta_chat_completions.py b/instrumentation/elastic-opentelemetry-instrumentation-openai/tests/test_beta_chat_completions.py index 76cabe0..270e2b6 100644 --- a/instrumentation/elastic-opentelemetry-instrumentation-openai/tests/test_beta_chat_completions.py +++ b/instrumentation/elastic-opentelemetry-instrumentation-openai/tests/test_beta_chat_completions.py @@ -67,6 +67,7 @@ TEST_CHAT_INPUT = "Answer in up to 3 words: Which ocean contains Bouvet Island?" +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.vcr() def test_chat(default_openai_env, trace_exporter, metrics_reader, logs_exporter): client = openai.OpenAI() @@ -131,6 +132,7 @@ def test_chat(default_openai_env, trace_exporter, metrics_reader, logs_exporter) ) +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.vcr() def test_chat_with_developer_role_message(default_openai_env, trace_exporter, metrics_reader, logs_exporter): client = openai.OpenAI() @@ -203,7 +205,7 @@ def test_chat_with_developer_role_message(default_openai_env, trace_exporter, me ) -@pytest.mark.skipif(OPENAI_VERSION < (1, 35, 0), reason="service tier added in 1.35.0") +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.vcr() def test_chat_all_the_client_options(default_openai_env, trace_exporter, metrics_reader, logs_exporter): client = openai.OpenAI() @@ -292,6 +294,7 @@ def test_chat_all_the_client_options(default_openai_env, trace_exporter, metrics ) +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.vcr() def test_chat_multiple_choices_with_capture_message_content( default_openai_env, trace_exporter, metrics_reader, logs_exporter @@ -365,6 +368,7 @@ def test_chat_multiple_choices_with_capture_message_content( ) +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.vcr() def test_chat_function_calling_with_tools(default_openai_env, trace_exporter, metrics_reader, logs_exporter): client = openai.OpenAI() @@ -467,6 +471,7 @@ def test_chat_function_calling_with_tools(default_openai_env, trace_exporter, me ) +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.vcr() def test_chat_tools_with_capture_message_content(default_openai_env, trace_exporter, logs_exporter, metrics_reader): # Redo the instrumentation dance to be affected by the environment variable @@ -577,6 +582,7 @@ def test_chat_tools_with_capture_message_content(default_openai_env, trace_expor ) +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.integration def test_chat_tools_with_capture_message_content_integration(trace_exporter, logs_exporter, metrics_reader): client = get_integration_client() @@ -687,6 +693,7 @@ def 
test_chat_tools_with_capture_message_content_integration(trace_exporter, log ) +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") def test_chat_connection_error(default_openai_env, trace_exporter, metrics_reader, logs_exporter): client = openai.Client(base_url="http://localhost:9999/v5", api_key="not-read", max_retries=1) messages = [ @@ -737,6 +744,7 @@ def test_chat_connection_error(default_openai_env, trace_exporter, metrics_reade ) +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.integration def test_chat_with_capture_message_content_integration(trace_exporter, logs_exporter, metrics_reader): model = os.getenv("TEST_CHAT_MODEL", TEST_CHAT_MODEL) @@ -812,6 +820,7 @@ def test_chat_with_capture_message_content_integration(trace_exporter, logs_expo ) +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.vcr() def test_chat_with_capture_message_content(default_openai_env, trace_exporter, logs_exporter, metrics_reader): client = openai.OpenAI() @@ -882,6 +891,7 @@ def test_chat_with_capture_message_content(default_openai_env, trace_exporter, l ) +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.vcr() def test_chat_tools_with_followup_and_capture_message_content( default_openai_env, trace_exporter, metrics_reader, logs_exporter @@ -1053,6 +1063,7 @@ def test_chat_tools_with_followup_and_capture_message_content( ) +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.asyncio @pytest.mark.vcr() async def test_chat_async(default_openai_env, trace_exporter, metrics_reader, logs_exporter): @@ -1118,6 +1129,7 @@ async def test_chat_async(default_openai_env, trace_exporter, metrics_reader, lo ) +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.asyncio @pytest.mark.vcr() async def test_chat_async_with_capture_message_content( @@ -1191,6 +1203,7 @@ async def test_chat_async_with_capture_message_content( ) +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.integration @pytest.mark.asyncio async def test_chat_async_with_capture_message_content_integration(trace_exporter, logs_exporter, metrics_reader): @@ -1264,6 +1277,7 @@ async def test_chat_async_with_capture_message_content_integration(trace_exporte ) +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.vcr() @pytest.mark.asyncio async def test_chat_async_tools_with_capture_message_content( @@ -1377,6 +1391,7 @@ async def test_chat_async_tools_with_capture_message_content( ) +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.vcr() def test_chat_without_model_parameter(default_openai_env, trace_exporter, metrics_reader): client = openai.OpenAI() @@ -1422,6 +1437,7 @@ def test_chat_without_model_parameter(default_openai_env, trace_exporter, metric ) +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.vcr() def test_chat_with_model_not_found(default_openai_env, trace_exporter, metrics_reader): client = openai.OpenAI() @@ -1467,6 +1483,7 @@ def test_chat_with_model_not_found(default_openai_env, trace_exporter, metrics_r ) +@pytest.mark.skipif(OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0") @pytest.mark.vcr() 
def test_chat_exported_schema_version(default_openai_env, trace_exporter, metrics_reader): client = openai.OpenAI() From 4f6727b9f8fe0ec625ec4af077bc38af2aecc349 Mon Sep 17 00:00:00 2001 From: Anuraag Agrawal Date: Fri, 14 Mar 2025 16:42:56 +0900 Subject: [PATCH 4/5] Check version before patching --- .../instrumentation/openai/__init__.py | 24 ++++++++++--------- 1 file changed, 13 insertions(+), 11 deletions(-) diff --git a/instrumentation/elastic-opentelemetry-instrumentation-openai/src/opentelemetry/instrumentation/openai/__init__.py b/instrumentation/elastic-opentelemetry-instrumentation-openai/src/opentelemetry/instrumentation/openai/__init__.py index 0289823..acde7ae 100644 --- a/instrumentation/elastic-opentelemetry-instrumentation-openai/src/opentelemetry/instrumentation/openai/__init__.py +++ b/instrumentation/elastic-opentelemetry-instrumentation-openai/src/opentelemetry/instrumentation/openai/__init__.py @@ -99,27 +99,29 @@ def _instrument(self, **kwargs): register_post_import_hook(self._patch, "openai") - def _patch(self, _module): + def _patch(self, module): + version = tuple([int(x) for x in getattr(getattr(module, "version"), "VERSION").split(".")]) wrap_function_wrapper( "openai.resources.chat.completions", "Completions.create", self._chat_completion_wrapper, ) - wrap_function_wrapper( - "openai.resources.beta.chat.completions", - "Completions.parse", - self._chat_completion_wrapper, - ) wrap_function_wrapper( "openai.resources.chat.completions", "AsyncCompletions.create", self._async_chat_completion_wrapper, ) - wrap_function_wrapper( - "openai.resources.beta.chat.completions", - "AsyncCompletions.parse", - self._async_chat_completion_wrapper, - ) + if version >= (1, 40, 0): + wrap_function_wrapper( + "openai.resources.beta.chat.completions", + "Completions.parse", + self._chat_completion_wrapper, + ) + wrap_function_wrapper( + "openai.resources.beta.chat.completions", + "AsyncCompletions.parse", + self._async_chat_completion_wrapper, + ) wrap_function_wrapper( "openai.resources.embeddings", "Embeddings.create", From 39861f2289043ae975a5478010b9b8908c15a870 Mon Sep 17 00:00:00 2001 From: Anuraag Agrawal Date: Fri, 14 Mar 2025 16:44:58 +0900 Subject: [PATCH 5/5] Check version before unwrap --- .../src/opentelemetry/instrumentation/openai/__init__.py | 8 +++++--- 1 file changed, 5 insertions(+), 3 deletions(-) diff --git a/instrumentation/elastic-opentelemetry-instrumentation-openai/src/opentelemetry/instrumentation/openai/__init__.py b/instrumentation/elastic-opentelemetry-instrumentation-openai/src/opentelemetry/instrumentation/openai/__init__.py index acde7ae..fddc770 100644 --- a/instrumentation/elastic-opentelemetry-instrumentation-openai/src/opentelemetry/instrumentation/openai/__init__.py +++ b/instrumentation/elastic-opentelemetry-instrumentation-openai/src/opentelemetry/instrumentation/openai/__init__.py @@ -101,6 +101,7 @@ def _instrument(self, **kwargs): def _patch(self, module): version = tuple([int(x) for x in getattr(getattr(module, "version"), "VERSION").split(".")]) + self.beta_chat_available = version >= (1, 40, 0) wrap_function_wrapper( "openai.resources.chat.completions", "Completions.create", @@ -111,7 +112,7 @@ def _patch(self, module): "AsyncCompletions.create", self._async_chat_completion_wrapper, ) - if version >= (1, 40, 0): + if self.beta_chat_available: wrap_function_wrapper( "openai.resources.beta.chat.completions", "Completions.parse", @@ -139,9 +140,10 @@ def _uninstrument(self, **kwargs): import openai 
unwrap(openai.resources.chat.completions.Completions, "create") - unwrap(openai.resources.beta.chat.completions.Completions, "parse") unwrap(openai.resources.chat.completions.AsyncCompletions, "create") - unwrap(openai.resources.beta.chat.completions.AsyncCompletions, "parse") + if self.beta_chat_available: + unwrap(openai.resources.beta.chat.completions.Completions, "parse") + unwrap(openai.resources.beta.chat.completions.AsyncCompletions, "parse") unwrap(openai.resources.embeddings.Embeddings, "create") unwrap(openai.resources.embeddings.AsyncEmbeddings, "create")
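
Editorial note on the patches above, with two hedged sketches. These are standalone illustrations under stated assumptions, not part of the series itself:

1) After PATCH 3/5, every test in test_beta_chat_completions.py carries the same skipif marker. If the whole module only applies on openai >= 1.40.0, pytest's module-level pytestmark would express the gate once (assuming OPENAI_VERSION is importable at module scope, as the per-test markers already imply):

    pytestmark = pytest.mark.skipif(
        OPENAI_VERSION < (1, 40, 0), reason="beta completions added in 1.40.0"
    )

2) PATCH 4/5 parses openai.version.VERSION with a plain int() over each dotted component, which would raise ValueError if the version string ever carried a non-numeric component, and PATCH 5/5 assigns beta_chat_available only inside _patch, so any code path that reached _uninstrument without _patch having fired would hit an AttributeError. A minimal sketch of a more defensive variant; parse_version is a hypothetical helper, not an existing function in this package:

    import re

    def parse_version(version_str: str) -> tuple:
        # Keep only the leading digits of each dotted component so that a
        # hypothetical pre-release string such as "1.40.0-beta.1" still
        # yields a comparable tuple instead of raising ValueError.
        parts = []
        for component in version_str.split(".")[:3]:
            match = re.match(r"\d+", component)
            parts.append(int(match.group()) if match else 0)
        return tuple(parts)

    assert parse_version("1.66.3") == (1, 66, 3)
    assert parse_version("1.40.0-beta.1") == (1, 40, 0)

    # In _uninstrument, a getattr default would keep the unwrap safe even
    # if the flag was never set:
    #     if getattr(self, "beta_chat_available", False):
    #         unwrap(openai.resources.beta.chat.completions.Completions, "parse")
    #         unwrap(openai.resources.beta.chat.completions.AsyncCompletions, "parse")

In practice the AttributeError path may be unreachable, since _uninstrument imports openai and that import would fire the registered post-import hook (and hence _patch) first; the getattr default simply makes the teardown independent of that ordering.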