
Commit 2d1afc0

botocore: handle amazon nova tool call events for InvokeModelWithResponseStream
1 parent e9ca00c commit 2d1afc0

8 files changed: +2233 -994 lines changed

instrumentation/opentelemetry-instrumentation-botocore/src/opentelemetry/instrumentation/botocore/extensions/bedrock_utils.py

Lines changed: 21 additions & 1 deletion
@@ -216,25 +216,45 @@ def _process_amazon_titan_chunk(self, chunk):
 
     def _process_amazon_nova_chunk(self, chunk):
         # pylint: disable=too-many-branches
-        # TODO: handle tool calls!
         if "messageStart" in chunk:
             # {'messageStart': {'role': 'assistant'}}
             if chunk["messageStart"].get("role") == "assistant":
                 self._record_message = True
                 self._message = {"role": "assistant", "content": []}
             return
 
+        if "contentBlockStart" in chunk:
+            # {'contentBlockStart': {'start': {'toolUse': {'toolUseId': 'id', 'name': 'name'}}, 'contentBlockIndex': 31}}
+            if self._record_message:
+                self._message["content"].append(self._content_block)
+                self._content_block = {}
+                start = chunk["contentBlockStart"].get("start", {})
+                if "toolUse" in start:
+                    self._content_block = start
+            return
+
         if "contentBlockDelta" in chunk:
             # {'contentBlockDelta': {'delta': {'text': "Hello"}, 'contentBlockIndex': 0}}
+            # {'contentBlockDelta': {'delta': {'toolUse': {'input': '{"location":"San Francisco"}'}}, 'contentBlockIndex': 31}}
             if self._record_message:
                 delta = chunk["contentBlockDelta"].get("delta", {})
                 if "text" in delta:
                     self._content_block.setdefault("text", "")
                     self._content_block["text"] += delta["text"]
+                elif "toolUse" in delta:
+                    self._content_block.setdefault("toolUse", {})
+                    self._content_block["toolUse"]["input"] = json.loads(
+                        delta["toolUse"]["input"]
+                    )
             return
 
         if "contentBlockStop" in chunk:
             # {'contentBlockStop': {'contentBlockIndex': 0}}
+            if self._record_message:
+                # create a new content block only for tools
+                if "toolUse" in self._content_block:
+                    self._message["content"].append(self._content_block)
+                    self._content_block = {}
             return
 
         if "messageStop" in chunk:

instrumentation/opentelemetry-instrumentation-botocore/tests/cassettes/test_invoke_model_with_response_stream_no_content_tool_call.yaml

Lines changed: 0 additions & 468 deletions
This file was deleted.

instrumentation/opentelemetry-instrumentation-botocore/tests/cassettes/test_invoke_model_with_response_stream_no_content_tool_call[amazon.nova].yaml

Lines changed: 456 additions & 0 deletions
Large diffs are not rendered by default.

instrumentation/opentelemetry-instrumentation-botocore/tests/cassettes/test_invoke_model_with_response_stream_no_content_tool_call[anthropic.claude].yaml

Lines changed: 460 additions & 0 deletions
Large diffs are not rendered by default.

instrumentation/opentelemetry-instrumentation-botocore/tests/cassettes/test_invoke_model_with_response_stream_with_content_tool_call.yaml

Lines changed: 0 additions & 473 deletions
This file was deleted.

instrumentation/opentelemetry-instrumentation-botocore/tests/cassettes/test_invoke_model_with_response_stream_with_content_tool_call[amazon.nova].yaml

Lines changed: 643 additions & 0 deletions
Large diffs are not rendered by default.

instrumentation/opentelemetry-instrumentation-botocore/tests/cassettes/test_invoke_model_with_response_stream_with_content_tool_call[anthropic.claude].yaml

Lines changed: 484 additions & 0 deletions
Large diffs are not rendered by default.

instrumentation/opentelemetry-instrumentation-botocore/tests/test_botocore_bedrock.py

Lines changed: 169 additions & 52 deletions
@@ -2032,20 +2032,24 @@ def invoke_model_with_response_stream_tool_call(
     expect_content,
 ):
     # pylint:disable=too-many-locals,too-many-statements,too-many-branches
-    messages = [
-        {
-            "role": "user",
-            "content": [
-                {
-                    "text": "What is the weather in Seattle and San Francisco today? Please expect one tool call for Seattle and one for San Francisco",
-                    "type": "text",
-                }
-            ],
+    user_prompt = "What is the weather in Seattle and San Francisco today? Please give one tool call for Seattle and one for San Francisco"
+    if "anthropic.claude" in llm_model_value:
+        user_msg_content = {
+            "text": user_prompt,
+            "type": "text",
         }
-    ]
+    else:
+        user_msg_content = {
+            "text": user_prompt,
+        }
+    messages = [{"role": "user", "content": [user_msg_content]}]
 
     max_tokens = 1000
-    tool_config = get_anthropic_tool_config()
+    if "anthropic.claude" in llm_model_value:
+        tool_config = get_anthropic_tool_config()
+    else:
+        tool_config = get_tool_config()
+
     body = get_invoke_model_body(
         llm_model_value,
         messages=messages,
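
The branch on llm_model_value exists because the two model families expect differently shaped tool definitions: Claude's native messages API takes a flat tools list with an input_schema per tool, while Nova uses the Converse-style toolConfig with a toolSpec wrapper. The helpers are defined elsewhere in the test module, so the bodies below are illustrative sketches of the two shapes for a single hypothetical weather tool, not the actual helper code.

def get_anthropic_tool_config():
    # Claude-native tool definition (illustrative sketch, not the real helper)
    return [
        {
            "name": "get_current_weather",
            "description": "Get the current weather in a given location.",
            "input_schema": {
                "type": "object",
                "properties": {"location": {"type": "string"}},
                "required": ["location"],
            },
        }
    ]


def get_tool_config():
    # Converse-style toolConfig used by Amazon Nova (illustrative sketch)
    return {
        "tools": [
            {
                "toolSpec": {
                    "name": "get_current_weather",
                    "description": "Get the current weather in a given location.",
                    "inputSchema": {
                        "json": {
                            "type": "object",
                            "properties": {"location": {"type": "string"}},
                            "required": ["location"],
                        }
                    },
                }
            }
        ]
    }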
@@ -2059,12 +2063,16 @@ def invoke_model_with_response_stream_tool_call(
 
     content = []
     content_block = {}
+    # used only by anthropic claude
     input_json_buf = ""
+    # used only by amazon nova
+    tool_use = None
     for event in response_0["body"]:
         json_bytes = event["chunk"].get("bytes", b"")
         decoded = json_bytes.decode("utf-8")
         chunk = json.loads(decoded)
 
+        # anthropic claude
        if (message_type := chunk.get("type")) is not None:
             if message_type == "content_block_start":
                 content_block = chunk["content_block"]
@@ -2079,28 +2087,81 @@ def invoke_model_with_response_stream_tool_call(
             content.append(content_block)
             content_block = None
             input_json_buf = ""
+        else:
+            if "contentBlockDelta" in chunk:
+                delta = chunk["contentBlockDelta"]["delta"]
+                if "text" in delta:
+                    content_block.setdefault("text", "")
+                    content_block["text"] += delta["text"]
+                elif "toolUse" in delta:
+                    tool_use["toolUse"]["input"] = json.loads(
+                        delta["toolUse"]["input"]
+                    )
+            elif "contentBlockStart" in chunk:
+                if content_block:
+                    content.append(content_block)
+                    content_block = {}
+                start = chunk["contentBlockStart"]["start"]
+                if "toolUse" in start:
+                    tool_use = start
+            elif "contentBlockStop" in chunk:
+                if tool_use:
+                    content.append(tool_use)
+                    tool_use = {}
 
     assert content
 
-    tool_requests_ids = [
-        item["id"] for item in content if item["type"] == "tool_use"
-    ]
+    if "anthropic.claude" in llm_model_value:
+        tool_requests_ids = [
+            item["id"] for item in content if item["type"] == "tool_use"
+        ]
+    else:
+        tool_requests_ids = [
+            item["toolUse"]["toolUseId"]
+            for item in content
+            if "toolUse" in item
+        ]
+
     assert len(tool_requests_ids) == 2
-    tool_call_result = {
-        "role": "user",
-        "content": [
-            {
-                "type": "tool_result",
-                "tool_use_id": tool_requests_ids[0],
-                "content": "50 degrees and raining",
-            },
-            {
-                "type": "tool_result",
-                "tool_use_id": tool_requests_ids[1],
-                "content": "70 degrees and sunny",
-            },
-        ],
-    }
+
+    if "anthropic.claude" in llm_model_value:
+        tool_call_result = {
+            "role": "user",
+            "content": [
+                {
+                    "type": "tool_result",
+                    "tool_use_id": tool_requests_ids[0],
+                    "content": "50 degrees and raining",
+                },
+                {
+                    "type": "tool_result",
+                    "tool_use_id": tool_requests_ids[1],
+                    "content": "70 degrees and sunny",
+                },
+            ],
+        }
+    else:
+        tool_call_result = {
+            "role": "user",
+            "content": [
+                {
+                    "toolResult": {
+                        "toolUseId": tool_requests_ids[0],
+                        "content": [
+                            {"json": {"weather": "50 degrees and raining"}}
+                        ],
+                    }
+                },
+                {
+                    "toolResult": {
+                        "toolUseId": tool_requests_ids[1],
+                        "content": [
+                            {"json": {"weather": "70 degrees and sunny"}}
+                        ],
+                    }
+                },
+            ],
+        }
 
     # remove extra attributes from response
     messages.append({"role": "assistant", "content": content})
@@ -2112,14 +2173,40 @@ def invoke_model_with_response_stream_tool_call(
         max_tokens=max_tokens,
         tools=tool_config,
     )
     response_1 = bedrock_runtime_client.invoke_model_with_response_stream(
         body=body,
         modelId=llm_model_value,
     )
 
-    # consume the body to have it traced
-    for _ in response_1["body"]:
-        pass
+    content_block = {}
+    response_1_content = []
+    for event in response_1["body"]:
+        json_bytes = event["chunk"].get("bytes", b"")
+        decoded = json_bytes.decode("utf-8")
+        chunk = json.loads(decoded)
+
+        # anthropic claude
+        if (message_type := chunk.get("type")) is not None:
+            if message_type == "content_block_start":
+                content_block = chunk["content_block"]
+            elif message_type == "content_block_delta":
+                if chunk["delta"]["type"] == "text_delta":
+                    content_block["text"] += chunk["delta"]["text"]
+            elif message_type == "content_block_stop":
+                response_1_content.append(content_block)
+                content_block = None
+        else:
+            if "contentBlockDelta" in chunk:
+                delta = chunk["contentBlockDelta"]["delta"]
+                if "text" in delta:
+                    content_block.setdefault("text", "")
+                    content_block["text"] += delta["text"]
+            elif "messageStop" in chunk:
+                if content_block:
+                    response_1_content.append(content_block)
+                    content_block = {}
+
+    assert response_1_content
 
     (span_0, span_1) = span_exporter.get_finished_spans()
     assert_stream_completion_attributes(
@@ -2194,21 +2281,38 @@ def invoke_model_with_response_stream_tool_call(
         assistant_body,
         span_1,
     )
-    tool_message_0 = {
-        "id": tool_requests_ids[0],
-        "content": tool_call_result["content"][0]["content"]
-        if expect_content
-        else None,
-    }
+
+    if "anthropic.claude" in llm_model_value:
+        tool_message_0 = {
+            "id": tool_requests_ids[0],
+            "content": tool_call_result["content"][0]["content"]
+            if expect_content
+            else None,
+        }
+        tool_message_1 = {
+            "id": tool_requests_ids[1],
+            "content": tool_call_result["content"][1]["content"]
+            if expect_content
+            else None,
+        }
+    else:
+        tool_message_0 = {
+            "id": tool_requests_ids[0],
+            "content": tool_call_result["content"][0]["toolResult"]["content"]
+            if expect_content
+            else None,
+        }
+        tool_message_1 = {
+            "id": tool_requests_ids[1],
+            "content": tool_call_result["content"][1]["toolResult"]["content"]
+            if expect_content
+            else None,
+        }
+
     assert_message_in_logs(
         logs[4], "gen_ai.tool.message", tool_message_0, span_1
     )
-    tool_message_1 = {
-        "id": tool_requests_ids[1],
-        "content": tool_call_result["content"][1]["content"]
-        if expect_content
-        else None,
-    }
+
     assert_message_in_logs(
         logs[5], "gen_ai.tool.message", tool_message_1, span_1
     )
@@ -2225,27 +2329,31 @@ def invoke_model_with_response_stream_tool_call(
         "finish_reason": "end_turn",
         "message": {
             "role": "assistant",
-            "content": [
-                {
-                    "type": "text",
-                    "text": "\n\nGreat! I have the current weather information for both cities. Here's the weather in Seattle and San Francisco today:\n\nSeattle: 50 degrees and raining\nSan Francisco: 70 degrees and sunny\n\nAs you can see, the weather is quite different in these two cities today. Seattle is experiencing cooler temperatures with rain, which is fairly typical for the city. On the other hand, San Francisco is enjoying a warm and sunny day. If you're planning any activities, you might want to consider indoor options for Seattle, while it's a great day for outdoor activities in San Francisco.\n\nIs there anything else you'd like to know about the weather in these cities or any other locations?",
-                }
-            ],
+            "content": response_1_content,
         },
     }
     if not expect_content:
         choice_body["message"].pop("content")
     assert_message_in_logs(logs[7], "gen_ai.choice", choice_body, span_1)
 
 
+@pytest.mark.parametrize(
+    "model_family",
+    ["amazon.nova", "anthropic.claude"],
+)
 @pytest.mark.vcr()
 def test_invoke_model_with_response_stream_with_content_tool_call(
     span_exporter,
     log_exporter,
     bedrock_runtime_client,
     instrument_with_content,
+    model_family,
 ):
-    llm_model_value = "us.anthropic.claude-3-5-sonnet-20240620-v1:0"
+    if model_family == "amazon.nova":
+        llm_model_value = "amazon.nova-micro-v1:0"
+    elif model_family == "anthropic.claude":
+        llm_model_value = "us.anthropic.claude-3-5-sonnet-20240620-v1:0"
+
     invoke_model_with_response_stream_tool_call(
         span_exporter,
         log_exporter,
@@ -2412,13 +2520,22 @@ def test_invoke_model_with_response_stream_no_content_different_events(
     assert_message_in_logs(logs[4], "gen_ai.choice", choice_body, span)
 
 
+@pytest.mark.parametrize(
+    "model_family",
+    ["amazon.nova", "anthropic.claude"],
+)
 @pytest.mark.vcr()
 def test_invoke_model_with_response_stream_no_content_tool_call(
     span_exporter,
     log_exporter,
     bedrock_runtime_client,
     instrument_no_content,
+    model_family,
 ):
-    llm_model_value = "us.anthropic.claude-3-5-sonnet-20240620-v1:0"
+    if model_family == "amazon.nova":
+        llm_model_value = "amazon.nova-micro-v1:0"
+    elif model_family == "anthropic.claude":
+        llm_model_value = "us.anthropic.claude-3-5-sonnet-20240620-v1:0"
+
     invoke_model_with_response_stream_tool_call(
         span_exporter,
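
Putting the pieces together, under the amazon.nova parametrization the second invoke_model_with_response_stream request replays a conversation shaped roughly as follows; the toolUseId values stand in for ids captured from the first streamed response, and the tool name and inputs are illustrative:

user_prompt = "What is the weather in Seattle and San Francisco today? Please give one tool call for Seattle and one for San Francisco"

messages = [
    {"role": "user", "content": [{"text": user_prompt}]},
    {
        "role": "assistant",
        "content": [
            {"toolUse": {"toolUseId": "<id-0>", "name": "get_current_weather",
                         "input": {"location": "Seattle"}}},
            {"toolUse": {"toolUseId": "<id-1>", "name": "get_current_weather",
                         "input": {"location": "San Francisco"}}},
        ],
    },
    {
        "role": "user",
        "content": [
            {"toolResult": {"toolUseId": "<id-0>",
                            "content": [{"json": {"weather": "50 degrees and raining"}}]}},
            {"toolResult": {"toolUseId": "<id-1>",
                            "content": [{"json": {"weather": "70 degrees and sunny"}}]}},
        ],
    },
]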
