Add better tracing for sync_provider

danielmillerp · danielmillerp · commit e063b122137e · 2025-11-04T12:36:08.000-05:00
diff --git a/src/agentex/lib/adk/providers/_modules/sync_provider.py b/src/agentex/lib/adk/providers/_modules/sync_provider.py
@@ -109,10 +109,94 @@ async def get_response(
 
                 response = await self.original_model.get_response(**kwargs)
 
-                # Set span output
-                if span:
+                # Set span output with structured data
+                if span and response:
+                    new_items = []
+                    final_output = None
+
+                    # Extract final output text from response
+                    response_final_output = getattr(response, 'final_output', None)
+                    if response_final_output:
+                        final_output = response_final_output
+
+                    # Extract items from the response output
+                    response_output = getattr(response, 'output', None)
+                    if response_output:
+                        output_items = response_output if isinstance(response_output, list) else [response_output]
+
+                        for item in output_items:
+                            item_type = getattr(item, 'type', None)
+
+                            # Handle reasoning items
+                            if item_type == 'reasoning':
+                                reasoning_summary = []
+                                summary = getattr(item, 'summary', None)
+                                if summary:
+                                    for summary_part in summary:
+                                        text = getattr(summary_part, 'text', None)
+                                        if text:
+                                            reasoning_summary.append({
+                                                "text": text,
+                                                "type": "summary_text"
+                                            })
+
+                                new_items.append({
+                                    "id": getattr(item, 'id', None),
+                                    "type": "reasoning",
+                                    "status": getattr(item, 'status', None),
+                                    "content": None,
+                                    "summary": reasoning_summary if reasoning_summary else None,
+                                })
+
+                            # Handle tool call items
+                            elif item_type == 'function_call':
+                                new_items.append({
+                                    "id": getattr(item, 'id', None),
+                                    "name": getattr(item, 'name', None),
+                                    "type": "function_call",
+                                    "status": getattr(item, 'status', 'completed'),
+                                    "call_id": getattr(item, 'call_id', None),
+                                    "arguments": getattr(item, 'arguments', None),
+                                })
+
+                            # Handle tool output items
+                            elif item_type == 'function_call_output':
+                                new_items.append({
+                                    "type": "function_call_output",
+                                    "output": getattr(item, 'output', None),
+                                    "call_id": getattr(item, 'call_id', None),
+                                })
+
+                            # Handle message items
+                            elif item_type == 'message':
+                                content = []
+                                message_text = ""
+                                item_content = getattr(item, 'content', None)
+                                if item_content:
+                                    for content_part in item_content:
+                                        text = getattr(content_part, 'text', None)
+                                        if text:
+                                            content.append({
+                                                "text": text,
+                                                "type": "output_text",
+                                            })
+                                            message_text = text
+
+                                new_items.append({
+                                    "id": getattr(item, 'id', None),
+                                    "role": getattr(item, 'role', 'assistant'),
+                                    "type": "message",
+                                    "status": getattr(item, 'status', 'completed'),
+                                    "content": content,
+                                })
+
+                                # Fall back to the message text only when no final_output was found yet
+                                if message_text and not final_output:
+                                    final_output = message_text
+
                     span.output = {
-                        "response": str(response) if response else None,
+                        "new_items": new_items,
+                        "final_output": final_output,
                     }
 
                 return response
@@ -160,7 +244,9 @@ async def stream_response(
         # Wrap the streaming in a tracing span if tracer is available
         if self.tracer and self.trace_id:
             trace = self.tracer.trace(self.trace_id)
-            async with trace.span(
+
+            # Manually start the span instead of using context manager
+            span = await trace.start_span(
                 parent_id=self.parent_span_id,
                 name="run_agent_streamed",
                 input={
@@ -172,7 +258,9 @@ async def stream_response(
                     "handoffs": [str(h) for h in handoffs] if handoffs else [],
                     "previous_response_id": previous_response_id,
                 },
-            ) as span:
+            )
+
+            try:
                 # Get the stream from the original model
                 stream_kwargs = {
                     "system_instructions": system_instructions,
@@ -193,23 +281,170 @@ async def stream_response(
                 # Get the stream response from the original model and yield each event
                 stream_response = self.original_model.stream_response(**stream_kwargs)
 
-                # Pass through each event from the original stream
-                event_count = 0
-                final_output = None
+                # Pass through each event from the original stream and track items
+                new_items = []
+                final_response_text = ""
+                current_text_item = None
+                tool_call_map = {}  # Map call_id to tool name
+
                 async for event in stream_response:
-                    event_count += 1
-                    # Track the final output if available
-                    if hasattr(event, 'type') and event.type == 'raw_response_event':
-                        if hasattr(event.data, 'output'):
-                            final_output = event.data.output
+                    event_type = getattr(event, 'type', 'no-type')
+
+                    # Handle response.output_item.done events which contain completed items
+                    if event_type == 'response.output_item.done':
+                        item = getattr(event, 'item', None)
+                        if item is not None:
+                            item_type = getattr(item, 'type', None)
+
+                            # Handle function call (tool request)
+                            if item_type == 'function_call':
+                                call_id = getattr(item, 'call_id', None)
+                                name = getattr(item, 'name', None)
+                                new_items.append({
+                                    "id": getattr(item, 'id', None),
+                                    "name": name,
+                                    "type": "function_call",
+                                    "status": getattr(item, 'status', 'completed'),
+                                    "call_id": call_id,
+                                    "arguments": getattr(item, 'arguments', None),
+                                })
+                                if call_id and name:
+                                    tool_call_map[call_id] = name
+
+                            # Handle completed message items (final text output)
+                            elif item_type == 'message':
+                                content = []
+                                message_text = ""
+                                item_content = getattr(item, 'content', None)
+                                if item_content:
+                                    for content_part in item_content:
+                                        text = getattr(content_part, 'text', None)
+                                        if text:
+                                            content.append({
+                                                "text": text,
+                                                "type": "output_text",
+                                            })
+                                            # Remember this part's text; the last text part seen becomes the final output
+                                            message_text = text
+
+                                new_items.append({
+                                    "id": getattr(item, 'id', None),
+                                    "role": getattr(item, 'role', 'assistant'),
+                                    "type": "message",
+                                    "status": getattr(item, 'status', 'completed'),
+                                    "content": content,
+                                })
+
+                                # Replace any delta-accumulated text with this message's last text part
+                                if message_text:
+                                    final_response_text = message_text
+
+                    # Track reasoning, tool calls, and tool outputs from run_item_stream_event (kept for compatibility)
+                    if event_type == 'run_item_stream_event':
+                        item = getattr(event, 'item', None)
+                        if item is not None:
+                            item_type = getattr(item, 'type', None)
+
+                            # Handle reasoning items
+                            if item_type == 'reasoning_item':
+                                reasoning_summary = []
+                                raw_item = getattr(item, 'raw_item', None)
+                                if raw_item is not None:
+                                    summary = getattr(raw_item, 'summary', None)
+                                    if summary:
+                                        for summary_part in summary:
+                                            text = getattr(summary_part, 'text', None)
+                                            if text:
+                                                reasoning_summary.append({
+                                                    "text": text,
+                                                    "type": "summary_text"
+                                                })
+
+                                    new_items.append({
+                                        "id": getattr(raw_item, 'id', None),
+                                        "type": "reasoning",
+                                        "status": getattr(raw_item, 'status', None),
+                                        "content": None,
+                                        "summary": reasoning_summary if reasoning_summary else None,
+                                    })
+
+                            # Handle tool call items
+                            elif item_type == 'tool_call_item':
+                                raw_item = getattr(item, 'raw_item', None)
+                                if raw_item is not None:
+                                    call_id, tool_name, tool_arguments = _extract_tool_call_info(raw_item)
+                                    tool_call_map[call_id] = tool_name
+
+                                    new_items.append({
+                                        "id": getattr(raw_item, 'id', None),
+                                        "name": tool_name,
+                                        "type": "function_call",
+                                        "status": getattr(raw_item, 'status', 'completed'),
+                                        "call_id": call_id,
+                                        "arguments": str(tool_arguments) if isinstance(tool_arguments, dict) else tool_arguments,
+                                    })
+
+                            # Handle tool output items
+                            elif item_type == 'tool_call_output_item':
+                                raw_item = getattr(item, 'raw_item', None)
+                                if raw_item is not None:
+                                    call_id, tool_name, content = _extract_tool_response_info(tool_call_map, raw_item)
+
+                                    new_items.append({
+                                        "type": "function_call_output",
+                                        "output": content,
+                                        "call_id": call_id,
+                                    })
+
+                    # Accumulate text deltas to build final response
+                    # Note: OpenAI Agents SDK can emit events in different formats
+                    if hasattr(event, 'type') and event.type == 'response.output_text.delta':
+                        # Direct event type from OpenAI Agents SDK (observed in practice)
+                        if hasattr(event, 'delta'):
+                            final_response_text += event.delta
+
+                    # Handle raw_response_event wrapper (alternative event format, kept for compatibility)
+                    elif hasattr(event, 'type') and event.type == 'raw_response_event':
+                        if hasattr(event, 'data'):
+                            raw_event = event.data
+
+                            # Track when output items are added
+                            if isinstance(raw_event, ResponseOutputItemAddedEvent):
+                                if hasattr(raw_event, 'item') and raw_event.item.type == 'message':
+                                    current_text_item = {
+                                        "id": getattr(raw_event.item, 'id', None),
+                                        "role": getattr(raw_event.item, 'role', 'assistant'),
+                                        "type": "message",
+                                        "status": "in_progress",
+                                        "content": []
+                                    }
+
+                            # Check if this is a text delta event
+                            elif isinstance(raw_event, ResponseTextDeltaEvent):
+                                if hasattr(raw_event, 'delta') and raw_event.delta:
+                                    final_response_text += raw_event.delta
+
+                            # Track when output items are done
+                            elif isinstance(raw_event, ResponseOutputItemDoneEvent):
+                                if current_text_item and final_response_text:
+                                    current_text_item["status"] = "completed"
+                                    current_text_item["content"] = [{
+                                        "text": final_response_text,
+                                        "type": "output_text",
+                                    }]
+                                    new_items.append(current_text_item)
+                                    current_text_item = None
+
                     yield event
 
-                # Set span output
-                if span:
-                    span.output = {
-                        "event_count": event_count,
-                        "final_output": str(final_output) if final_output else None,
-                    }
+                # Set span output with structured data including tool calls and final response
+                span.output = {
+                    "new_items": new_items,
+                    "final_output": final_response_text if final_response_text else None,
+                }
+            finally:
+                # End the span after all events have been yielded
+                await trace.end_span(span)
         else:
             # No tracing, just stream normally
             # Get the stream from the original model