AgentOps-AI · dot-agi · Mar 24, 2025 · Mar 14, 2025 · Mar 14, 2025 · Mar 15, 2025
diff --git a/agentops/helpers/serialization.py b/agentops/helpers/serialization.py
@@ -72,8 +72,64 @@
     return str(obj)
 
 
+def model_to_dict(obj: Any) -> dict:
+    """Convert a model object to a dictionary safely.
+
+    Handles various model types including:
+    - Pydantic models (model_dump/dict methods)
+    - dict instances (returned as-is, not copied)
+    - API response objects with parse method (currently disabled, see TODO in the body)
+    - Objects with __dict__ attribute (fallback; the live __dict__ is returned)
+
+    Args:
+        obj: The model object to convert to dictionary
+
+    Returns:
+        Dictionary representation of the object, or an empty dict if obj is None or obj.__dict__ cannot be read
+    """
+    if obj is None:
+        return {}
+    if isinstance(obj, dict):
+        return obj
+    if hasattr(obj, "model_dump"):  # Pydantic v2
+        return obj.model_dump()
+    elif hasattr(obj, "dict"):  # Pydantic v1
+        return obj.dict()
+    # TODO: this causes recursion on nested objects, so the parse() branch stays disabled.
+    # elif hasattr(obj, "parse"):  # Raw API response
+    #     return model_to_dict(obj.parse())
+    else:
+        # Fall back to the instance __dict__ (returned directly, not copied)
+        try:
+            return obj.__dict__
+        except:  # NOTE(review): bare except; consider narrowing to Exception
+            return {}
+
+
 def safe_serialize(obj: Any) -> Any:
-    """Safely serialize an object to JSON-compatible format"""
+    """Safely serialize an object to JSON-compatible format
+
+    This function handles complex objects by:
+    1. Returning strings untouched (even if they contain JSON)
+    2. Converting models to dictionaries
+    3. Using custom JSON encoder to handle special types
+    4. Falling back to string representation only when necessary
+
+    Args:
+        obj: The object to serialize
+
+    Returns:
+        If obj is a string, returns the original string untouched.
+        Otherwise, returns a JSON string representation of the object.
+    """
+    # Return strings untouched
+    if isinstance(obj, str):
+        return obj
+
+    # Convert any model objects to dictionaries
+    if hasattr(obj, "model_dump") or hasattr(obj, "dict") or hasattr(obj, "parse"):
+        obj = model_to_dict(obj)
+
     try:
         return json.dumps(obj, cls=AgentOpsJSONEncoder)
     except (TypeError, ValueError) as e:

diff --git a/agentops/instrumentation/OpenTelemetry.md b/agentops/instrumentation/OpenTelemetry.md
@@ -0,0 +1,133 @@
+# OpenTelemetry Implementation Notes
+
+This document outlines best practices and implementation details for OpenTelemetry in AgentOps instrumentations.
+
+## Key Concepts
+
+### Context Propagation
+
+OpenTelemetry relies on proper context propagation to maintain parent-child relationships between spans. This is essential for:
+
+- Creating accurate trace waterfalls in visualizations
+- Ensuring all spans from the same logical operation share a trace ID
+- Allowing proper querying and filtering of related operations
+
+### Core Patterns
+
+When implementing instrumentations that need to maintain context across different execution contexts:
+
+1. **Store span contexts in dictionaries:**
+   ```python
+   # Use weakref dictionaries to avoid memory leaks
+   self._span_contexts = weakref.WeakKeyDictionary()
+   self._trace_root_contexts = weakref.WeakKeyDictionary()
+   ```
+
+2. **Create spans with explicit parent contexts:**
+   ```python
+   parent_context = self._get_parent_context(trace_obj)
+   with tracer.start_as_current_span(
+       name=span_name,
+       context=parent_context,
+       kind=trace.SpanKind.CLIENT,
+       attributes=attributes,
+   ) as span:
+       # Span operations here
+       # Store the span's context for future reference
+       context = trace.set_span_in_context(span)
+       self._span_contexts[span_obj] = context
+   ```
+
+3. **Implement helper methods to retrieve appropriate parent contexts:**
+   ```python
+   def _get_parent_context(self, trace_obj):
+       # Try to get the trace's root context if it exists
+       if trace_obj in self._trace_root_contexts:
+           return self._trace_root_contexts[trace_obj]
+
+       # Otherwise, use the current context
+       return context_api.get_current()
+   ```
+
+4. **Debug trace continuity:**
+   ```python
+   current_span = trace.get_current_span()
+   span_context = current_span.get_span_context()
+   trace_id = format_trace_id(span_context.trace_id)
+   logging.debug(f"Current span trace ID: {trace_id}")
+   ```
+
+## Common Pitfalls
+
+1. **Naming conflicts:** Avoid using `trace` as a parameter name when you're also importing the OpenTelemetry `trace` module
+   ```python
+   # Bad
+   def on_trace_start(self, trace):
+       # This will cause conflicts with the imported trace module
+
+   # Good
+   def on_trace_start(self, trace_obj):
+       # No conflicts with OpenTelemetry's trace module
+   ```
+
+2. **Missing parent contexts:** Always explicitly provide parent contexts when available; don't rely on the current context alone
+
+3. **Memory leaks:** Use `weakref.WeakKeyDictionary()` for storing spans to allow garbage collection
+
+4. **Lost context:** When calling async or callback functions, be sure to preserve and pass the context
+
+## Testing Context Propagation
+
+To verify proper context propagation:
+
+1. Enable debug logging for trace IDs
+2. Run a simple end-to-end test that generates multiple spans
+3. Verify all spans share the same trace ID
+4. Check that parent-child relationships are correctly established
+
+```python
+# Example debug logging
+logging.debug(f"Span {span.name} has trace ID: {format_trace_id(span.get_span_context().trace_id)}")
+```
+
+## Timestamp Handling in OpenTelemetry
+
+When working with OpenTelemetry spans and timestamps:
+
+1. **Automatic Timestamp Tracking:** OpenTelemetry automatically tracks timestamps for spans. When a span is created with `tracer.start_span()` or `tracer.start_as_current_span()`, the start time is captured automatically. When `span.end()` is called, the end time is recorded.
+
+2. **No Manual Timestamp Setting Required:** The standard instrumentation pattern does not require manually setting timestamp attributes on spans. Instead, OpenTelemetry handles this internally through the SpanProcessor and Exporter classes.
+
+3. **Timestamp Representation:** In the OpenTelemetry data model, timestamps are stored as nanoseconds since the Unix epoch (January 1, 1970).
+
+4. **Serialization Responsibility:** The serialization of timestamps from OTel spans to output formats like JSON is handled by the Exporter components. If timestamps aren't appearing correctly in output APIs, the issue is likely in the API exporter, not in the span creation code.
+
+5. **Debugging Timestamps:** To debug timestamp issues, verify that spans are properly starting and ending, rather than manually setting timestamp attributes:
+
+```python
+# Good pattern - timestamps handled by OpenTelemetry automatically
+with tracer.start_as_current_span("my_operation") as span:
+    # Do work
+    pass  # span.end() is called automatically
+```
+
+Note: If timestamps are missing in API output (e.g., empty "start_time" fields), fix the exporter and serialization layer rather than manually tracking timestamps in instrumentation code.
+
+## Attributes in OpenTelemetry
+
+When working with span attributes in OpenTelemetry:
+
+1. **Root Attributes Node:** The root `attributes` object in the API output JSON should always be empty. This is by design. All attribute data should be stored in the `span_attributes` object.
+
+2. **Span Attributes:** The `span_attributes` object is where all user-defined and semantic attribute data should be stored. This allows for a structured, hierarchical representation of attributes.
+
+3. **Structure Difference:** While the root `attributes` appears as an empty object in the API output, this is normal and expected. Do not attempt to populate this object directly or duplicate data from `span_attributes` into it.
+
+4. **Setting Attributes:** Always set span attributes using the semantic conventions defined in the `agentops/semconv` module:
+
+```python
+from agentops.semconv import agent
+
+# Good pattern - using semantic conventions
+span.set_attribute(agent.AGENT_NAME, "My Agent")
+```
diff --git a/agentops/instrumentation/__init__.py b/agentops/instrumentation/__init__.py
@@ -68,8 +68,8 @@ def get_instance(self) -> BaseInstrumentor:
         provider_import_name="crewai",
     ),
     InstrumentorLoader(
-        module_name="opentelemetry.instrumentation.agents",
-        class_name="AgentsInstrumentor",
+        module_name="agentops.instrumentation.openai_agents",
+        class_name="OpenAIAgentsInstrumentor",
         provider_import_name="agents",
     ),
 ]

diff --git a/agentops/instrumentation/openai_agents/README.md b/agentops/instrumentation/openai_agents/README.md
@@ -0,0 +1,156 @@
+# OpenAI Agents SDK Instrumentation
+
+This module provides automatic instrumentation for the OpenAI Agents SDK, adding telemetry that follows OpenTelemetry semantic conventions for Generative AI systems.
+
+## Architecture Overview
+
+The OpenAI Agents SDK instrumentor works by:
+
+1. Intercepting the Agents SDK's trace processor interface to capture Agent, Function, Generation, and other span types
+2. Monkey-patching the Agents SDK `Runner` class to capture the full execution lifecycle, including streaming operations
+3. Converting all captured data to OpenTelemetry spans and metrics following semantic conventions
+
+The instrumentation is organized into several key components:
+
+1. **Instrumentor (`instrumentor.py`)**: The entry point that patches the Agents SDK and configures trace capture
+2. **Processor (`processor.py`)**: Receives events from the SDK and prepares them for export
+3. **Exporter (`exporter.py`)**: Converts SDK spans to OpenTelemetry spans and exports them
+4. **Attributes Module (`attributes/`)**: Specialized modules for extracting and formatting span attributes
+
+## Attribute Processing Modules
+
+The attribute modules extract and format OpenTelemetry-compatible attributes from span data:
+
+- **Common (`attributes/common.py`)**: Core attribute extraction functions for all span types and utility functions
+- **Completion (`attributes/completion.py`)**: Handles different completion content formats (Chat Completions API, Response API, Agents SDK) 
+- **Model (`attributes/model.py`)**: Extracts model information and parameters
+- **Tokens (`attributes/tokens.py`)**: Processes token usage data and metrics
+- **Response (`attributes/response.py`)**: Handles interpretation of Response API objects
+
+Each getter function in these modules is focused on a single responsibility and does not modify global state. Functions are designed to be composable, allowing different attribute types to be combined as needed in the exporter.
+
+## Span Types
+
+The instrumentor captures the following span types:
+
+- **Trace**: The root span representing an entire agent workflow execution
+  - Created using `get_base_trace_attributes()` to initialize with standard fields
+  - Captures workflow name, trace ID, and workflow-level metadata
+
+- **Agent**: Represents an agent's execution lifecycle
+  - Processed using `get_agent_span_attributes()` with `AGENT_SPAN_ATTRIBUTES` mapping
+  - Uses `SpanKind.CONSUMER` to indicate an agent receiving a request
+  - Captures agent name, input, output, tools, and other metadata
+
+- **Function**: Represents a tool/function call
+  - Processed using `get_function_span_attributes()` with `FUNCTION_SPAN_ATTRIBUTES` mapping
+  - Uses `SpanKind.CLIENT` to indicate an outbound call to a function
+  - Captures function name, input arguments, output results, and from_agent information
+
+- **Generation**: Captures details of model generation
+  - Processed using `get_generation_span_attributes()` with `GENERATION_SPAN_ATTRIBUTES` mapping
+  - Uses `SpanKind.CLIENT` to indicate an outbound call to an LLM
+  - Captures model name, configuration, usage statistics, and response content
+
+- **Response**: Lightweight span for tracking model response data
+  - Processed using `get_response_span_attributes()` with `RESPONSE_SPAN_ATTRIBUTES` mapping
+  - Extracts response content and metadata from different API formats
+
+- **Handoff**: Represents control transfer between agents
+  - Processed using `get_handoff_span_attributes()` with `HANDOFF_SPAN_ATTRIBUTES` mapping
+  - Tracks from_agent and to_agent information
+
+## Span Lifecycle Management
+
+The exporter (`exporter.py`) handles the full span lifecycle:
+
+1. **Start Events**:
+   - Create spans but DO NOT END them
+   - Store span references in tracking dictionaries
+   - Use OpenTelemetry's start_span to control when spans end
+   - Leave status as UNSET to indicate in-progress
+
+2. **End Events**:
+   - Look up existing span by ID in tracking dictionaries
+   - If found and not ended:
+     - Update span with all final attributes
+     - Set status to OK or ERROR based on task outcome
+     - End the span manually
+   - If not found or already ended:
+     - Create a new complete span with all data
+     - End it immediately
+
+3. **Error Handling**:
+   - Check if spans are already ended before attempting updates
+   - Provide informative log messages about span lifecycle
+   - Properly clean up tracking resources
+
+This approach is essential because:
+- Agents SDK sends separate start and end events for each task
+- We need to maintain a single span for the entire task lifecycle to get accurate timing
+- Final data (outputs, token usage, etc.) is only available at the end event
+- We want to avoid creating duplicate spans for the same task
+- Spans must be properly created and ended to avoid leaks
+
+The span lifecycle management ensures spans have:
+- Accurate start and end times (preserving the actual task duration)
+- Complete attribute data from both start and end events
+- Proper status reflecting task completion
+- All final outputs, errors, and metrics
+- Clean resource management with no memory leaks
+
+## Key Design Patterns
+
+### Semantic Conventions
+
+All attribute names follow the OpenTelemetry semantic conventions defined in `agentops.semconv`:
+
+```python
+# Using constants from semconv module
+attributes[CoreAttributes.TRACE_ID] = trace_id
+attributes[WorkflowAttributes.WORKFLOW_NAME] = trace.name
+attributes[SpanAttributes.LLM_SYSTEM] = "openai"
+attributes[MessageAttributes.COMPLETION_CONTENT.format(i=0)] = content
+```
+
+### Target → Source Attribute Mapping
+
+We use a consistent pattern for attribute extraction with typed mapping dictionaries:
+
+```python
+# Attribute mapping example
+AGENT_SPAN_ATTRIBUTES: AttributeMap = {
+    # target_attribute: source_attribute
+    AgentAttributes.AGENT_NAME: "name",
+    WorkflowAttributes.WORKFLOW_INPUT: "input",
+    WorkflowAttributes.FINAL_OUTPUT: "output",
+    # ...
+}
+```
+
+### Structured Attribute Handling
+
+- Always use `MessageAttributes` semantic conventions for content and tool calls
+- For chat completions, use `MessageAttributes.COMPLETION_CONTENT.format(i=0)`
+- For tool calls, use `MessageAttributes.TOOL_CALL_NAME.format(i=0, j=0)`, etc.
+- Never try to combine or aggregate contents into a single attribute
+- Each message component should have its own properly formatted attribute
+- This ensures proper display in OpenTelemetry backends and dashboards
+
+### Serialization Rules
+
+1. We do not serialize data structures arbitrarily; everything has a semantic convention
+2. Span attributes should use semantic conventions and avoid complex serialized structures
+3. Keep all string data in its original form - do not parse JSON within strings
+4. If a function has JSON attributes for its arguments, do not parse that JSON - keep as string
+5. If a completion or response body text/content contains JSON, keep it as a string
+6. Function arguments and tool call arguments should remain in their raw string form
+
+### Critical Notes for Attribute Handling
+
+- NEVER manually set the root completion attributes (`SpanAttributes.LLM_COMPLETIONS` or `"gen_ai.completion"`)
+- Let the OpenTelemetry backend derive these values from the detailed attributes
+- Setting root completion attributes creates duplication and inconsistency
+- Tests should verify attribute existence using MessageAttributes constants
+- Do not check for the presence of SpanAttributes.LLM_COMPLETIONS
+- Verify individual content/tool attributes instead of root attributes