fix(agents): Added statusCode propagation for workflow spans.

Murike · Murike · commit e261754d41fa · 2026-03-05T17:55:27.000-03:00
diff --git a/src/handlers/openai-agents/index.ts b/src/handlers/openai-agents/index.ts
@@ -470,7 +470,8 @@ export class GalileoTracingProcessor implements TracingProcessor {
         durationNs,
         metadata,
         tags,
-        createdAt: startedAt
+        createdAt: startedAt,
+        statusCode
       });
     }
 
@@ -487,7 +488,7 @@ export class GalileoTracingProcessor implements TracingProcessor {
       !firstNode &&
       (node.nodeType === 'workflow' || node.nodeType === 'agent')
     ) {
-      this._galileoLogger.conclude({ output, durationNs });
+      this._galileoLogger.conclude({ output, durationNs, statusCode });
     }
   }
 
diff --git a/src/utils/galileo-logger.ts b/src/utils/galileo-logger.ts
@@ -1115,6 +1115,7 @@ class GalileoLogger implements IGalileoLogger {
    * @param options.createdAt - (Optional) The timestamp when the span was created.
    * @param options.metadata - (Optional) Additional metadata as key-value pairs.
    * @param options.tags - (Optional) Array of tags to categorize the span.
+   * @param options.statusCode - (Optional) HTTP status code or execution status (e.g., 200 for success, 500 for error).
    * @param options.stepNumber - (Optional) The step number in a multi-step process.
    * @returns The created workflow span.
    */
@@ -1128,6 +1129,7 @@ class GalileoLogger implements IGalileoLogger {
     createdAt?: Date;
     metadata?: Record<string, string>;
     tags?: string[];
+    statusCode?: number;
     stepNumber?: number;
   }): WorkflowSpan {
     const span = new WorkflowSpan({
@@ -1139,6 +1141,7 @@ class GalileoLogger implements IGalileoLogger {
       createdAt: options.createdAt || GalileoApiClient.getTimestampRecord(),
       metadata: options.metadata,
       tags: options.tags,
+      statusCode: options.statusCode,
       metrics: new Metrics({ durationNs: options.durationNs }),
       stepNumber: options.stepNumber
     });
diff --git a/tests/handlers/openai-agents/integration.test.ts b/tests/handlers/openai-agents/integration.test.ts
@@ -562,3 +562,148 @@ describe('Output tracking integration', () => {
     ).toBe(true);
   });
 });
+
+describe('Workflow span statusCode propagation', () => {
+  test('test workflow span statusCode passed to addWorkflowSpan', async () => {
+    const mockLogger = createMockLogger();
+    const processor = new GalileoTracingProcessor(mockLogger as never, false);
+    const trace = makeTrace();
+
+    await processor.onTraceStart(trace);
+
+    // Create a workflow span (handoff type maps to workflow nodeType)
+    const workflow = makeSpan({
+      spanId: 'workflow-001',
+      parentId: 'trace-001',
+      spanData: { type: 'handoff', from_agent: 'Agent1', to_agent: 'Agent2' }
+    });
+
+    // Create a successful child LLM span
+    const llm = makeSpan({
+      spanId: 'llm-001',
+      parentId: 'workflow-001',
+      spanData: {
+        type: 'generation',
+        model: 'gpt-4',
+        input: [],
+        output: 'successful response'
+      },
+      error: null
+    });
+
+    await processor.onSpanStart(workflow);
+    await processor.onSpanStart(llm);
+    await processor.onSpanEnd(llm);
+    await processor.onSpanEnd(workflow);
+    await processor.onTraceEnd(trace);
+
+    // Verify addWorkflowSpan was called exactly once
+    expect(mockLogger.addWorkflowSpan).toHaveBeenCalledTimes(1);
+    const workflowSpanCall = mockLogger.addWorkflowSpan.mock.calls[0][0];
+    // Verify statusCode parameter is being passed through (defaults to 200 for success)
+    expect(workflowSpanCall.statusCode).toBe(200);
+  });
+
+  test('test workflow span with direct error has statusCode 500', async () => {
+    const mockLogger = createMockLogger();
+    const processor = new GalileoTracingProcessor(mockLogger as never, false);
+    const trace = makeTrace();
+
+    await processor.onTraceStart(trace);
+
+    // Create a workflow span that itself has an error
+    const workflowWithError = makeSpan({
+      spanId: 'workflow-001',
+      parentId: 'trace-001',
+      spanData: { type: 'handoff', from_agent: 'Agent1', to_agent: 'Agent2' },
+      error: {
+        message: 'Workflow execution failed',
+        data: { reason: 'timeout' }
+      }
+    });
+
+    await processor.onSpanStart(workflowWithError);
+    await processor.onSpanEnd(workflowWithError);
+    await processor.onTraceEnd(trace);
+
+    // Verify addWorkflowSpan was called with statusCode 500
+    expect(mockLogger.addWorkflowSpan).toHaveBeenCalledTimes(1);
+    const workflowSpanCall = mockLogger.addWorkflowSpan.mock.calls[0][0];
+    expect(workflowSpanCall.statusCode).toBe(500);
+  });
+
+  test('test agent span statusCode passed to addAgentSpan', async () => {
+    const mockLogger = createMockLogger();
+    const processor = new GalileoTracingProcessor(mockLogger as never, false);
+    const trace = makeTrace();
+
+    await processor.onTraceStart(trace);
+
+    // Create an agent span
+    const agent = makeSpan({
+      spanId: 'agent-001',
+      parentId: 'trace-001',
+      spanData: { type: 'agent', name: 'TestAgent' }
+    });
+
+    // Create a child LLM span
+    const llm = makeSpan({
+      spanId: 'llm-001',
+      parentId: 'agent-001',
+      spanData: {
+        type: 'generation',
+        model: 'gpt-4',
+        input: [],
+        output: 'test output'
+      },
+      error: null
+    });
+
+    await processor.onSpanStart(agent);
+    await processor.onSpanStart(llm);
+    await processor.onSpanEnd(llm);
+    await processor.onSpanEnd(agent);
+    await processor.onTraceEnd(trace);
+
+    // Verify addAgentSpan was called once and received statusCode 200
+    expect(mockLogger.addAgentSpan).toHaveBeenCalledTimes(1);
+    const agentSpanCall = mockLogger.addAgentSpan.mock.calls[0][0];
+    expect(agentSpanCall.statusCode).toBe(200);
+  });
+
+  test('test conclude called with statusCode for workflow spans', async () => {
+    const mockLogger = createMockLogger();
+    const processor = new GalileoTracingProcessor(mockLogger as never, false);
+    const trace = makeTrace();
+
+    await processor.onTraceStart(trace);
+
+    // Create nested workflow spans to test conclude calls
+    const outerWorkflow = makeSpan({
+      spanId: 'workflow-001',
+      parentId: 'trace-001',
+      spanData: { type: 'handoff', from_agent: 'Agent1', to_agent: 'Agent2' }
+    });
+
+    const innerWorkflow = makeSpan({
+      spanId: 'workflow-002',
+      parentId: 'workflow-001',
+      spanData: { type: 'custom', name: 'InnerWorkflow' }
+    });
+
+    await processor.onSpanStart(outerWorkflow);
+    await processor.onSpanStart(innerWorkflow);
+    await processor.onSpanEnd(innerWorkflow);
+    await processor.onSpanEnd(outerWorkflow);
+    await processor.onTraceEnd(trace);
+
+    // Verify conclude was called for the workflow spans
+    expect(mockLogger.conclude).toHaveBeenCalled();
+    // Find calls that pass statusCode
+    const concludeCalls = mockLogger.conclude.mock.calls;
+    const callsWithStatusCode = concludeCalls.filter(
+      (call) => call[0]?.statusCode !== undefined
+    );
+    expect(callsWithStatusCode.length).toBeGreaterThan(0);
+  });
+});

Original file line number	Diff line number	Diff line change
`@@ -470,7 +470,8 @@ export class GalileoTracingProcessor implements TracingProcessor {`
`470`	`470`	`durationNs,`
`471`	`471`	`metadata,`
`472`	`472`	`tags,`
`473`		`- createdAt: startedAt`
	`473`	`+ createdAt: startedAt,`
	`474`	`+ statusCode`
`474`	`475`	`});`
`475`	`476`	`}`
`476`	`477`
`@@ -487,7 +488,7 @@ export class GalileoTracingProcessor implements TracingProcessor {`
`487`	`488`	`!firstNode &&`
`488`	`489`	`(node.nodeType === 'workflow' \|\| node.nodeType === 'agent')`
`489`	`490`	`) {`
`490`		`- this._galileoLogger.conclude({ output, durationNs });`
	`491`	`+ this._galileoLogger.conclude({ output, durationNs, statusCode });`
`491`	`492`	`}`
`492`	`493`	`}`
`493`	`494`