feat: Add unit tests for aegis_workflow container orchestration behavior

Theaxiom · Theaxiom · commit 645fab2219f1 · 2026-03-05T22:32:04.000-08:00
diff --git a/src/activities/index.test.ts b/src/activities/index.test.ts
@@ -0,0 +1,123 @@
+import { beforeEach, describe, expect, it, vi } from 'vitest';
+import type { ExecuteContainerRunResponse } from '../types.js';
+
+// Spy standing in for aegisRuntimeClient.executeContainerRun. It is created via
+// vi.hoisted because Vitest lifts vi.mock() calls (and the static imports that
+// trigger their factories) above ordinary top-level declarations; a plain
+// `const` would still be uninitialized when the factory below first runs.
+const executeContainerRunMock = vi.hoisted(() => vi.fn());
+
+// Replace the gRPC client module: executeContainerRun is driven per test through
+// the spy above, the remaining client methods are bare stubs.
+vi.mock('../grpc/client.js', () => ({
+  aegisRuntimeClient: {
+    executeContainerRun: executeContainerRunMock,
+    executeAgent: vi.fn(),
+    executeSystemCommand: vi.fn(),
+    validateWithJudges: vi.fn(),
+    storeTrajectoryPattern: vi.fn(),
+  },
+}));
+
+// Swap the logger module for one whose four log-level methods are bare spies.
+vi.mock('../logger.js', () => {
+  const logger = {
+    info: vi.fn(),
+    error: vi.fn(),
+    warn: vi.fn(),
+    debug: vi.fn(),
+  };
+  return { logger };
+});
+
+import { executeParallelContainerRunActivity } from './index.js';
+
+/**
+ * Builds a canned container-run response for the mocked runtime client.
+ *
+ * Despite the name, any exit code may be passed, including non-zero ones.
+ *
+ * @param exit_code - Exit code to report in the response.
+ * @param name - Label used only to derive the `stdout`/`stderr` text; it is
+ *   not copied onto the returned object.
+ * @returns A response with fixed `duration_ms` of 10 and `attempts` of 1.
+ */
+function ok(exit_code: number, name = 'step'): ExecuteContainerRunResponse & { name?: string } {
+  const stdout = `${name}-stdout`;
+  const stderr = `${name}-stderr`;
+  return { exit_code, stdout, stderr, duration_ms: 10, attempts: 1 };
+}
+
+// Exercises executeParallelContainerRunActivity against the mocked
+// aegisRuntimeClient.executeContainerRun, covering the all_succeed, any_succeed
+// and best_effort completion values plus a rejected client call.
+describe('executeParallelContainerRunActivity', () => {
+  // Drop queued return values and call history so each case starts clean.
+  beforeEach(() => {
+    executeContainerRunMock.mockReset();
+  });
+
+  it('returns failure result (no throw) for all_succeed when any step fails', async () => {
+    // Queued in call order: the first client call exits 0, the second exits 2.
+    executeContainerRunMock
+      .mockResolvedValueOnce(ok(0, 'unit'))
+      .mockResolvedValueOnce(ok(2, 'lint'));
+
+    const result = await executeParallelContainerRunActivity({
+      execution_id: 'exec-1',
+      state_name: 'TEST',
+      completion: 'all_succeed',
+      steps: [
+        { name: 'unit', image: 'alpine', command: ['true'] },
+        { name: 'lint', image: 'alpine', command: ['false'] },
+      ],
+    });
+
+    // The awaited call resolving (rather than rejecting) is the "no throw" part.
+    expect(result.overall_success).toBe(false);
+    expect(result.completion).toBe('all_succeed');
+    expect(result.succeeded).toBe(1);
+    expect(result.failed).toBe(1);
+    expect(result.results).toHaveLength(2);
+  });
+
+  it('returns failure result (no throw) for any_succeed when all steps fail', async () => {
+    // Every client call resolves with exit code 3.
+    executeContainerRunMock.mockResolvedValue(ok(3));
+
+    const result = await executeParallelContainerRunActivity({
+      execution_id: 'exec-2',
+      state_name: 'TEST',
+      completion: 'any_succeed',
+      steps: [
+        { name: 'unit', image: 'alpine', command: ['false'] },
+        { name: 'lint', image: 'alpine', command: ['false'] },
+      ],
+    });
+
+    expect(result.overall_success).toBe(false);
+    expect(result.completion).toBe('any_succeed');
+    expect(result.succeeded).toBe(0);
+    expect(result.failed).toBe(2);
+  });
+
+  it('returns success for best_effort even when all steps fail', async () => {
+    // Every client call resolves with exit code 1.
+    executeContainerRunMock.mockResolvedValue(ok(1));
+
+    const result = await executeParallelContainerRunActivity({
+      execution_id: 'exec-3',
+      state_name: 'TEST',
+      completion: 'best_effort',
+      steps: [
+        { name: 'unit', image: 'alpine', command: ['false'] },
+        { name: 'lint', image: 'alpine', command: ['false'] },
+      ],
+    });
+
+    // Overall success is expected even though both steps are counted as failed.
+    expect(result.overall_success).toBe(true);
+    expect(result.succeeded).toBe(0);
+    expect(result.failed).toBe(2);
+  });
+
+  it('converts rejected step call into non-zero step result and preserves aggregation', async () => {
+    // Queued in call order: the first client call exits 0, the second rejects.
+    executeContainerRunMock
+      .mockResolvedValueOnce(ok(0, 'unit'))
+      .mockRejectedValueOnce(new Error('grpc unavailable'));
+
+    const result = await executeParallelContainerRunActivity({
+      execution_id: 'exec-4',
+      state_name: 'TEST',
+      completion: 'all_succeed',
+      steps: [
+        { name: 'unit', image: 'alpine', command: ['true'] },
+        { name: 'lint', image: 'alpine', command: ['false'] },
+      ],
+    });
+
+    // The rejection is expected to surface as a per-step result (exit code 1,
+    // error message in stderr) instead of rejecting the whole activity.
+    expect(result.overall_success).toBe(false);
+    const lint = result.results.find((r) => r.name === 'lint');
+    expect(lint).toBeDefined();
+    expect(lint?.exit_code).toBe(1);
+    expect(lint?.stderr).toContain('grpc unavailable');
+  });
+});
+
diff --git a/src/workflows/aegis-workflow.test.ts b/src/workflows/aegis-workflow.test.ts
@@ -0,0 +1,253 @@
+import { beforeEach, describe, expect, it, vi } from 'vitest';
+import type { TemporalWorkflowDefinition } from '../types.js';
+
+// Shared activity spies, one per activity name used by the workflow tests. They
+// are built inside vi.hoisted because Vitest lifts the vi.mock() calls below
+// (and the static import of the workflow module that triggers their factories)
+// above ordinary top-level declarations; a plain `const` would still be
+// uninitialized if a factory or proxyActivities runs during that import.
+const activityMocks = vi.hoisted(() => ({
+  executeAgentActivity: vi.fn(),
+  executeSystemCommandActivity: vi.fn(),
+  validateOutputActivity: vi.fn(),
+  executeParallelAgentsActivity: vi.fn(),
+  storeTrajectoryPatternActivity: vi.fn(),
+  fetchWorkflowDefinition: vi.fn(),
+  publishEventActivity: vi.fn(),
+  executeContainerRunActivity: vi.fn(),
+  executeParallelContainerRunActivity: vi.fn(),
+}));
+
+// Direct imports of the activities module resolve to the same spies.
+vi.mock('../activities/index.js', () => activityMocks);
+
+// Minimal stand-in for the Temporal workflow module.
+vi.mock('@temporalio/workflow', () => ({
+  // Ignores its arguments and always hands back the shared spies.
+  proxyActivities: () => activityMocks,
+  setHandler: vi.fn(),
+  defineSignal: vi.fn(() => Symbol('humanInput')),
+  // Evaluates the predicate once and resolves with its result immediately.
+  condition: vi.fn(async (predicate: () => boolean) => predicate()),
+  workflowInfo: vi.fn(() => ({ workflowId: 'exec-123' })),
+}));
+
+import { aegis_workflow } from './aegis-workflow.js';
+
+/**
+ * Wraps a set of states in a workflow definition with fixed identity fields.
+ *
+ * @param states - State map placed on the definition as-is.
+ * @param initial - Name used for `initial_state`; defaults to `'BUILD'`.
+ * @returns A definition with id `wf-1`, name `ci-workflow`, version `1.0.0`
+ *   and an empty `context`.
+ */
+function baseDefinition(states: TemporalWorkflowDefinition['states'], initial = 'BUILD'): TemporalWorkflowDefinition {
+  const definition: TemporalWorkflowDefinition = {
+    workflow_id: 'wf-1',
+    name: 'ci-workflow',
+    version: '1.0.0',
+    initial_state: initial,
+    context: {},
+    states,
+  };
+  return definition;
+}
+
+// Runs aegis_workflow with every activity replaced by a spy and checks how
+// ContainerRun / ParallelContainerRun results are written to the blackboard and
+// which transition target the workflow ends on.
+describe('aegis_workflow container orchestration behavior', () => {
+  beforeEach(() => {
+    // Reset every activity spy, then restore the two defaults each case relies on.
+    for (const fn of Object.values(activityMocks)) {
+      fn.mockReset();
+    }
+    activityMocks.publishEventActivity.mockResolvedValue(undefined);
+    // Default result for the System states (PASS / FAIL) used as transition targets.
+    activityMocks.executeSystemCommandActivity.mockResolvedValue({
+      status: 'success',
+      exit_code: 0,
+      stdout: 'ok',
+      stderr: '',
+    });
+  });
+
+  it('stores ContainerRun output shape with nested output object for blackboard templates', async () => {
+    // Single ContainerRun state with no transitions.
+    activityMocks.fetchWorkflowDefinition.mockResolvedValue(
+      baseDefinition({
+        BUILD: {
+          kind: 'ContainerRun',
+          container_run_name: 'build',
+          container_run_image: 'rust:1.75',
+          container_run_command: ['cargo', 'build'],
+          transitions: [],
+        },
+      })
+    );
+    activityMocks.executeContainerRunActivity.mockResolvedValue({
+      exit_code: 0,
+      stdout: 'build-ok',
+      stderr: '',
+      duration_ms: 120,
+      attempts: 1,
+    });
+
+    const result = await aegis_workflow({ workflow_name: 'ci-workflow', input: {} });
+    const build = result.blackboard?.BUILD;
+
+    // exit_code is expected both nested under `output` and at the top level of
+    // the blackboard entry.
+    expect(result.status).toBe('completed');
+    expect(build?.status).toBe('success');
+    expect(build?.output?.exit_code).toBe(0);
+    expect(build?.output?.stdout).toBe('build-ok');
+    expect(build?.exit_code).toBe(0);
+  });
+
+  it('routes on_success using container exit code 0', async () => {
+    // BUILD can go to PASS (on_success) or FAIL (on_failure).
+    activityMocks.fetchWorkflowDefinition.mockResolvedValue(
+      baseDefinition(
+        {
+          BUILD: {
+            kind: 'ContainerRun',
+            container_run_name: 'build',
+            container_run_image: 'rust:1.75',
+            container_run_command: ['cargo', 'build'],
+            transitions: [
+              { condition: 'on_success', target: 'PASS' },
+              { condition: 'on_failure', target: 'FAIL' },
+            ],
+          },
+          PASS: { kind: 'System', command: 'echo pass', transitions: [] },
+          FAIL: { kind: 'System', command: 'echo fail', transitions: [] },
+        },
+        'BUILD'
+      )
+    );
+    activityMocks.executeContainerRunActivity.mockResolvedValue({
+      exit_code: 0,
+      stdout: 'ok',
+      stderr: '',
+      duration_ms: 10,
+      attempts: 1,
+    });
+
+    const result = await aegis_workflow({ workflow_name: 'ci-workflow', input: {} });
+    expect(result.final_state).toBe('PASS');
+  });
+
+  it('routes on_failure using non-zero container exit code', async () => {
+    // Same definition as the on_success case; only the container result differs.
+    activityMocks.fetchWorkflowDefinition.mockResolvedValue(
+      baseDefinition(
+        {
+          BUILD: {
+            kind: 'ContainerRun',
+            container_run_name: 'build',
+            container_run_image: 'rust:1.75',
+            container_run_command: ['cargo', 'build'],
+            transitions: [
+              { condition: 'on_success', target: 'PASS' },
+              { condition: 'on_failure', target: 'FAIL' },
+            ],
+          },
+          PASS: { kind: 'System', command: 'echo pass', transitions: [] },
+          FAIL: { kind: 'System', command: 'echo fail', transitions: [] },
+        },
+        'BUILD'
+      )
+    );
+    activityMocks.executeContainerRunActivity.mockResolvedValue({
+      exit_code: 2,
+      stdout: '',
+      stderr: 'compile failed',
+      duration_ms: 10,
+      attempts: 1,
+    });
+
+    const result = await aegis_workflow({ workflow_name: 'ci-workflow', input: {} });
+    expect(result.final_state).toBe('FAIL');
+  });
+
+  it('supports exit_code_non_zero transition for ContainerRun outputs', async () => {
+    // exit_code_non_zero is listed before the `always` fallback.
+    activityMocks.fetchWorkflowDefinition.mockResolvedValue(
+      baseDefinition(
+        {
+          BUILD: {
+            kind: 'ContainerRun',
+            container_run_name: 'build',
+            container_run_image: 'rust:1.75',
+            container_run_command: ['cargo', 'build'],
+            transitions: [
+              { condition: 'exit_code_non_zero', target: 'FAIL' },
+              { condition: 'always', target: 'PASS' },
+            ],
+          },
+          PASS: { kind: 'System', command: 'echo pass', transitions: [] },
+          FAIL: { kind: 'System', command: 'echo fail', transitions: [] },
+        },
+        'BUILD'
+      )
+    );
+    activityMocks.executeContainerRunActivity.mockResolvedValue({
+      exit_code: 9,
+      stdout: '',
+      stderr: 'failed',
+      duration_ms: 10,
+      attempts: 1,
+    });
+
+    const result = await aegis_workflow({ workflow_name: 'ci-workflow', input: {} });
+    expect(result.final_state).toBe('FAIL');
+  });
+
+  it('returns ParallelContainerRun blackboard output keyed by step name', async () => {
+    // Single ParallelContainerRun state with two steps and no transitions.
+    activityMocks.fetchWorkflowDefinition.mockResolvedValue(
+      baseDefinition(
+        {
+          TEST: {
+            kind: 'ParallelContainerRun',
+            parallel_container_steps: [
+              { name: 'unit-tests', image: 'rust:1.75', command: ['cargo', 'test'] },
+              { name: 'lint', image: 'rust:1.75', command: ['cargo', 'clippy'] },
+            ],
+            parallel_container_completion: 'all_succeed',
+            transitions: [],
+          },
+        },
+        'TEST'
+      )
+    );
+    activityMocks.executeParallelContainerRunActivity.mockResolvedValue({
+      overall_success: true,
+      completion: 'all_succeed',
+      succeeded: 2,
+      failed: 0,
+      results: [
+        { name: 'unit-tests', exit_code: 0, stdout: 'ok', stderr: '', duration_ms: 12 },
+        { name: 'lint', exit_code: 0, stdout: 'ok', stderr: '', duration_ms: 8 },
+      ],
+    });
+
+    const result = await aegis_workflow({ workflow_name: 'ci-workflow', input: {} });
+    const testOutput = result.blackboard?.TEST?.output;
+
+    // Each step's result is expected under its own name inside `output`.
+    expect(result.status).toBe('completed');
+    expect(testOutput?.['unit-tests']?.stdout).toBe('ok');
+    expect(testOutput?.['lint']?.exit_code).toBe(0);
+  });
+
+  it('routes on_failure for ParallelContainerRun when aggregation fails', async () => {
+    // TEST can go to PASS (on_success) or FAIL (on_failure).
+    activityMocks.fetchWorkflowDefinition.mockResolvedValue(
+      baseDefinition(
+        {
+          TEST: {
+            kind: 'ParallelContainerRun',
+            parallel_container_steps: [
+              { name: 'unit', image: 'rust:1.75', command: ['cargo', 'test'] },
+              { name: 'lint', image: 'rust:1.75', command: ['cargo', 'clippy'] },
+            ],
+            parallel_container_completion: 'all_succeed',
+            transitions: [
+              { condition: 'on_success', target: 'PASS' },
+              { condition: 'on_failure', target: 'FAIL' },
+            ],
+          },
+          PASS: { kind: 'System', command: 'echo pass', transitions: [] },
+          FAIL: { kind: 'System', command: 'echo fail', transitions: [] },
+        },
+        'TEST'
+      )
+    );
+    // Aggregated result reports overall failure: one step passed, one exited 2.
+    activityMocks.executeParallelContainerRunActivity.mockResolvedValue({
+      overall_success: false,
+      completion: 'all_succeed',
+      succeeded: 1,
+      failed: 1,
+      results: [
+        { name: 'unit', exit_code: 0, stdout: 'ok', stderr: '', duration_ms: 12 },
+        { name: 'lint', exit_code: 2, stdout: '', stderr: 'lint fail', duration_ms: 8 },
+      ],
+    });
+
+    const result = await aegis_workflow({ workflow_name: 'ci-workflow', input: {} });
+    expect(result.final_state).toBe('FAIL');
+    expect(result.blackboard?.TEST?.status).toBe('failed');
+  });
+});
+