refactor: replace verbose flag with debug option

steviec · steviec · commit 964b4daefad2 · 2025-07-16T13:31:42.000-07:00
- Simplify CLI options by consolidating quiet/verbose into single debug flag
- Remove quiet mode functionality while preserving debug output capabilities
- Add conversation formatting for debug mode with message display
- Improve tool call validation error messages with context
diff --git a/src/cli.ts b/src/cli.ts
@@ -19,8 +19,7 @@ interface CliOptions {
   serverConfig: string;
   serverName?: string;
   timeout?: number;
-  quiet?: boolean;
-  verbose?: boolean;
+  debug?: boolean;
   junitXml?: string;
 }
 
@@ -113,8 +112,7 @@ Examples:
       'Specific server name to use from config (if multiple servers defined)'
     )
     .option('--timeout <ms>', 'Test timeout in milliseconds', '10000')
-    .option('--quiet', 'Suppress non-essential output')
-    .option('--verbose', 'Enable verbose output with additional details')
+    .option('--debug', 'Enable debug output with additional details')
     .option('--junit-xml [filename]', 'Generate JUnit XML output (default: junit.xml)')
     .action(async (testFile: string, options: CliOptions) => {
       await runTests(testFile, options);
diff --git a/src/testing/capabilities/runner.ts b/src/testing/capabilities/runner.ts
@@ -19,8 +19,7 @@ import type { DisplayManager } from '../display/DisplayManager.js';
 interface ServerOptions {
   serverConfig: ServerConfig;
   timeout?: number;
-  quiet?: boolean;
-  verbose?: boolean;
+  debug?: boolean;
 }
 
 export class CapabilitiesTestRunner {
diff --git a/src/testing/display/DisplayManager.ts b/src/testing/display/DisplayManager.ts
@@ -12,21 +12,14 @@ export class DisplayManager {
   constructor(options: DisplayOptions = {}) {
     this.formatters = [];
 
-    // Always include console formatter unless quiet mode
-    if (!options.quiet) {
-      this.formatters.push(new ConsoleFormatter(options));
-    }
+    // Always include console formatter
+    this.formatters.push(new ConsoleFormatter(options));
 
     // Add JUnit XML formatter if requested
     if (options.junitXml !== undefined) {
       const filename = options.junitXml || 'junit.xml';
       this.formatters.push(new JunitXmlFormatter(options, filename));
     }
-
-    // Ensure we have at least one formatter
-    if (this.formatters.length === 0) {
-      this.formatters.push(new ConsoleFormatter(options));
-    }
   }
 
   /**
@@ -69,11 +62,12 @@ export class DisplayManager {
     passed: boolean,
     errors: string[],
     model?: string,
-    prompt?: string
+    prompt?: string,
+    messages?: any[]
   ): void {
     this.emit({
       type: 'test_complete',
-      data: { name, model, passed, errors, prompt },
+      data: { name, model, passed, errors, prompt, messages },
     });
   }
 
diff --git a/src/testing/display/formatters/ConsoleFormatter.ts b/src/testing/display/formatters/ConsoleFormatter.ts
@@ -15,6 +15,7 @@ import type {
   TestCompleteEvent,
   SuiteCompleteEvent,
 } from '../types.js';
+import { formatConversation } from '../utils/conversationFormatter.js';
 
 export class ConsoleFormatter implements TestFormatter {
   private options: DisplayOptions;
@@ -26,10 +27,6 @@ export class ConsoleFormatter implements TestFormatter {
   }
 
   onEvent(event: TestEvent): void {
-    if (this.options.quiet) {
-      return;
-    }
-
     switch (event.type) {
       case 'suite_start':
         this.handleSuiteStart(event.data as SuiteStartEvent['data']);
@@ -88,21 +85,21 @@ export class ConsoleFormatter implements TestFormatter {
     if (data.model && data.model !== this.currentModel) {
       this.currentModel = data.model;
       // Model changes are now handled by section headers
-    } else if (data.message && !this.options.quiet) {
-      // Only show progress messages in verbose mode or if explicitly needed
-      if (this.options.verbose) {
+    } else if (data.message) {
+      // Only show progress messages in debug mode
+      if (this.options.debug) {
         console.log(data.message);
       }
     }
   }
 
   private handleTestStart(_data: TestStartEvent['data']): void {
     // For now, we don't show individual test starts
-    // Could add verbose mode later that shows "Running: test_name..."
+    // Debug mode could later show "Running: test_name..." here
   }
 
   private handleTestComplete(data: TestCompleteEvent['data']): void {
-    const { name, passed, errors, prompt } = data;
+    const { name, passed, errors, prompt, messages } = data;
 
     if (passed) {
       console.log(`✅ ${name}: PASSED`);
@@ -119,6 +116,14 @@ export class ConsoleFormatter implements TestFormatter {
         });
       }
     }
+
+    // Show conversation in debug mode
+    if (this.options.debug && messages && messages.length > 0) {
+      console.log();
+      const formattedLines = formatConversation(messages, prompt);
+      formattedLines.forEach(line => console.log(line));
+      console.log();
+    }
   }
 
   private handleSuiteComplete(data: SuiteCompleteEvent['data']): void {
diff --git a/src/testing/display/formatters/JsonFormatter.ts b/src/testing/display/formatters/JsonFormatter.ts
@@ -20,7 +20,7 @@ export class JsonFormatter implements TestFormatter {
   flush(): void {
     // TODO: Implement JSON output
     // Could output to file or stdout depending on options
-    if (this.options.verbose) {
+    if (this.options.debug) {
       console.log('JSON formatter not yet implemented');
     }
   }
diff --git a/src/testing/display/formatters/JunitXmlFormatter.ts b/src/testing/display/formatters/JunitXmlFormatter.ts
@@ -282,7 +282,7 @@ export class JunitXmlFormatter implements TestFormatter {
     writeFileSync(this.outputFile, xml, 'utf8');
 
     // Validate the generated XML
-    if (this.options.verbose) {
+    if (this.options.debug) {
       const validation = validateJunitXmlContent(xml);
       if (!validation.valid) {
         console.warn(`JUnit XML validation errors: ${validation.errors.join(', ')}`);
diff --git a/src/testing/display/types.ts b/src/testing/display/types.ts
@@ -30,6 +30,7 @@ export interface TestCompleteEvent extends TestEvent {
     passed: boolean;
     errors: string[];
     prompt?: string;
+    messages?: any[]; // CoreMessage[] from 'ai' package
   };
 }
 
@@ -84,8 +85,7 @@ export interface TestFormatter {
 
 export interface DisplayOptions {
   formatter?: string;
-  quiet?: boolean;
-  verbose?: boolean;
+  debug?: boolean;
   junitXml?: string;
   version?: string;
 }
diff --git a/src/testing/display/utils/conversationFormatter.ts b/src/testing/display/utils/conversationFormatter.ts
@@ -0,0 +1,123 @@
+/**
+ * Utility functions for formatting conversation messages for console output
+ */
+
+/**
+ * Minimal message shape consumed by the conversation formatter.
+ */
+export interface ConversationMessage {
+  /** Speaker label; passed to formatRole to pick the header text and color. */
+  role: string;
+  /**
+   * Message payload. formatContent renders a string directly, walks an array
+   * as a list of typed parts, and JSON-stringifies anything else.
+   */
+  content: any;
+  /** Optional legacy tool calls; each entry's `toolName` and `args` are printed. */
+  toolInvocations?: any[];
+}
+
+/**
+ * Render a conversation as a list of console-ready lines.
+ *
+ * The transcript is framed by a dimmed 60-character rule at the top and
+ * bottom. When `prompt` is non-empty it is emitted first as a user turn.
+ * Every message contributes a role header, its formatted content, any
+ * legacy tool invocations, and a trailing blank line.
+ *
+ * @param messages - Messages to render, in display order.
+ * @param prompt - Optional initial prompt shown before the messages.
+ * @returns One string per output line (no trailing newlines).
+ */
+export function formatConversation(messages: ConversationMessage[], prompt?: string): string[] {
+  const rule = formatText('─'.repeat(60));
+  const lines: string[] = [rule];
+
+  if (prompt) {
+    lines.push(formatRole('user'), formatText(prompt), '');
+  }
+
+  for (const message of messages) {
+    lines.push(formatRole(message.role));
+    lines.push(...formatContent(message.content));
+
+    // Legacy shape: tool calls attached directly to the message.
+    const legacyCalls = message.toolInvocations;
+    if (legacyCalls && legacyCalls.length > 0) {
+      legacyCalls.forEach(call => {
+        lines.push(formatToolCall(call.toolName, call.args));
+      });
+    }
+
+    // Blank separator after each message.
+    lines.push('');
+  }
+
+  lines.push(rule);
+  return lines;
+}
+
+/**
+ * Build the colored `[ROLE]` header for a message.
+ *
+ * Known roles get a fixed ANSI color (user: green, assistant: cyan,
+ * system: yellow, tool: magenta). Any other role is upper-cased and
+ * shown in white.
+ *
+ * @param role - Role name taken from the message.
+ * @returns The header wrapped in ANSI color and reset codes.
+ */
+export function formatRole(role: string): string {
+  // A Map (rather than a plain object) so names like "constructor" never match.
+  const knownHeaders = new Map<string, string>([
+    ['user', '\x1b[32m[USER]\x1b[0m'], // Green
+    ['assistant', '\x1b[36m[ASSISTANT]\x1b[0m'], // Cyan
+    ['system', '\x1b[33m[SYSTEM]\x1b[0m'], // Yellow
+    ['tool', '\x1b[35m[TOOL]\x1b[0m'], // Magenta
+  ]);
+
+  const header = knownHeaders.get(role);
+  if (header !== undefined) {
+    return header;
+  }
+
+  return `\x1b[37m[${role.toUpperCase()}]\x1b[0m`; // White
+}
+
+/**
+ * Wrap text in the ANSI "bright black" (dim gray) color.
+ *
+ * @param text - Text to dim.
+ * @returns `text` surrounded by the color code and a reset code.
+ */
+export function formatText(text: string): string {
+  const dim = '\x1b[90m';
+  const reset = '\x1b[0m';
+  return `${dim}${text}${reset}`;
+}
+
+/**
+ * Turn a message's content into dimmed output lines.
+ *
+ * - A string becomes a single line.
+ * - An array is treated as a list of parts: `text`, `tool-call` and
+ *   `tool-result` parts each yield one line; other part types are skipped.
+ * - Anything else is JSON-stringified onto a single line.
+ *
+ * @param content - Message content in any of the shapes above.
+ * @returns The formatted lines, in part order.
+ */
+export function formatContent(content: any): string[] {
+  if (typeof content === 'string') {
+    return [formatText(content)];
+  }
+
+  if (!Array.isArray(content)) {
+    // Fallback for other content types
+    return [formatText(JSON.stringify(content))];
+  }
+
+  // Content array (multimodal messages)
+  const rendered: string[] = [];
+  content.forEach((part: any) => {
+    switch (part.type) {
+      case 'text':
+        rendered.push(formatText(part.text));
+        break;
+      case 'tool-call':
+        rendered.push(formatToolCall(part.toolName, part.args));
+        break;
+      case 'tool-result':
+        rendered.push(formatToolResult(part.result));
+        break;
+      default:
+        // Unrecognized part types produce no output.
+        break;
+    }
+  });
+  return rendered;
+}
+
+/**
+ * Render a tool invocation as a single dimmed line.
+ *
+ * @param toolName - Name of the tool that was called.
+ * @param args - Arguments passed to the tool; shown as JSON.
+ * @returns A line of the form `🔧 Tool Call: name(jsonArgs)`.
+ */
+export function formatToolCall(toolName: string, args: any): string {
+  const serializedArgs = JSON.stringify(args);
+  const callText = `🔧 Tool Call: ${toolName}(${serializedArgs})`;
+  return formatText(callText);
+}
+
+/**
+ * Render a tool result as a single dimmed line.
+ *
+ * The result is shown as JSON and cut to 200 characters, with `...`
+ * appended when it was longer.
+ *
+ * @param result - Value returned by the tool; may be undefined.
+ * @returns A line of the form `✅ Tool Result: json`.
+ */
+export function formatToolResult(result: any): string {
+  const maxLength = 200;
+
+  // JSON.stringify returns undefined (not a string) for undefined, functions
+  // and symbols; reading `.length` on that would throw and abort the debug
+  // output, so fall back to a printable placeholder.
+  const serialized: string | undefined = JSON.stringify(result);
+  const resultStr = serialized === undefined ? 'undefined' : serialized;
+
+  const truncated =
+    resultStr.length > maxLength ? `${resultStr.substring(0, maxLength)}...` : resultStr;
+  return formatText(`✅ Tool Result: ${truncated}`);
+}
diff --git a/src/testing/evals/runner.ts b/src/testing/evals/runner.ts
@@ -19,8 +19,7 @@ export interface EvalSummary {
 interface EvalServerOptions {
   serverConfig: ServerConfig;
   timeout?: number;
-  quiet?: boolean;
-  verbose?: boolean;
+  debug?: boolean;
 }
 
 export class EvalTestRunner {
@@ -92,7 +91,8 @@ export class EvalTestRunner {
               result.passed,
               result.errors,
               model,
-              test.prompt
+              test.prompt,
+              result.messages
             );
           }
         }
@@ -109,15 +109,7 @@ export class EvalTestRunner {
         results,
       };
 
-      // Notify display manager about test suite completion
-      if (this.displayManager) {
-        this.displayManager.suiteComplete(
-          summary.total,
-          summary.passed,
-          summary.failed,
-          summary.duration
-        );
-      }
+      // Note: suiteComplete is called by the main runner, not here
 
       return summary;
     } finally {
@@ -212,7 +204,9 @@ export class EvalTestRunner {
     if (expectedToolCalls.required) {
       for (const requiredTool of expectedToolCalls.required) {
         if (!actualToolNames.includes(requiredTool)) {
-          errors.push(`Required tool '${requiredTool}' was not called`);
+          errors.push(
+            `Required tool '${requiredTool}' was not called (actual calls: ${actualToolNames.length > 0 ? actualToolNames.join(', ') : 'none'})`
+          );
         }
       }
     }
@@ -229,7 +223,9 @@ export class EvalTestRunner {
 
       for (const actualTool of actualToolNames) {
         if (!allowedTools.includes(actualTool)) {
-          errors.push(`Tool '${actualTool}' was called but not in allowed list`);
+          errors.push(
+            `Tool '${actualTool}' was called but not in allowed list (allowed: ${allowedTools.join(', ')})`
+          );
         }
       }
     }
diff --git a/src/testing/runner.ts b/src/testing/runner.ts
@@ -16,8 +16,7 @@ interface ServerOptions {
   serverConfig: string;
   serverName?: string;
   timeout?: number;
-  quiet?: boolean;
-  verbose?: boolean;
+  debug?: boolean;
   junitXml?: string;
 }
 
@@ -33,8 +32,7 @@ export class TestRunner {
     // Create display manager with options
     const displayOptions: DisplayOptions = {
       formatter: 'console',
-      quiet: serverOptions.quiet,
-      verbose: serverOptions.verbose,
+      debug: serverOptions.debug,
       junitXml: serverOptions.junitXml,
       version: this.getVersion(),
     };
@@ -82,8 +80,7 @@ export class TestRunner {
         {
           serverConfig,
           timeout: this.serverOptions.timeout,
-          quiet: this.serverOptions.quiet,
-          verbose: this.serverOptions.verbose,
+          debug: this.serverOptions.debug,
         },
         this.displayManager
       );
@@ -110,8 +107,7 @@ export class TestRunner {
           {
             serverConfig,
             timeout: this.serverOptions.timeout,
-            quiet: this.serverOptions.quiet,
-            verbose: this.serverOptions.verbose,
+            debug: this.serverOptions.debug,
           },
           this.displayManager
         );
diff --git a/test/unit/junit-xml-formatter.test.ts b/test/unit/junit-xml-formatter.test.ts
@@ -13,7 +13,7 @@ import { tmpdir } from 'os';
 describe('JunitXmlFormatter', () => {
   let formatter: JunitXmlFormatter;
   let outputFile: string;
-  const options: DisplayOptions = { verbose: false };
+  const options: DisplayOptions = { debug: false };
 
   beforeEach(() => {
     // Create a unique temp file for each test
diff --git a/test/unit/tool-validation.test.ts b/test/unit/tool-validation.test.ts

Original file line number	Diff line number	Diff line change
`@@ -19,8 +19,7 @@ import type { DisplayManager } from '../display/DisplayManager.js';`
`19`	`19`	`interface ServerOptions {`
`20`	`20`	`serverConfig: ServerConfig;`
`21`	`21`	`timeout?: number;`
`22`		`- quiet?: boolean;`
`23`		`- verbose?: boolean;`
	`22`	`+ debug?: boolean;`
`24`	`23`	`}`
`25`	`24`
`26`	`25`	`export class CapabilitiesTestRunner {`
Original file line number	Diff line number	Diff line change
`@@ -20,7 +20,7 @@ export class JsonFormatter implements TestFormatter {`
`20`	`20`	`flush(): void {`
`21`	`21`	`// TODO: Implement JSON output`
`22`	`22`	`// Could output to file or stdout depending on options`
`23`		`- if (this.options.verbose) {`
	`23`	`+ if (this.options.debug) {`
`24`	`24`	`console.log('JSON formatter not yet implemented');`
`25`	`25`	`}`
`26`	`26`	`}`