Added option to regenerate test artifact

jaredoconnell · jaredoconnell · commit 2063d43ae062 · 2025-06-16T18:22:13.000-04:00
diff --git a/tests/unit/entrypoints/assets/benchmarks_stripped_output.txt b/tests/unit/entrypoints/assets/benchmarks_stripped_output.txt
@@ -3,44 +3,29 @@
 Benchmarks Metadata:
     Run id:93e36b31-b454-471d-ba62-6b2671585485
     Duration:30.2 seconds
-    Profile:type=sweep, strategies=['synchronous', 'throughput', 'constant', 'constant', 'constant', 'constant',        
-    'constant', 'constant', 'constant', 'constant'], max_concurrency=None                                               
-    Args:max_number=None, max_duration=30.0, warmup_number=None, warmup_duration=None, cooldown_number=None,            
-    cooldown_duration=None                                                                                              
-    Worker:type_='generative_requests_worker' backend_type='openai_http' backend_target='example_target'                
-    backend_model='example_model' backend_info={'max_output_tokens': 16384, 'timeout': 300, 'http2': True,              
-    'authorization': False, 'organization': None, 'project': None, 'text_completions_path': '/v1/completions',          
-    'chat_completions_path': '/v1/chat/completions'}                                                                    
-    Request Loader:type_='generative_request_loader' data='prompt_tokens=256,output_tokens=128' data_args=None          
-    processor='example_processor' processor_args=None                                                                   
+    Profile:type=sweep, strategies=['synchronous', 'throughput', 'constant', 'constant', 'constant', 'constant', 'constant', 'constant', 'constant', 'constant'],                   
+    max_concurrency=None                                                                                                                                                            
+    Args:max_number=None, max_duration=30.0, warmup_number=None, warmup_duration=None, cooldown_number=None, cooldown_duration=None
+    Worker:type_='generative_requests_worker' backend_type='openai_http' backend_target='example_target' backend_model='example_model' backend_info={'max_output_tokens': 16384,    
+    'timeout': 300, 'http2': True, 'authorization': False, 'organization': None, 'project': None, 'text_completions_path': '/v1/completions', 'chat_completions_path':              
+    '/v1/chat/completions'}                                                                                                                                                         
+    Request Loader:type_='generative_request_loader' data='prompt_tokens=256,output_tokens=128' data_args=None processor='example_processor' processor_args=None
     Extras:None
                 
                 
 Benchmarks Info:
-========================================================================================================================
-===========================                                                                                             
-Metadata                                    |||| Requests Made  ||| Prompt Tok/Req ||| Output Tok/Req  ||| Prompt Tok   
-Total||| Output Tok Total  ||                                                                                           
-  Benchmark| Start Time| End Time| Duration (s)|  Comp|  Inc|  Err|  Comp|   Inc| Err|   Comp|  Inc|  Err|   Comp|  Inc|
-Err|   Comp|   Inc|   Err                                                                                               
------------|-----------|---------|-------------|------|-----|-----|------|------|----|-------|-----|-----|-------|-----|
------|-------|------|------                                                                                             
-synchronous|   16:59:28| 16:59:58|         30.0|    46|    1|    0| 257.1| 256.0| 0.0|  128.0|  0.0|  0.0|  11827|  256|
-0|   5888|     0|     0                                                                                                 
-========================================================================================================================
-===========================                                                                                             
+===================================================================================================================================================
+Metadata                                    |||| Requests Made  ||| Prompt Tok/Req ||| Output Tok/Req  ||| Prompt Tok Total||| Output Tok Total  ||
+  Benchmark| Start Time| End Time| Duration (s)|  Comp|  Inc|  Err|  Comp|   Inc| Err|   Comp|  Inc|  Err|   Comp|  Inc|  Err|   Comp|   Inc|   Err
+-----------|-----------|---------|-------------|------|-----|-----|------|------|----|-------|-----|-----|-------|-----|-----|-------|------|------
+synchronous|   16:59:28| 16:59:58|         30.0|    46|    1|    0| 257.1| 256.0| 0.0|  128.0|  0.0|  0.0|  11827|  256|    0|   5888|     0|     0
+===================================================================================================================================================
                  
                  
 Benchmarks Stats:
-========================================================================================================================
-=======================                                                                                                 
-Metadata   | Request Stats         || Out Tok/sec| Tot Tok/sec| Req Latency (sec)  ||| TTFT (ms)       ||| ITL (ms)     
-||| TPOT (ms)      ||                                                                                                   
-  Benchmark| Per Second| Concurrency|        mean|        mean|  mean|  median|   p99| mean| median|  p99| mean| median|
-p99| mean| median| p99                                                                                                  
------------|-----------|------------|------------|------------|------|--------|------|-----|-------|-----|-----|-------|
-----|-----|-------|----                                                                                                 
-synchronous|       1.55|        1.00|       198.1|       992.7|  0.64|    0.64|  0.69| 16.8|   16.4| 21.3|  4.9|    4.9|
-5.3|  4.9|    4.9| 5.2                                                                                                  
-========================================================================================================================
-=======================                                                                                                 
+===============================================================================================================================================
+Metadata   | Request Stats         || Out Tok/sec| Tot Tok/sec| Req Latency (sec)  ||| TTFT (ms)       ||| ITL (ms)       ||| TPOT (ms)      ||
+  Benchmark| Per Second| Concurrency|        mean|        mean|  mean|  median|   p99| mean| median|  p99| mean| median| p99| mean| median| p99
+-----------|-----------|------------|------------|------------|------|--------|------|-----|-------|-----|-----|-------|----|-----|-------|----
+synchronous|       1.55|        1.00|       198.1|       992.7|  0.64|    0.64|  0.69| 16.8|   16.4| 21.3|  4.9|    4.9| 5.3|  4.9|    4.9| 5.2
+===============================================================================================================================================
diff --git a/tests/unit/entrypoints/test_display_entrypoint.py b/tests/unit/entrypoints/test_display_entrypoint.py
@@ -7,6 +7,10 @@
 from guidellm.benchmark import display_benchmarks_report
 
 
+# Set to true to re-write the expected output.
+REGENERATE_ARTIFACTS = False
+
+
 @pytest.fixture
 def get_test_asset_dir():
     def _() -> Path:
@@ -32,14 +36,18 @@ def test_display_entrypoint_yaml(capfd, get_test_asset_dir):
 
 
 def generic_test_display_entrypoint(filename, capfd, get_test_asset_dir):
-    os.environ["COLUMNS"] = "120"  # CLI output depends on terminal width.
+    os.environ["COLUMNS"] = "180"  # CLI output depends on terminal width.
     asset_dir = get_test_asset_dir()
     display_benchmarks_report(asset_dir / filename)
     out, err = capfd.readouterr()
     expected_output_path = asset_dir / "benchmarks_stripped_output.txt"
-    with expected_output_path.open(encoding="utf_8") as file:
-        expected_output = file.read()
-    assert out == expected_output
+    if REGENERATE_ARTIFACTS:
+        expected_output_path.write_text(out)
+        assert False  # Fail to prevent accidentally leaving this set
+    else:
+        with expected_output_path.open(encoding="utf_8") as file:
+            expected_output = file.read()
+        assert out == expected_output
 
 
 if __name__ == "__main__":