11import os
22import json
33import random
4+ import math
45from typing import Any , Dict , List
56from guidellm .core .distribution import Distribution
67from guidellm .core import TextGenerationBenchmarkReport , TextGenerationBenchmark
@@ -74,16 +75,72 @@ def generate_run_info(report: TextGenerationBenchmarkReport) -> Dict[str, Any]:
7475 "timestamp" : timestamp
7576 }
7677
def linearly_interpolate_value(target_input, lower_input, lower_output, upper_input, upper_output):
    """Linearly interpolate an output value for ``target_input``.

    Given two known points ``(lower_input, lower_output)`` and
    ``(upper_input, upper_output)``, return the y-value at ``target_input``
    on the straight line joining them.

    Args:
        target_input: The x-value at which to interpolate.
        lower_input: x-value of the lower known point.
        lower_output: y-value of the lower known point.
        upper_input: x-value of the upper known point (PEP 8 fix: renamed
            from camelCase ``upperInput``; all in-file callers are positional).
        upper_output: y-value of the upper known point.

    Returns:
        The linearly interpolated y-value at ``target_input``.

    Raises:
        ZeroDivisionError: If ``upper_input == lower_input`` (degenerate segment).
    """
    fraction = (target_input - lower_input) / (upper_input - lower_input)
    return lower_output + fraction * (upper_output - lower_output)
81+
def generate_request_over_time_data(benchmarks: List[TextGenerationBenchmark]) -> List[Dict[str, Any]]:
    """Build "requests over time" metric reports, one per requests-per-second level.

    For each benchmark, computes the elapsed time of each completed result
    (result end time minus benchmark start time) and summarizes it via
    ``generate_metric_report``. With a single benchmark, those per-benchmark
    reports are returned directly. With multiple benchmarks, the function
    instead linearly interpolates request-timing data at every integer RPS
    value between the smallest and largest observed completed request rates,
    and returns reports for those interpolated levels.

    Args:
        benchmarks: Benchmarks whose results carry ``end_time`` values and
            which expose ``start_time`` and ``completed_request_rate``.

    Returns:
        A list of metric-report dicts, each tagged with a
        ``"requestsPerSecond"`` key.
    """

    request_over_time_results = []
    for benchmark in benchmarks:
        # compare benchmark start time to text generation result end time
        all_result_end_times = [result.end_time for result in benchmark.results if result.end_time is not None]
        request_over_time_values = list(map(lambda time: time - benchmark.start_time, all_result_end_times))
        request_distribution = Distribution(data=request_over_time_values)
        result = generate_metric_report(request_distribution, "requestsOverTime")
        result["requestsPerSecond"] = benchmark.completed_request_rate
        request_over_time_results.append(result)

    # Single benchmark: nothing to interpolate between, return raw reports.
    if len(benchmarks) == 1:
        return request_over_time_results

    # Re-collect raw elapsed-time lists, ordered by ascending completed RPS,
    # so neighboring entries bracket each interpolation target.
    request_over_time_raw = []
    sorted_bm = sorted(benchmarks, key=lambda bm: bm.completed_request_rate)
    for benchmark in sorted_bm:
        # compare benchmark start time to text generation result end time
        all_result_end_times = [result.end_time for result in benchmark.results if result.end_time is not None]
        request_over_time_values = list(map(lambda time: time - benchmark.start_time, all_result_end_times))
        request_at_rps = { "rps": benchmark.completed_request_rate, "requests_over_time": request_over_time_values }
        request_over_time_raw.append(request_at_rps)

    rps_values = [request_obj["rps"] for request_obj in request_over_time_raw]
    # Integer RPS targets spanning the observed rates; note range() excludes
    # ceil(max), so every target is strictly below the largest measured rate.
    rps_range = list(range(math.ceil(min(rps_values)), math.ceil(max(rps_values))))
    interpolated_request_values = []
    # Index of the measured benchmark at or below the current target RPS;
    # walked forward as targets increase (rps_range is ascending).
    lower_rps_index = 0
    for rps in rps_range:
        # Advance past the current bracket when the target overtakes its upper bound.
        # NOTE(review): after the exact-match branch below advances
        # lower_rps_index, this lookup at lower_rps_index + 1 can run past the
        # end of rps_values (IndexError) — e.g. two benchmarks whose lower
        # rate is hit exactly. Verify against real multi-benchmark runs.
        if rps > rps_values[lower_rps_index + 1]: lower_rps_index += 1
        if rps == rps_values[lower_rps_index]:
            # Target coincides with a measured rate: copy its raw data verbatim.
            interpolated_request_values.append({
                "requests_per_second": rps,
                "requests_over_time": request_over_time_raw[lower_rps_index]["requests_over_time"][:]
            })
            lower_rps_index += 1
        elif rps < rps_values[lower_rps_index + 1]:
            # Target lies inside the current bracket: interpolate element-wise
            # between the lower and upper benchmarks' elapsed-time lists.
            # NOTE(review): assumes both benchmarks produced the same number
            # of results (pairwise indexing by position) — TODO confirm.
            interpolated_requests_at_new_rps = []
            for i in range(len(request_over_time_raw[lower_rps_index]["requests_over_time"])):
                lower_request = request_over_time_raw[lower_rps_index]["requests_over_time"][i]
                upper_request = request_over_time_raw[lower_rps_index + 1]["requests_over_time"][i]
                new_value = linearly_interpolate_value(rps, rps_values[lower_rps_index], lower_request, rps_values[lower_rps_index + 1], upper_request)
                interpolated_requests_at_new_rps.append(new_value)
            interpolated_request_values.append({ "requests_per_second": rps, "requests_over_time": interpolated_requests_at_new_rps })
        elif rps > rps_values[lower_rps_index + 1]:
            # Target skipped past one or more measured rates (sparse data):
            # catch the bracket up before interpolating as above.
            while rps > rps_values[lower_rps_index + 1]:
                lower_rps_index += 1
            interpolated_requests_at_new_rps = []
            for i in range(len(request_over_time_raw[lower_rps_index]["requests_over_time"])):
                lower_request = request_over_time_raw[lower_rps_index]["requests_over_time"][i]
                upper_request = request_over_time_raw[lower_rps_index + 1]["requests_over_time"][i]
                new_value = linearly_interpolate_value(rps, rps_values[lower_rps_index], lower_request, rps_values[lower_rps_index + 1], upper_request)
                interpolated_requests_at_new_rps.append(new_value)
            interpolated_request_values.append({ "requests_per_second": rps, "requests_over_time": interpolated_requests_at_new_rps })
    # Summarize each interpolated RPS level into a metric report.
    interpolated_request_over_time_results = []
    for request_value in interpolated_request_values:
        request_distribution = Distribution(data=request_value["requests_over_time"])
        result = generate_metric_report(request_distribution, "requestsOverTime")
        result["requestsPerSecond"] = request_value["requests_per_second"]
        interpolated_request_over_time_results.append(result)

    return interpolated_request_over_time_results
87144
88145
89146def generate_workload_details (report : TextGenerationBenchmarkReport ) -> Dict [str , Any ]:
@@ -93,13 +150,18 @@ def generate_workload_details(report: TextGenerationBenchmarkReport) -> Dict[str
93150 all_output_token_distribution = Distribution (data = all_output_token_data )
94151
95152 prompt_token_data = generate_metric_report (all_prompt_token_distribution , "tokenDistributions" )
96- prompt_token_samples = [result .prompt for benchmark in report .benchmarks for result in benchmark .results ]
97- sample_prompts = random .sample (prompt_token_samples , min (5 , len (prompt_token_samples )))
98- sample_prompts = list (map (lambda prompt : prompt .replace ("\n " , " " ).replace ("\" " , "'" ), sample_prompts ))
99153 output_token_data = generate_metric_report (all_output_token_distribution , "tokenDistributions" )
154+
155+ prompt_token_samples = [result .prompt for benchmark in report .benchmarks for result in benchmark .results ]
100156 output_token_samples = [result .output for benchmark in report .benchmarks for result in benchmark .results ]
101- sample_outputs = random .sample (output_token_samples , min (5 , len (output_token_samples )))
102157
158+ num_samples = min (5 , len (prompt_token_samples ), len (output_token_samples ))
159+ sample_indices = random .sample (range (len (prompt_token_samples )), num_samples )
160+
161+ sample_prompts = [prompt_token_samples [i ] for i in sample_indices ]
162+ sample_prompts = list (map (lambda prompt : prompt .replace ("\n " , " " ).replace ("\" " , "'" ), sample_prompts ))
163+
164+ sample_outputs = [output_token_samples [i ] for i in sample_indices ]
103165 sample_outputs = list (map (lambda output : output .replace ("\n " , " " ).replace ("\" " , "'" ), sample_outputs ))
104166
105167 request_over_time_results = generate_request_over_time_data (report .benchmarks )
0 commit comments