Ensure timezones are UTC

ianayl · ianayl · commit 9bd519fee870 · 2025-04-01T13:16:08.000-07:00
diff --git a/devops/scripts/benchmarks/compare.py b/devops/scripts/benchmarks/compare.py
@@ -1,4 +1,4 @@
-from utils.aggregate import SimpleMedian
+from utils.aggregate import Aggregator, SimpleMedian
 from utils.validate import Validate
 from utils.result import Result, BenchmarkRun
 from options import options
@@ -7,6 +7,7 @@
 import sys
 import json
 import argparse
+from datetime import datetime, timezone
 from pathlib import Path
 from dataclasses import dataclass, asdict
 
@@ -106,7 +107,7 @@ def check_benchmark_result(result: BenchmarkRun) -> bool:
             if result.name != result_name:
                 print(f"Warning: Result file {result_path} does not match specified result name {result.name}.")
                 return False
-            if result.date < datetime.strptime(cutoff, "%Y%m%d_%H%M%S"):
+            if result.date < datetime.strptime(cutoff, "%Y%m%d_%H%M%S").replace(tzinfo=timezone.utc):
                 return False
             return True
 
@@ -183,6 +184,14 @@ def to_hist_avg(
         Returns:
             A tuple returning (list of improved tests, list of regressed tests).
         """
+        def halfway_round(value: float, n: int) -> float:
+            """
+            Round value to n decimal places, halves away from zero (0.5 -> 1,
+            -0.5 -> -1), unlike round()'s banker's rounding. 0 is returned as-is.
+            """
+            if value == 0: return 0  # value / abs(value) below would divide by zero
+            return int(value * 10**n + 0.5 * (value / abs(value))) / 10**n  # int() truncates toward zero
+
         improvement = []
         regression = []
 
@@ -206,9 +215,11 @@ def perf_diff_entry() -> dict:
                 res["avg_type"] = hist_avg[test.name].average_type
                 return res
 
-            if delta > options.regression_threshold:
+            # Round to 2 decimal places: not going to fail a test on 0.001% over
+            # regression threshold
+            if halfway_round(delta, 2) > options.regression_threshold:
                 improvement.append(perf_diff_entry())
-            elif delta < -options.regression_threshold:
+            elif halfway_round(delta, 2) < -options.regression_threshold:
                 regression.append(perf_diff_entry())
 
         return improvement, regression
diff --git a/devops/scripts/benchmarks/history.py b/devops/scripts/benchmarks/history.py
@@ -120,7 +120,7 @@ def save(self, save_name, results: list[Result], to_file=True):
 
         # Use formatted timestamp for the filename
         timestamp = (
-            datetime.now().strftime("%Y%m%d_%H%M%S")
+            datetime.now(tz=timezone.utc).strftime("%Y%m%d_%H%M%S")
             if options.timestamp_override is None else 
             options.timestamp_override
         )

Original file line number	Diff line number	Diff line change
`@@ -120,7 +120,7 @@ def save(self, save_name, results: list[Result], to_file=True):`
`120`	`120`
`121`	`121`	`# Use formatted timestamp for the filename`
`122`	`122`	`timestamp = (`
`123`		`- datetime.now().strftime("%Y%m%d_%H%M%S")`
	`123`	`+ datetime.now(tz=timezone.utc).strftime("%Y%m%d_%H%M%S")`
`124`	`124`	`if options.timestamp_override is None else`
`125`	`125`	`options.timestamp_override`
`126`	`126`	`)`