|
1 | 1 | import random
|
| 2 | +import time |
| 3 | +from dataclasses import dataclass |
2 | 4 | from typing import Sequence
|
3 | 5 |
|
4 | 6 | import arviz
|
5 | 7 | import hagelkorn
|
6 | 8 | import numpy
|
| 9 | +import pandas |
7 | 10 | import pytest
|
8 | 11 |
|
| 12 | +import mcbackend |
9 | 13 | from mcbackend.meta import ChainMeta, DataVariable, RunMeta, Variable
|
10 | 14 | from mcbackend.npproto import utils
|
11 | 15 |
|
@@ -238,14 +242,115 @@ def test__to_inferencedata(self):
|
238 | 242 | pass
|
239 | 243 |
|
240 | 244 |
|
241 |
| -class CheckPerformance(BaseBackendTest): |
@dataclass
class AppendSpeed:
    """Throughput figures obtained from appending draws to a chain."""

    # Number of draws appended per second.
    draws_per_second: float
    # Payload size of a single draw in bytes.
    bytes_per_draw: float

    @property
    def mib_per_second(self) -> float:
        """Data throughput in MiB (1024 * 1024 bytes) per second."""
        bytes_per_second = self.draws_per_second * self.bytes_per_draw
        return bytes_per_second / 1024 / 1024

    def __str__(self):
        mib = self.mib_per_second
        draws = self.draws_per_second
        return f"{mib:.1f} MiB/s ({draws:.1f} draws/s)"
| 256 | + |
| 257 | + |
def run_chain(run: Run, chain_number: int = 0, tmax: float = 10) -> AppendSpeed:
    """Append with max speed to one chain for `tmax` seconds.

    Parameters
    ----------
    run : Run
        Run on which the chain is initialized via ``run.init_chain``.
    chain_number : int
        Chain number that is passed to ``run.init_chain``.
    tmax : float
        Time budget in seconds. Appending stops once it is used up.

    Returns
    -------
    speed : AppendSpeed
        Achieved draws per second and the size of one draw in bytes.
    """
    # The same draw is appended over and over, so creating it
    # is not part of the timed section.
    draw = make_draw(run.meta.variables)
    bytes_per_draw = sum(v.size * v.itemsize for v in draw.values())

    chain = run.init_chain(chain_number)
    # perf_counter is monotonic, whereas time.time() may jump
    # when the system clock gets adjusted during the measurement.
    t_start = time.perf_counter()
    last_update = t_start
    now = t_start
    d = 0
    while now - t_start < tmax:
        chain.append(draw)
        d += 1
        # One clock reading per iteration serves the loop condition,
        # the progress report and the final elapsed time.
        now = time.perf_counter()
        if now - last_update > 1:
            print(f"Inserted {d} draws")
            last_update = now

    # Stop the clock BEFORE the length check, so that the cost
    # of len(chain) does not count towards the append speed.
    elapsed = now - t_start
    assert len(chain) == d

    # With tmax <= 0 nothing was appended and no time has passed.
    dps = d / elapsed if elapsed > 0 else 0.0
    return AppendSpeed(dps, bytes_per_draw)
| 279 | + |
| 280 | + |
class BackendBenchmark:
    """A collection of backend benchmarking methods.

    Every method whose name starts with ``measure_`` is treated as a benchmark
    by ``run_all_benchmarks`` and is expected to return an ``AppendSpeed``.
    The benchmarks read ``self.backend``, which must be assigned beforehand.
    """

    backend: mcbackend.Backend

    def run_all_benchmarks(self) -> pandas.DataFrame:
        """Runs each benchmark method and summarizes the results in a DataFrame.

        Returns
        -------
        df : pandas.DataFrame
            One row per benchmark, indexed by "title" (the method name without
            its "measure_" prefix), with the columns "bytes_per_draw",
            "append_speed" and "description" (the docstring of the method).
        """
        prefix = "measure_"
        df = pandas.DataFrame(
            columns=["title", "bytes_per_draw", "append_speed", "description"]
        ).set_index("title")
        # Inspect the class of `self` rather than BackendBenchmark,
        # so that benchmarks added by subclasses are picked up too.
        for attr in dir(type(self)):
            # Filter by name first to avoid touching unrelated attributes.
            if not attr.startswith(prefix):
                continue
            meth = getattr(self, attr, None)
            if not callable(meth):
                continue

            # The setup hook is optional: this class does not define one.
            setup = getattr(self, "setup_method", None)
            if callable(setup):
                try:
                    setup(meth)
                except TypeError:
                    # NOTE(review): kept as best-effort from the original code;
                    # presumably tolerates hooks with a different signature.
                    pass

            print(f"Running {attr}")
            speed = meth()
            df.loc[attr[len(prefix) :], ["bytes_per_draw", "append_speed", "description"]] = (
                speed.bytes_per_draw,
                str(speed),
                meth.__doc__,
            )
        return df

    def measure_many_draws(self) -> AppendSpeed:
        """One chain of (), (3,) and (5,2) float32 variables."""
        rmeta = RunMeta(
            rid=hagelkorn.random(),
            variables=[
                Variable("v1", "float32", []),
                Variable("v2", "float32", [3]),
                Variable("v3", "float32", [5, 2]),
            ],
        )
        return run_chain(self.backend.init_run(rmeta))

    def measure_many_variables(self) -> AppendSpeed:
        """One chain with 300 float32 variables alternating between shapes () and (5,)."""
        rmeta = RunMeta(
            rid=hagelkorn.random(),
            # `v % 2` is 0 or 1, so the slice yields [] for even and [5] for odd v.
            variables=[Variable(f"v{v}", "float32", [5, 2][: v % 2]) for v in range(300)],
        )
        return run_chain(self.backend.init_run(rmeta))

    def measure_big_variables(self) -> AppendSpeed:
        """One chain with 3 variables of shapes (100,), (1000,) and (100, 100)."""
        rmeta = RunMeta(
            rid=hagelkorn.random(),
            variables=[
                Variable("v1", "float32", [100]),
                Variable("v2", "float32", [1000]),
                Variable("v3", "float32", [100, 100]),
            ],
        )
        return run_chain(self.backend.init_run(rmeta))
| 338 | + |
| 339 | + |
class CheckPerformance(BaseBackendTest, BackendBenchmark):
    """Checks that the backend is reasonably fast via various high-load tests.

    Each test passes if EITHER the draws/s OR the MiB/s threshold is exceeded.
    """

    def test__many_draws(self):
        """Requires more than 5000 draws/s or more than 1 MiB/s."""
        speed = self.measure_many_draws()
        assert (
            speed.draws_per_second > 5000 or speed.mib_per_second > 1
        ), f"Backend too slow: {speed}"

    def test__many_variables(self):
        """Requires more than 500 draws/s or more than 5 MiB/s."""
        speed = self.measure_many_variables()
        assert (
            speed.draws_per_second > 500 or speed.mib_per_second > 5
        ), f"Backend too slow: {speed}"

    def test__big_variables(self):
        """Requires more than 500 draws/s or more than 5 MiB/s."""
        speed = self.measure_big_variables()
        assert (
            speed.draws_per_second > 500 or speed.mib_per_second > 5
        ), f"Backend too slow: {speed}"
|
0 commit comments