Skip to content

Commit 5ac9805

Browse files
feat: e2e actually works
1 parent 4a07c37 commit 5ac9805

31 files changed

+878
-475
lines changed

.gitignore

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -230,3 +230,6 @@ src/ui/next-env.d.ts
230230
!src/ui/public/manifest.json
231231
!src/ui/serve.json
232232
.eslintcache
233+
234+
# vllm-sim
235+
bin/

src/guidellm/__main__.py

Lines changed: 33 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -200,6 +200,33 @@ def benchmark():
200200
"Defaults to None."
201201
),
202202
)
203+
@click.option(
204+
"--max-errors",
205+
type=int,
206+
default=GenerativeTextScenario.get_default("max_errors"),
207+
help=(
208+
"The maximum number of errors allowed before stopping the benchmark. "
209+
"Defaults to None."
210+
),
211+
)
212+
@click.option(
213+
"--max-error-rate",
214+
type=float,
215+
default=GenerativeTextScenario.get_default("max_error_rate"),
216+
help=(
217+
"The maximum error rate allowed before stopping the benchmark. "
218+
"Should be a value between 0 and 1. Defaults to None."
219+
),
220+
)
221+
@click.option(
222+
"--max-global-error-rate",
223+
type=float,
224+
default=GenerativeTextScenario.get_default("max_global_error_rate"),
225+
help=(
226+
"The maximum global error rate allowed before stopping the benchmark. "
227+
"Should be a value between 0 and 1. Defaults to None."
228+
),
229+
)
203230
@click.option(
204231
"--disable-progress",
205232
is_flag=True,
@@ -263,6 +290,9 @@ def run(
263290
max_requests,
264291
warmup_percent,
265292
cooldown_percent,
293+
max_errors,
294+
max_error_rate,
295+
max_global_error_rate,
266296
disable_progress,
267297
display_scheduler_stats,
268298
disable_console_outputs,
@@ -290,6 +320,9 @@ def run(
290320
max_requests=max_requests,
291321
warmup_percent=warmup_percent,
292322
cooldown_percent=cooldown_percent,
323+
max_errors=max_errors,
324+
max_error_rate=max_error_rate,
325+
max_global_error_rate=max_global_error_rate,
293326
output_sampling=output_sampling,
294327
random_seed=random_seed,
295328
)

src/guidellm/backend/__init__.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -5,6 +5,8 @@
55
and timing utilities for standardized communication with LLM providers.
66
"""
77

8+
# Import backend implementations to trigger registration
9+
from . import openai # noqa: F401
810
from .backend import (
911
Backend,
1012
BackendType,

src/guidellm/benchmark/__init__.py

Lines changed: 17 additions & 24 deletions
Original file line number | Diff line number | Diff line change
@@ -1,19 +1,21 @@
1-
from .aggregator import AggregatorT, BenchmarkAggregator, GenerativeBenchmarkAggregator
1+
from .aggregator import (
2+
AggregatorT,
3+
GenerativeRequestsAggregator,
4+
SchedulerStatsAggregator,
5+
)
26
from .benchmark import (
37
Benchmark,
4-
BenchmarkArgs,
58
BenchmarkMetrics,
69
BenchmarkSchedulerStats,
710
BenchmarkT,
811
GenerativeBenchmark,
12+
GenerativeBenchmarksReport,
913
GenerativeMetrics,
1014
GenerativeRequestStats,
11-
GenerativeTextErrorStats,
12-
StatusBreakdown,
1315
)
14-
from .benchmarker import Benchmarker, BenchmarkerResult, GenerativeBenchmarker
16+
from .benchmarker import Benchmarker
1517
from .entrypoints import benchmark_generative_text, reimport_benchmarks_report
16-
from .output import GenerativeBenchmarksConsole, GenerativeBenchmarksReport
18+
from .output import GenerativeBenchmarkerConsole
1719
from .profile import (
1820
AsyncProfile,
1921
ConcurrentProfile,
@@ -22,46 +24,37 @@
2224
SweepProfile,
2325
SynchronousProfile,
2426
ThroughputProfile,
25-
create_profile,
2627
)
2728
from .progress import (
28-
BenchmarkerProgressDisplay,
29-
BenchmarkerTaskProgressState,
30-
GenerativeTextBenchmarkerProgressDisplay,
31-
GenerativeTextBenchmarkerTaskProgressState,
29+
BenchmarkerProgress,
30+
BenchmarkerProgressGroup,
31+
GenerativeConsoleBenchmarkerProgress,
3232
)
3333

3434
__all__ = [
3535
"AggregatorT",
3636
"AsyncProfile",
3737
"Benchmark",
38-
"BenchmarkAggregator",
39-
"BenchmarkArgs",
4038
"BenchmarkMetrics",
4139
"BenchmarkSchedulerStats",
4240
"BenchmarkT",
4341
"Benchmarker",
44-
"BenchmarkerProgressDisplay",
45-
"BenchmarkerResult",
46-
"BenchmarkerTaskProgressState",
42+
"BenchmarkerProgress",
43+
"BenchmarkerProgressGroup",
4744
"ConcurrentProfile",
4845
"GenerativeBenchmark",
49-
"GenerativeBenchmarkAggregator",
50-
"GenerativeBenchmarker",
51-
"GenerativeBenchmarksConsole",
46+
"GenerativeBenchmarkerConsole",
5247
"GenerativeBenchmarksReport",
48+
"GenerativeConsoleBenchmarkerProgress",
5349
"GenerativeMetrics",
5450
"GenerativeRequestStats",
55-
"GenerativeTextBenchmarkerProgressDisplay",
56-
"GenerativeTextBenchmarkerTaskProgressState",
57-
"GenerativeTextErrorStats",
51+
"GenerativeRequestsAggregator",
5852
"Profile",
5953
"ProfileType",
60-
"StatusBreakdown",
54+
"SchedulerStatsAggregator",
6155
"SweepProfile",
6256
"SynchronousProfile",
6357
"ThroughputProfile",
6458
"benchmark_generative_text",
65-
"create_profile",
6659
"reimport_benchmarks_report",
6760
]

0 commit comments

Comments
 (0)