Skip to content

Commit 3697b30

Browse files
Pre CR fixes
1 parent 6dd313d commit 3697b30

File tree

4 files changed

+6
-5
lines changed

4 files changed

+6
-5
lines changed

README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -147,7 +147,7 @@ The `guidellm benchmark` command is used to run benchmarks against a generative
147147

148148
- `--max-requests`: Sets the maximum number of requests for each benchmark run. If not provided, the benchmark will run until `--max-seconds` is reached or the dataset is exhausted.
149149

150-
- `--max-error-rate`: The maximum error rate after which a benchmark will stop. Applicable only for finite deterministic scenarios i.e `rate_type` is `constant` and `--max-seconds` exists OR `--max-requests` exists OR the dataset is finite. If `--max-error-rate` is `None`, benchmarks will continue regardless of error rate.
150+
- `--max-error-rate`: The maximum error rate after which a benchmark will stop. Applicable only for finite deterministic scenarios, i.e., `rate_type` is `constant` and `--max-seconds` exists OR `--max-requests` exists OR the dataset is finite. If `--max-error-rate` is `None` or not applicable, benchmarks will continue regardless of error rate.
151151

152152
- `--warmup-percent`: Specifies the percentage of the benchmark to treat as a warmup phase. Requests during this phase are excluded from the final results.
153153

src/guidellm/__main__.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -170,7 +170,7 @@ def cli():
170170
"The maximum error rate after which a benchmark will stop. "
171171
"Applicable only for finite deterministic scenarios i.e rate_type is 'constant' and 'max_seconds' exists OR "
172172
"'max_requests' exists OR the dataset is finite. "
173-
"If None, benchmarks will continue regardless of error rate."
173+
"If None or not applicable, benchmarks will continue regardless of error rate."
174174
),
175175
)
176176
@click.option(

src/guidellm/benchmark/benchmark.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -710,7 +710,7 @@ def from_stats(
710710
*["incomplete"] * len(incomplete), # type: ignore[list-item]
711711
*["error"] * len(errored), # type: ignore[list-item]
712712
]
713-
start_time = min(req.start_time for req in total) # ToDo: Fix if total is empty
713+
start_time = min(req.start_time for req in total)
714714
end_time = max(req.end_time for req in total)
715715

716716
total_with_prompt, total_types_with_prompt = (

src/guidellm/scheduler/scheduler.py

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -102,7 +102,8 @@ async def run(
102102
If None, then no limit is set and either the iterator must be exhaustible
103103
or the max_number must be set.
104104
:param max_error_rate: The maximum error rate after which the scheduler shuts down.
105-
If not provided a default of 5% i.e 0.05 is used.
105+
Only applicable in benchmarks with a finite, deterministic number of requests.
106+
If None or not applicable, the scheduler will continue regardless of errors.
106107
:return: An asynchronous generator that yields SchedulerResult objects.
107108
Each SchedulerResult object contains information about the request,
108109
the response, and the run information.
@@ -130,7 +131,7 @@ async def run(
130131
manager, executor, scheduling_strategy, max_error_rate is not None
131132
)
132133
if shutdown_event:
133-
assert not shutdown_event.is_set()
134+
assert not shutdown_event.is_set(), "shutdown_event is set before starting scheduling"
134135
run_info, requests_iter, times_iter = self._run_setup(
135136
futures, scheduling_strategy, max_number, max_duration, max_error_rate
136137
)

0 commit comments

Comments
 (0)