Skip to content

Commit 8f94d30

Browse files
authored
Merge branch 'main' into example1
2 parents 6300876 + 9573703 commit 8f94d30

File tree

18 files changed

+219
-200
lines changed

18 files changed

+219
-200
lines changed

.github/workflows/main.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -217,7 +217,7 @@ jobs:
217217
uses: peaceiris/actions-gh-pages@v3
218218
with:
219219
github_token: ${{ secrets.GITHUB_TOKEN }}
220-
publish_dir: ./ui/out
220+
publish_dir: ./src/ui/out
221221
destination_dir: ui/dev
222222
keep_files: false
223223
user_name: ${{ github.actor }}

.github/workflows/nightly.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -238,7 +238,7 @@ jobs:
238238
uses: peaceiris/actions-gh-pages@v3
239239
with:
240240
github_token: ${{ secrets.GITHUB_TOKEN }}
241-
publish_dir: ./ui/out
241+
publish_dir: ./src/ui/out
242242
destination_dir: ui/nightly
243243
keep_files: false
244244
user_name: ${{ github.actor }}

.github/workflows/release-candidate.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -282,7 +282,7 @@ jobs:
282282
uses: peaceiris/actions-gh-pages@v3
283283
with:
284284
github_token: ${{ secrets.GITHUB_TOKEN }}
285-
publish_dir: ./ui/out
285+
publish_dir: ./src/ui/out
286286
destination_dir: ui/release/latest
287287
keep_files: false
288288
user_name: ${{ github.actor }}

.github/workflows/release.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -281,7 +281,7 @@ jobs:
281281
uses: peaceiris/actions-gh-pages@v3
282282
with:
283283
github_token: ${{ secrets.GITHUB_TOKEN }}
284-
publish_dir: ./ui/out
284+
publish_dir: ./src/ui/out
285285
destination_dir: ui/latest
286286
keep_files: false
287287
user_name: ${{ github.actor }}

.pre-commit-config.yaml

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -11,6 +11,7 @@ repos:
1111
hooks:
1212
- id: pdm-lock-check
1313
name: check lock file matches pyproject
14+
entry: sh -c "pdm lock -v --check || pdm lock --update-reuse"
1415
- repo: https://github.com/astral-sh/ruff-pre-commit
1516
rev: v0.11.7
1617
hooks:

src/guidellm/benchmark/aggregator.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -32,11 +32,11 @@
3232
GenerationRequest,
3333
GenerativeRequestLoaderDescription,
3434
RequestLoaderDescription,
35+
RequestT,
36+
ResponseT,
3537
)
3638
from guidellm.scheduler import (
3739
GenerativeRequestsWorkerDescription,
38-
RequestT,
39-
ResponseT,
4040
SchedulerRequestResult,
4141
WorkerDescription,
4242
)

src/guidellm/benchmark/benchmarker.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -27,12 +27,12 @@
2727
GenerationRequest,
2828
GenerativeRequestLoaderDescription,
2929
RequestLoaderDescription,
30+
RequestT,
31+
ResponseT,
3032
)
3133
from guidellm.scheduler import (
3234
GenerativeRequestsWorker,
3335
RequestsWorker,
34-
RequestT,
35-
ResponseT,
3636
Scheduler,
3737
SchedulerRequestResult,
3838
SchedulingStrategy,

src/guidellm/config.py

Lines changed: 7 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,5 @@
11
import json
2+
import os
23
from collections.abc import Sequence
34
from enum import Enum
45
from typing import Literal, Optional
@@ -131,8 +132,12 @@ class Settings(BaseSettings):
131132

132133
# Scheduler settings
133134
max_concurrency: int = 512
134-
max_worker_processes: int = 10
135-
max_add_requests_per_loop: int = 20
135+
max_worker_processes: int = Field(
136+
# use number of CPUs - 1, but at least 10
137+
default_factory=lambda: max((os.cpu_count() or 1) - 1, 10)
138+
)
139+
min_queued_requests: int = 20
140+
scheduler_start_delay: float = 5
136141

137142
# Data settings
138143
dataset: DatasetSettings = DatasetSettings()

src/guidellm/request/__init__.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -5,11 +5,14 @@
55
RequestLoaderDescription,
66
)
77
from .request import GenerationRequest
8+
from .types import RequestT, ResponseT
89

910
__all__ = [
1011
"GenerationRequest",
1112
"GenerativeRequestLoader",
1213
"GenerativeRequestLoaderDescription",
1314
"RequestLoader",
1415
"RequestLoaderDescription",
16+
"RequestT",
17+
"ResponseT",
1518
]

src/guidellm/request/loader.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -30,10 +30,10 @@ class RequestLoaderDescription(StandardBaseModel):
3030

3131
class RequestLoader(Iterable):
3232
@abstractmethod
33-
def __iter__(self): ...
33+
def __iter__(self) -> Iterator: ...
3434

3535
@abstractmethod
36-
def __len__(self): ...
36+
def __len__(self) -> int: ...
3737

3838
@property
3939
@abstractmethod

0 commit comments

Comments
 (0)