Skip to content

Commit 515a1db

Browse files
author
chibu
committed
default config
1 parent e60aab1 commit 515a1db

File tree

2 files changed

+2
-5
lines changed

2 files changed

+2
-5
lines changed

examples/guidellm_example.py

Lines changed: 2 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -11,10 +11,9 @@
1111
GUIDELLM__MAX_CONCURRENCY=256,
1212
GUIDELLM__REQUEST_TIMEOUT=21600,
1313
target="http://localhost:8000/v1",
14-
#data_type="emulated",
1514
max_seconds=30,
16-
#config = "benchmarking_32k",
17-
#data="prompt_tokens=128,output_tokens=128",
15+
scenario = "benchmarking_32kz",
16+
data="prompt_tokens=128,output_tokens=128",
1817
branch = "update_guidellm",
1918
vllm_kwargs={"enable-chunked-prefill": True}
2019
)

src/automation/configs.py

Lines changed: 0 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,5 @@
1-
#DEFAULT_DOCKER_IMAGE = "498127099666.dkr.ecr.us-east-1.amazonaws.com/mlops/k8s-research-cuda12_5:latest"
21
DEFAULT_DOCKER_IMAGE = "498127099666.dkr.ecr.us-east-1.amazonaws.com/mlops/k8s-research-cuda12_8:latest"
32
#DEFAULT_OUTPUT_URI = "gs://neuralmagic-clearml"
43
DEFAULT_OUTPUT_URI = "http://10.128.20.60:8081"
54
DEFAULT_RESEARCH_BRANCH = "main"
65
DEFAULT_GUIDELLM_SCENARIO = "chat"
7-
#DEFAULT_GUIDELLM_SCENARIO = "benchmarking_summarization"

0 commit comments

Comments
 (0)