File tree Expand file tree Collapse file tree 2 files changed +2
-5
lines changed Expand file tree Collapse file tree 2 files changed +2
-5
lines changed Original file line number Diff line number Diff line change 11
11
GUIDELLM__MAX_CONCURRENCY = 256 ,
12
12
GUIDELLM__REQUEST_TIMEOUT = 21600 ,
13
13
target = "http://localhost:8000/v1" ,
14
- #data_type="emulated",
15
14
max_seconds = 30 ,
16
- #config = "benchmarking_32k ",
17
- # data="prompt_tokens=128,output_tokens=128",
15
+ scenario = "benchmarking_32kz " ,
16
+ data = "prompt_tokens=128,output_tokens=128" ,
18
17
branch = "update_guidellm" ,
19
18
vllm_kwargs = {"enable-chunked-prefill" : True }
20
19
)
Original file line number Diff line number Diff line change 1
- #DEFAULT_DOCKER_IMAGE = "498127099666.dkr.ecr.us-east-1.amazonaws.com/mlops/k8s-research-cuda12_5:latest"
2
1
DEFAULT_DOCKER_IMAGE = "498127099666.dkr.ecr.us-east-1.amazonaws.com/mlops/k8s-research-cuda12_8:latest"
3
2
#DEFAULT_OUTPUT_URI = "gs://neuralmagic-clearml"
4
3
DEFAULT_OUTPUT_URI = "http://10.128.20.60:8081"
5
4
DEFAULT_RESEARCH_BRANCH = "main"
6
5
DEFAULT_GUIDELLM_SCENARIO = "chat"
7
- #DEFAULT_GUIDELLM_SCENARIO = "benchmarking_summarization"
You can’t perform that action at this time.
0 commit comments