File tree Expand file tree Collapse file tree 3 files changed +5
-5
lines changed Expand file tree Collapse file tree 3 files changed +5
-5
lines changed Original file line number Diff line number Diff line change @@ -42,7 +42,7 @@ This document defines the process for releasing Gateway API Inference Extension.
42
42
```shell
43
43
export VLLM_GPU=0.9.2
44
44
export VLLM_CPU=0.9.3
45
- export VLLM_SIM=0.1.2
45
+ export VLLM_SIM=0.3.0
46
46
```
47
47
48
48
## Release Process
Original file line number Diff line number Diff line change 14
14
spec:
15
15
containers:
16
16
- name: vllm-sim
17
- image: ghcr.io/llm-d/llm-d-inference-sim:v0.1.2
17
+ image: ghcr.io/llm-d/llm-d-inference-sim:v0.3.0
18
18
imagePullPolicy: Always
19
19
args:
20
20
- --model
23
23
- "8000"
24
24
- --max-loras
25
25
- "2"
26
- - --lora
27
- - food-review-1
26
+ - --lora-modules
27
+ - '{"name": "food-review-1"}'
28
28
env:
29
29
- name: POD_NAME
30
30
valueFrom:
Original file line number Diff line number Diff line change @@ -35,7 +35,7 @@ VLLM_GPU="${VLLM_GPU:-0.9.1}"
35
35
# The CPU image is from https://gallery.ecr.aws/q9t5s3a7/vllm-cpu-release-repo
36
36
VLLM_CPU="${VLLM_CPU:-0.9.1}"
37
37
# The sim image is from https://github.com/llm-d/llm-d-inference-sim/pkgs/container/llm-d-inference-sim
38
- VLLM_SIM="${VLLM_SIM:-0.1.1}"
38
+ VLLM_SIM="${VLLM_SIM:-0.3.0}"
39
39
40
40
echo "Using release tag: ${RELEASE_TAG}"
41
41
echo "Using vLLM GPU image version: ${VLLM_GPU}"
You can’t perform that action at this time.
0 commit comments