Skip to content

Commit 0b4cbd2

Browse files
committed
use official dockerhub image and update example test
1 parent 24a601a commit 0b4cbd2

File tree

2 files changed

+9
-9
lines changed

2 files changed

+9
-9
lines changed

.github/workflows/pr-vllm.yml

Lines changed: 8 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -301,21 +301,21 @@ jobs:
301301
# Examples Test # 30min
302302
cd /workdir/examples
303303
pip install tensorizer # for tensorizer test
304-
python3 offline_inference/basic/generate.py --model facebook/opt-125m
305-
# python3 offline_inference/basic/generate.py --model meta-llama/Llama-2-13b-chat-hf --cpu-offload-gb 10
304+
# python3 offline_inference/basic/generate.py --model facebook/opt-125m
305+
python3 offline_inference/basic/generate.py --model meta-llama/Llama-2-13b-chat-hf --cpu-offload-gb 10
306306
python3 offline_inference/basic/chat.py
307307
python3 offline_inference/prefix_caching.py
308308
python3 offline_inference/llm_engine_example.py
309309
python3 offline_inference/audio_language.py --seed 0
310310
python3 offline_inference/vision_language.py --seed 0
311311
python3 offline_inference/vision_language_pooling.py --seed 0
312312
python3 offline_inference/vision_language_multi_image.py --seed 0
313-
VLLM_USE_V1=0 python3 others/tensorize_vllm_model.py --model facebook/opt-125m serialize --serialized-directory /tmp/ --suffix v1 && python3 others/tensorize_vllm_model.py --model facebook/opt-125m deserialize --path-to-tensors /tmp/vllm/facebook/opt-125m/v1/model.tensors
314-
python3 offline_inference/encoder_decoder_multimodal.py --model-type whisper --seed 0
315-
python3 offline_inference/basic/classify.py
316-
python3 offline_inference/basic/embed.py
317-
python3 offline_inference/basic/score.py
318-
python3 offline_inference/simple_profiling.py
313+
# python3 offline_inference/spec_decode.py --test --method eagle --num_spec_tokens 3 --dataset-name hf --dataset-path philschmid/mt-bench --num-prompts 80 --temp 0 --top-p 1.0 --top-k -1 --tp 1 --enable-chunked-prefill --max-model-len 2048
314+
# python3 offline_inference/encoder_decoder_multimodal.py --model-type whisper --seed 0
315+
# python3 offline_inference/basic/classify.py
316+
# python3 offline_inference/basic/embed.py
317+
# python3 offline_inference/basic/score.py
318+
# python3 offline_inference/simple_profiling.py
319319
'
320320
321321
- name: Cleanup container and images

docker/vllm/Dockerfile

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
FROM public.ecr.aws/q9t5s3a7/vllm-release-repo:439368496db48d8f992ba8c606a0c0b1eebbfa69 as base
1+
FROM docker.io/vllm/vllm-openai:v0.11.1 as base
22
ARG PYTHON="python3"
33
LABEL maintainer="Amazon AI"
44
ARG EFA_VERSION="1.43.3"

0 commit comments

Comments
 (0)