Skip to content

Commit 3fb446a

Browse files
authored
gemma changes (#417)
1 parent 185b893 commit 3fb446a

File tree

1 file changed

+6
-2
lines changed

1 file changed

+6
-2
lines changed

gemma/gemma-3-27b-it/config.yaml

Lines changed: 6 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
base_image:
2-
image: public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:d3286757f63d1baeccb34cb7dd272cfdc87e0952
2+
image: public.ecr.aws/q9t5s3a7/vllm-ci-postmerge-repo:f5d3acd47466f094beb36f7a5d05520466713f93
33
build_commands:
4-
- pip install git+https://github.com/huggingface/transformers@994cad2790af71d87c1cdd459a8484dada2c7115
4+
- pip install git+https://github.com/huggingface/transformers@071a161d3e38f56dbda2743b979f0afeed2cd4f1
55
model_metadata:
66
repo_id: google/gemma-3-27b-it
77
example_model_input: {
@@ -27,6 +27,8 @@ model_metadata:
2727
"max_tokens": 512,
2828
"temperature": 0.5
2929
}
30+
tags:
31+
- openai-compatible
3032
docker_server:
3133
start_command: sh -c "VLLM_USE_V1=1 HF_TOKEN=$(cat /secrets/hf_access_token) vllm
3234
serve google/gemma-3-27b-it --served-model-name gemma --max-num-seqs 8 --max-model-len
@@ -45,6 +47,8 @@ requirements:
4547
resources:
4648
accelerator: H100
4749
use_gpu: true
50+
secrets:
51+
hf_access_token: null
4852
runtime:
4953
health_checks:
5054
restart_check_delay_seconds: 300 # Waits 5 minutes after deployment before starting health checks

0 commit comments

Comments (0)