File tree Expand file tree Collapse file tree 6 files changed +18
-18
lines changed
tgi-llama-405b-deployment/config
tgi-llama-vision-deployment/config
tgi-multi-lora-deployment/config Expand file tree Collapse file tree 6 files changed +18
-18
lines changed Original file line number Diff line number Diff line change @@ -32,10 +32,10 @@ spec:
3232 - name : PORT
3333 value : " 8080"
3434 volumeMounts :
35- - mountPath : /data
36- name : data
35+ - mountPath : /tmp
36+ name : tmp
3737 volumes :
38- - name : data
38+ - name : tmp
3939 emptyDir : {}
4040 nodeSelector :
4141 cloud.google.com/compute-class : " Performance"
Original file line number Diff line number Diff line change @@ -30,14 +30,14 @@ spec:
3030 volumeMounts :
3131 - mountPath : /dev/shm
3232 name : dshm
33- - mountPath : /data
34- name : data
33+ - mountPath : /tmp
34+ name : tmp
3535 volumes :
3636 - name : dshm
3737 emptyDir :
3838 medium : Memory
3939 sizeLimit : 1Gi
40- - name : data
40+ - name : tmp
4141 emptyDir : {}
4242 nodeSelector :
4343 cloud.google.com/gke-accelerator : nvidia-tesla-t4
Original file line number Diff line number Diff line change @@ -35,14 +35,14 @@ spec:
3535 volumeMounts :
3636 - mountPath : /dev/shm
3737 name : dshm
38- - mountPath : /data
39- name : data
38+ - mountPath : /tmp
39+ name : tmp
4040 volumes :
4141 - name : dshm
4242 emptyDir :
4343 medium : Memory
4444 sizeLimit : 1Gi
45- - name : data
45+ - name : tmp
4646 emptyDir : {}
4747 nodeSelector :
4848 cloud.google.com/gke-accelerator : nvidia-l4
Original file line number Diff line number Diff line change @@ -35,14 +35,14 @@ spec:
3535 volumeMounts :
3636 - mountPath : /dev/shm
3737 name : dshm
38- - mountPath : /data
39- name : data
38+ - mountPath : /tmp
39+ name : tmp
4040 volumes :
4141 - name : dshm
4242 emptyDir :
4343 medium : Memory
4444 sizeLimit : 1Gi
45- - name : data
45+ - name : tmp
4646 emptyDir : {}
4747 nodeSelector :
4848 cloud.google.com/gke-accelerator : nvidia-h100-80gb
Original file line number Diff line number Diff line change @@ -30,14 +30,14 @@ spec:
3030 volumeMounts :
3131 - mountPath : /dev/shm
3232 name : dshm
33- - mountPath : /data
34- name : data
33+ - mountPath : /tmp
34+ name : tmp
3535 volumes :
3636 - name : dshm
3737 emptyDir :
3838 medium : Memory
3939 sizeLimit : 1Gi
40- - name : data
40+ - name : tmp
4141 emptyDir : {}
4242 nodeSelector :
4343 cloud.google.com/gke-accelerator : nvidia-l4
Original file line number Diff line number Diff line change @@ -37,14 +37,14 @@ spec:
3737 volumeMounts :
3838 - mountPath : /dev/shm
3939 name : dshm
40- - mountPath : /data
41- name : data
40+ - mountPath : /tmp
41+ name : tmp
4242 volumes :
4343 - name : dshm
4444 emptyDir :
4545 medium : Memory
4646 sizeLimit : 1Gi
47- - name : data
47+ - name : tmp
4848 emptyDir : {}
4949 nodeSelector :
5050 cloud.google.com/gke-accelerator : nvidia-l4
You can’t perform that action at this time.
0 commit comments