File tree Expand file tree Collapse file tree 3 files changed +6
-6
lines changed
Expand file tree Collapse file tree 3 files changed +6
-6
lines changed Original file line number Diff line number Diff line change @@ -40,7 +40,7 @@ roleRef:
4040 kind : ClusterRole
4141 name : pod-read
4242---
43- apiVersion : inference.networking.x-k8s.io/v1alpha1
43+ apiVersion : inference.networking.x-k8s.io/v1alpha2
4444kind : InferencePool
4545metadata :
4646 labels :
Original file line number Diff line number Diff line change 1- apiVersion : inference.networking.x-k8s.io/v1alpha1
1+ apiVersion : inference.networking.x-k8s.io/v1alpha2
22kind : InferenceModel
33metadata :
44 name : inferencemodel-sample
Original file line number Diff line number Diff line change 1- apiVersion : inference.networking.x-k8s.io/v1alpha1
1+ apiVersion : inference.networking.x-k8s.io/v1alpha2
22kind : InferencePool
33metadata :
44 name : vllm-llama2-7b-pool
1010 extensionRef :
1111 name : epp
1212---
13- apiVersion : inference.networking.x-k8s.io/v1alpha1
13+ apiVersion : inference.networking.x-k8s.io/v1alpha2
1414kind : InferenceModel
1515metadata :
1616 name : inferencemodel-sample
2424 - name : sql-lora-1fdg2
2525 weight : 100
2626---
27- apiVersion : inference.networking.x-k8s.io/v1alpha1
27+ apiVersion : inference.networking.x-k8s.io/v1alpha2
2828kind : InferenceModel
2929metadata :
3030 name : inferencemodel-sheddable
3737 - name : sql-lora-1fdg3
3838 weight : 100
3939---
40- apiVersion : inference.networking.x-k8s.io/v1alpha1
40+ apiVersion : inference.networking.x-k8s.io/v1alpha2
4141kind : InferenceModel
4242metadata :
4343 name : inferencemodel-generic
You can’t perform that action at this time.
0 commit comments