File tree Expand file tree Collapse file tree 3 files changed +35
-17
lines changed
gke-workflow/jax-vllm-offloading
workflows/jax-vllm-offloading Expand file tree Collapse file tree 3 files changed +35
-17
lines changed Original file line number Diff line number Diff line change 1- kubectl apply -f deployment/gateway-pod.yml
2- kubectl apply -f deployment/gateway-svc.yml
1+ kubectl apply -f transfer/deployment/gateway-pod.yml
2+ kubectl apply -f transfer/deployment/gateway-svc.yml
33
44kubectl apply -f huggingface-secret.yml
55
6- kubectl apply -f deployment/rollout.yml
7- kubectl apply -f deploymeny/trainer.yml
6+ kubectl apply -f transfer/deployment/rollout.yml
7+ kubectl apply -f transfer/deployment/trainer.yml
Original file line number Diff line number Diff line change 1+ name : JAX-vLLM offloading
2+
3+ on :
4+ workflow_call :
5+ inputs :
6+ JAX_VLLM_OFFLOADING_IMAGE :
7+ type : string
8+ description : MaxText image from ghcr.io/nvidia
9+ default : ghcr.io/nvidia/jax-toolbox-internal:19461214142-jio-amd64
10+ required : false
11+ pull_request :
12+ types :
13+ - opened
14+ - reopened
15+ - ready_for_review
16+ - synchronize
17+ paths :
18+ - 'jax-inference-offloading/**'
19+ - '.github/gke-workflow/jax-vllm-offloading/**'
20+ - '.github/workflows/jax-vllm-offloading/**'
21+
22+ jobs :
23+ jax-vllm-offloading-transfer-gke-xpk :
24+ uses : .github/workflows/jax-vllm-offloading/gke_transfer.yml
25+ # needs: build # .github/workflows/jio.yaml
26+ with :
27+ # JAX_VLLM_OFFLOADING_IMAGE: ${{ needs.build.outputs.DOCKER_TAG_FINAL }}
28+ JAX_VLLM_OFFLOADING_IMAGE : ghcr.io/nvidia/jax-toolbox-internal:19461214142-jio-amd64
29+ secrets : inherit
Original file line number Diff line number Diff line change 1- name : ~Test JAX-vLLM offloading transfer (GKE, XPK)
1+ name : JAX-vLLM offloading transfer (GKE, XPK)
22
33on :
44 workflow_call :
88 description : MaxText image from ghcr.io/nvidia
99 default : ghcr.io/nvidia/jax-toolbox-internal:19461214142-jio-amd64
1010 required : false
11- pull_request :
12- types :
13- - opened
14- - reopened
15- - ready_for_review
16- - synchronize
17- paths :
18- - '.github/workflows/_test_jax_vllm_offloading.yaml'
19- - '.github/gke-workflow/jax-vllm-offloading/**'
20- - 'jax-inference-offloading/**'
2111
2212jobs :
2313 jax-vllm-offloading-transfer-gke-xpk :
2414 runs-on : gke-a3mega
2515
2616 env :
2717 WORKLOAD_NAME_PREFIX : gke-jax-vllm-transfer
28- # JAX_VLLM_OFFLOADING_IMAGE: ${{ inputs.JAX_VLLM_OFFLOADING_IMAGE }}
29- JAX_VLLM_OFFLOADING_IMAGE : ghcr.io/nvidia/jax-toolbox-internal:19461214142-jio-amd64
18+ JAX_VLLM_OFFLOADING_IMAGE : ${{ inputs.JAX_VLLM_OFFLOADING_IMAGE }}
3019
3120 NUM_NODES : 2
3221 ENV_FILE : ../../.github/gke-workflow/jax-vllm-offloading/transfer/jobset.env
You can’t perform that action at this time.
0 commit comments