Skip to content

Commit 64c2abc

Browse files
committed
Refactor CI workflows
1 parent b64763f commit 64c2abc

File tree

3 files changed

+35
-17
lines changed

3 files changed

+35
-17
lines changed
Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
1-
kubectl apply -f deployment/gateway-pod.yml
2-
kubectl apply -f deployment/gateway-svc.yml
1+
kubectl apply -f transfer/deployment/gateway-pod.yml
2+
kubectl apply -f transfer/deployment/gateway-svc.yml
3 3

4 4
kubectl apply -f huggingface-secret.yml
5 5

6-
kubectl apply -f deployment/rollout.yml
7-
kubectl apply -f deploymeny/trainer.yml
6+
kubectl apply -f transfer/deployment/rollout.yml
7+
kubectl apply -f transfer/deployment/trainer.yml
Lines changed: 29 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,29 @@
1+
name: JAX-vLLM offloading
2+
3+
on:
4+
workflow_call:
5+
inputs:
6+
JAX_VLLM_OFFLOADING_IMAGE:
7+
type: string
8+
description: MaxText image from ghcr.io/nvidia
9+
default: ghcr.io/nvidia/jax-toolbox-internal:19461214142-jio-amd64
10+
required: false
11+
pull_request:
12+
types:
13+
- opened
14+
- reopened
15+
- ready_for_review
16+
- synchronize
17+
paths:
18+
- 'jax-inference-offloading/**'
19+
- '.github/gke-workflow/jax-vllm-offloading/**'
20+
- '.github/workflows/jax-vllm-offloading/**'
21+
22+
jobs:
23+
jax-vllm-offloading-transfer-gke-xpk:
24+
uses: .github/workflows/jax-vllm-offloading/gke_transfer.yml
25+
# needs: build # .github/workflows/jio.yaml
26+
with:
27+
# JAX_VLLM_OFFLOADING_IMAGE: ${{ needs.build.outputs.DOCKER_TAG_FINAL }}
28+
JAX_VLLM_OFFLOADING_IMAGE: ghcr.io/nvidia/jax-toolbox-internal:19461214142-jio-amd64
29+
secrets: inherit

.github/workflows/_test_jax_vllm_offloading.yml renamed to .github/workflows/jax-vllm-offloading/gke_transfer.yml

Lines changed: 2 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
name: ~Test JAX-vLLM offloading transfer (GKE, XPK)
1+
name: JAX-vLLM offloading transfer (GKE, XPK)
2 2

3 3
on:
4 4
workflow_call:
@@ -8,25 +8,14 @@ on:
8 8
description: MaxText image from ghcr.io/nvidia
9 9
default: ghcr.io/nvidia/jax-toolbox-internal:19461214142-jio-amd64
10 10
required: false
11-
pull_request:
12-
types:
13-
- opened
14-
- reopened
15-
- ready_for_review
16-
- synchronize
17-
paths:
18-
- '.github/workflows/_test_jax_vllm_offloading.yaml'
19-
- '.github/gke-workflow/jax-vllm-offloading/**'
20-
- 'jax-inference-offloading/**'
21 11

22 12
jobs:
23 13
jax-vllm-offloading-transfer-gke-xpk:
24 14
runs-on: gke-a3mega
25 15

26 16
env:
27 17
WORKLOAD_NAME_PREFIX: gke-jax-vllm-transfer
28-
#JAX_VLLM_OFFLOADING_IMAGE: ${{ inputs.JAX_VLLM_OFFLOADING_IMAGE }}
29-
JAX_VLLM_OFFLOADING_IMAGE: ghcr.io/nvidia/jax-toolbox-internal:19461214142-jio-amd64
18+
JAX_VLLM_OFFLOADING_IMAGE: ${{ inputs.JAX_VLLM_OFFLOADING_IMAGE }}
30 19

31 20
NUM_NODES: 2
32 21
ENV_FILE: ../../.github/gke-workflow/jax-vllm-offloading/transfer/jobset.env

0 commit comments

Comments
 (0)