File tree Expand file tree Collapse file tree 4 files changed +6
-5
lines changed
inference/trillium/JetStream-Maxtext
Llama-4-Maverick-17B-128E
Llama-4-Scout-17B-16E/docker Expand file tree Collapse file tree 4 files changed +6
-5
lines changed Original file line number Diff line number Diff line change @@ -275,6 +275,7 @@ The recipe uses the helm chart to run the above steps.
275275 helm install -f values.yaml \
276276 --set volumes.gcsMounts[0].bucketName=${GCS_BUCKET} \
277277 --set clusterName=$CLUSTER_NAME \
278+ --set pathwaysDir="gs://${GCS_BUCKET}" \
278279 --set job.image.repository=${ARTIFACT_REGISTRY}/${JETSTREAM_MAXTEXT_IMAGE} \
279280 --set job.image.tag=${JETSTREAM_MAXTEXT_VERSION} \
280281 --set convert_hf_ckpt=false \
Original file line number Diff line number Diff line change 2323 - type : ct6e-standard-4t
2424 topology : 8x8
2525 numSlices : 1
26- pathwaysDir : "gs://jacobplatin"
26+ pathwaysDir : "{{ .Values.pathwaysDir }}"
2727 controller :
2828 deploymentMode : colocate_head_with_workers
2929 mainContainerName : jetstream
Original file line number Diff line number Diff line change @@ -22,7 +22,7 @@ huggingface:
2222 token : " hf_api_token"
2323
2424model :
25- name : meta-llama/Llama-4-Scout-17B-16E-Original
25+ name : meta-llama/Llama-4-Maverick-17B-128E-Original
2626
2727job :
2828 image :
@@ -46,7 +46,7 @@ jetstream:
4646convert_hf_ckpt : true
4747
4848maxtext_config :
49- load_parameters_path : "gs://jacobplatin/llama4/maverick-orbax-checkpoints/48-layer-unscanned/0/items"
49+ load_parameters_path : $CHECKPOINT_TPU_UNSCANNED
5050 max_prefill_predict_length : 128
5151 max_target_length : 256
5252 async_checkpointing : false
Original file line number Diff line number Diff line change @@ -16,10 +16,10 @@ steps:
1616- name : ' gcr.io/cloud-builders/docker'
1717 args :
1818 - ' build'
19- - '--tag=${_ARTIFACT_REGISTRY}/maxtext-jetstream:latest'
19+ - '--tag=${_ARTIFACT_REGISTRY}/${_JETSTREAM_MAXTEXT_IMAGE}:${_JETSTREAM_MAXTEXT_VERSION}'
2020 - ' --file=Dockerfile'
2121 - ' .'
2222 automapSubstitutions : true
2323
2424images :
25- - '${_ARTIFACT_REGISTRY}/maxtext-jetstream:latest'
25+ - '${_ARTIFACT_REGISTRY}/${_JETSTREAM_MAXTEXT_IMAGE}:${_JETSTREAM_MAXTEXT_VERSION}'
You can’t perform that action at this time.
0 commit comments