Skip to content

Commit 1e4c964

Browse files
update to use HF checkpoint for unscanning
1 parent 9edbc0f commit 1e4c964

File tree

2 files changed

+3
-25
lines changed

2 files changed

+3
-25
lines changed

inference/trillium/JetStream-Maxtext/Llama-4-Maverick-17B-128E/prepare-model/templates/model-serve-downloader.yaml

Lines changed: 2 additions & 24 deletions
Original file line number | Diff line number | Diff line change
@@ -83,29 +83,6 @@ spec:
8383
8484
huggingface-cli download {{ .Values.model.name }} --local-dir ${BASE_MODEL_PATH} --local-dir-use-symlinks False
8585
86-
# Rename weights to expected format
87-
88-
echo "Rename weights in ${BASE_MODEL_PATH}"
89-
found_files=0
90-
for old_filepath in "${BASE_MODEL_PATH}"/consolidated.??.pth; do
91-
if [ -f "$old_filepath" ]; then
92-
found_files=$((found_files + 1))
93-
old_filename=$(basename "$old_filepath")
94-
new_filename=$(echo "$old_filename" | sed 's/^consolidated/llama4-17b-128e/')
95-
new_filepath="${BASE_MODEL_PATH}/${new_filename}"
96-
97-
if [ "$old_filepath" != "$new_filepath" ]; then
98-
mv -v "$old_filepath" "$new_filepath"
99-
echo "Renamed $old_filepath to $new_filepath"
100-
else
101-
echo "File already named correctly: $old_filepath"
102-
fi
103-
fi
104-
done
105-
if [ "$found_files" -eq 0 ]; then
106-
echo "No consolidated.*.pth files found for renaming in ${BASE_MODEL_PATH}."
107-
fi
108-
10986
echo "Starting GCSFuse Mount"
11087
mkdir -p /gcs
11188
gcsfuse --client-protocol http2 ${GCS_FUSE_BUCKET} /gcs
@@ -115,7 +92,8 @@ spec:
11592
JAX_PLATFORMS=cpu python3 -m MaxText.llama4_ckpt_unscanned \
11693
--base-model-path ${BASE_MODEL_PATH} \
11794
--maxtext-model-path ${CHECKPOINT_TPU_UNSCANNED} \
118-
--model-size ${MODEL_SIZE}
95+
--model-size ${MODEL_SIZE} \
96+
--huggingface-checkpoint
11997
12098
gsutil -m cp -r ${CHECKPOINT_TPU_UNSCANNED} /gcs/{{ .Values.model.name }}/output/unscanned_ckpt/checkpoints/
12199

inference/trillium/JetStream-Maxtext/Llama-4-Maverick-17B-128E/values.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -22,7 +22,7 @@ huggingface:
2222
token: "hf_api_token"
2323

2424
model:
25-
name: meta-llama/Llama-4-Maverick-17B-128E-Original
25+
name: meta-llama/Llama-4-Maverick-17B-128E
2626

2727
job:
2828
image:

0 commit comments

Comments (0)