Skip to content

Commit c4031be

Browse files
committed
test2
1 parent b49fb52 commit c4031be

File tree

1 file changed

+5
-1
lines changed

1 file changed

+5
-1
lines changed

.ci/scripts/utils.sh

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -146,10 +146,14 @@ download_stories_model_artifacts() {
146146
# Download stories110M.pt from Hugging Face and tokenizer.model from GitHub
147147
curl -Ls "https://huggingface.co/karpathy/tinyllamas/resolve/main/stories110M.pt" --output stories110M.pt
148148
curl -Ls "https://raw.githubusercontent.com/karpathy/llama2.c/master/tokenizer.model" --output tokenizer.model
149+
150+
# Create tokenizer.bin.
151+
echo "Creating tokenizer.bin"
152+
$PYTHON_EXECUTABLE -m extension.llm.tokenizer.tokenizer -t tokenizer.model -o tokenizer.bin
153+
149154
# Create params.json file
150155
touch params.json
151156
echo '{"dim": 768, "multiple_of": 32, "n_heads": 12, "n_layers": 12, "norm_eps": 1e-05, "vocab_size": 32000}' > params.json
152-
python -m extension.llm.tokenizer.tokenizer -t tokenizer.model -o tokenizer.bin
153157
}
154158

155159
do_not_use_nightly_on_ci() {

0 commit comments

Comments
 (0)