@@ -31,27 +31,27 @@ rm -f $WORK_PATH/ggml-model-split*.gguf $WORK_PATH/ggml-model-merge*.gguf
3131# 1. Get a model
3232(
3333cd $WORK_PATH
34- "$ROOT_DIR"/scripts/hf.sh --repo ggml-org/gemma-1.1-2b-it-Q8_0-GGUF --file gemma-1.1-2b-it.Q8_0.gguf
34+ "$ROOT_DIR"/scripts/hf.sh --repo ggml-org/Qwen3-0.6B-GGUF --file Qwen3-0.6B-Q8_0.gguf
3535)
3636echo PASS
3737
3838# 2. Split with max tensors strategy
39- $SPLIT --split-max-tensors 28 $WORK_PATH/gemma-1.1-2b-it.Q8_0.gguf $WORK_PATH/ggml-model-split
39+ $SPLIT --split-max-tensors 28 $WORK_PATH/Qwen3-0.6B-Q8_0.gguf $WORK_PATH/ggml-model-split
4040echo PASS
4141echo
4242
4343# 2b. Test the sharded model is loading properly
44- $MAIN -no-cnv --model $WORK_PATH/ggml-model-split-00001-of-00006.gguf --n-predict 32
44+ $MAIN -no-cnv --model $WORK_PATH/ggml-model-split-00001-of-00012.gguf -p "I believe the meaning of life is" --n-predict 32
4545echo PASS
4646echo
4747
4848# 3. Merge
49- $SPLIT --merge $WORK_PATH/ggml-model-split-00001-of-00006.gguf $WORK_PATH/ggml-model-merge.gguf
49+ $SPLIT --merge $WORK_PATH/ggml-model-split-00001-of-00012.gguf $WORK_PATH/ggml-model-merge.gguf
5050echo PASS
5151echo
5252
5353# 3b. Test the merged model is loading properly
54- $MAIN -no-cnv --model $WORK_PATH/ggml-model-merge.gguf --n-predict 32
54+ $MAIN -no-cnv --model $WORK_PATH/ggml-model-merge.gguf -p "I believe the meaning of life is" --n-predict 32
5555echo PASS
5656echo
5757
@@ -61,12 +61,12 @@ echo PASS
6161echo
6262
6363# 4b. Test the sharded model is loading properly
64- $MAIN -no-cnv --model $WORK_PATH/ggml-model-split-32-tensors-00001-of-00007.gguf --n-predict 32
64+ $MAIN -no-cnv --model $WORK_PATH/ggml-model-split-32-tensors-00001-of-00011.gguf -p "I believe the meaning of life is" --n-predict 32
6565echo PASS
6666echo
6767
6868# 5. Merge
69- # $SPLIT --merge $WORK_PATH/ggml-model-split-32-tensors-00001-of-00006.gguf $WORK_PATH/ggml-model-merge-2.gguf
69+ # $SPLIT --merge $WORK_PATH/ggml-model-split-32-tensors-00001-of-00012.gguf $WORK_PATH/ggml-model-merge-2.gguf
7070# echo PASS
7171# echo
7272
7676# echo
7777
7878# 6. Split with size strategy
79- $SPLIT --split-max-size 2G $WORK_PATH/ggml-model-merge.gguf $WORK_PATH/ggml-model-split-2G
79+ $SPLIT --split-max-size 500M $WORK_PATH/ggml-model-merge.gguf $WORK_PATH/ggml-model-split-500M
8080echo PASS
8181echo
8282
8383# 6b. Test the sharded model is loading properly
84- $MAIN -no-cnv --model $WORK_PATH/ggml-model-split-2G-00001-of-00002.gguf --n-predict 32
84+ $MAIN -no-cnv --model $WORK_PATH/ggml-model-split-500M-00001-of-00002.gguf -p "I believe the meaning of life is" --n-predict 32
8585echo PASS
8686echo
8787
0 commit comments