File tree Expand file tree Collapse file tree 4 files changed +10
-122
lines changed Expand file tree Collapse file tree 4 files changed +10
-122
lines changed Original file line number Diff line number Diff line change @@ -41,7 +41,7 @@ echo PASS
4141echo
4242
4343# 2b. Test the sharded model is loading properly
44- $MAIN --model $WORK_PATH/ggml-model-split-00001-of-00006.gguf --n-predict 32
44+ $MAIN -no-cnv --model $WORK_PATH/ggml-model-split-00001-of-00006.gguf --n-predict 32
4545echo PASS
4646echo
4747
@@ -51,7 +51,7 @@ echo PASS
5151echo
5252
5353# 3b. Test the merged model is loading properly
54- $MAIN --model $WORK_PATH/ggml-model-merge.gguf --n-predict 32
54+ $MAIN -no-cnv --model $WORK_PATH/ggml-model-merge.gguf --n-predict 32
5555echo PASS
5656echo
5757
@@ -61,7 +61,7 @@ echo PASS
6161echo
6262
6363# 4b. Test the sharded model is loading properly
64- $MAIN --model $WORK_PATH/ggml-model-split-32-tensors-00001-of-00007.gguf --n-predict 32
64+ $MAIN -no-cnv --model $WORK_PATH/ggml-model-split-32-tensors-00001-of-00007.gguf --n-predict 32
6565echo PASS
6666echo
6767
7171# echo
7272
7373# 5b. Test the merged model is loading properly
74- # $MAIN --model $WORK_PATH/ggml-model-merge-2.gguf --n-predict 32
74+ # $MAIN -no-cnv --model $WORK_PATH/ggml-model-merge-2.gguf --n-predict 32
7575# echo PASS
7676# echo
7777
@@ -81,7 +81,7 @@ echo PASS
8181echo
8282
8383# 6b. Test the sharded model is loading properly
84- $MAIN --model $WORK_PATH/ggml-model-split-2G-00001-of-00002.gguf --n-predict 32
84+ $MAIN -no-cnv --model $WORK_PATH/ggml-model-split-2G-00001-of-00002.gguf --n-predict 32
8585echo PASS
8686echo
8787
Original file line number Diff line number Diff line change @@ -47,7 +47,7 @@ echo PASS
4747echo
4848
4949# 3a. Test the requanted model is loading properly
50- $MAIN --model $WORK_PATH/ggml-model-requant-00001-of-00006.gguf --n-predict 32
50+ $MAIN -no-cnv --model $WORK_PATH/ggml-model-requant-00001-of-00006.gguf --n-predict 32
5151echo PASS
5252echo
5353
@@ -57,7 +57,7 @@ echo PASS
5757echo
5858
5959# 4b. Test the requanted model is loading properly
60- $MAIN --model $WORK_PATH/ggml-model-requant-merge.gguf --n-predict 32
60+ $MAIN -no-cnv --model $WORK_PATH/ggml-model-requant-merge.gguf --n-predict 32
6161echo PASS
6262echo
6363
Load Diff This file was deleted.
Original file line number Diff line number Diff line change @@ -80,18 +80,18 @@ run_conversion_and_inference_lora() {
8080 # Run inference
8181 echo -e " \n\n---------------------------\n\n"
8282 echo " Running llama-cli without lora for $model_name with hidden_size $hidden_size ..."
83- OUTPUT_BASE=$(./llama-cli -m $MODELS_REPO/$model_name/hidden_size=$hidden_size/base/Base-F32.gguf \
83+ OUTPUT_BASE=$(./llama-cli -no-cnv -m $MODELS_REPO/$model_name/hidden_size=$hidden_size/base/Base-F32.gguf \
8484 -p "$EXPECTED_BASE_FIRST_WORD" -n 50 --seed 42 --temp 0)
8585
8686 echo -e " \n\n---------------------------\n\n"
8787 echo " Running llama-cli with hot lora for $model_name with hidden_size $hidden_size ..."
88- OUTPUT_LORA_HOT=$(./llama-cli -m $MODELS_REPO/$model_name/hidden_size=$hidden_size/base/Base-F32.gguf \
88+ OUTPUT_LORA_HOT=$(./llama-cli -no-cnv -m $MODELS_REPO/$model_name/hidden_size=$hidden_size/base/Base-F32.gguf \
8989 --lora $MODELS_REPO/$model_name/hidden_size=$hidden_size/lora/Lora-F32-LoRA.gguf \
9090 -p "$EXPECTED_LORA_FIRST_WORD" -n 50 --seed 42 --temp 0)
9191
9292 echo -e " \n\n---------------------------\n\n"
9393 echo " Running llama-cli with merged lora for $model_name with hidden_size $hidden_size ..."
94- OUTPUT_LORA_MERGED=$(./llama-cli -m $MODELS_REPO/$model_name/hidden_size=$hidden_size/base/Base-F32-lora-merged.gguf \
94+ OUTPUT_LORA_MERGED=$(./llama-cli -no-cnv -m $MODELS_REPO/$model_name/hidden_size=$hidden_size/base/Base-F32-lora-merged.gguf \
9595 -p "$EXPECTED_LORA_FIRST_WORD" -n 50 --seed 42 --temp 0)
9696
9797 # Remove any initial white space
You can’t perform that action at this time.
0 commit comments