You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
Copy file name to clipboard. Expand all lines: ci/run.sh
+11 -5 Lines changed: 11 additions & 5 deletions
Original file line number
Diff line number
Diff line change
@@ -259,7 +259,7 @@ function gg_sum_test_scripts_release {
259
259
}
260
260
261
261
function gg_get_model {
262
-
local gguf_0="$MNT/models/qwen3/0.6B/ggml-model-bf16.gguf"
262
+
local gguf_0="$MNT/models/qwen3/0.6B/ggml-model-f16.gguf"
263
263
if [[ -s $gguf_0 ]]; then
264
264
echo -n "$gguf_0"
265
265
else
@@ -388,7 +388,9 @@ function gg_run_qwen3_0_6b {
388
388
(time ./bin/llama-cli -no-cnv --model ${model_q6_k} -ngl 99 -c 1024 -s 1234 -n 64 --ignore-eos -p "I believe the meaning of life is" ) 2>&1| tee -a $OUT/${ci}-tg-q6_k.log
389
389
390
390
(time ./bin/llama-perplexity --model ${model_f16} -f ${wiki_test} -ngl 99 -c 1024 -b 512 --chunks 2 ) 2>&1| tee -a $OUT/${ci}-tg-f16.log
391
-
(time ./bin/llama-perplexity --model ${model_bf16} -f ${wiki_test} -ngl 99 -c 1024 -b 512 --chunks 2 ) 2>&1| tee -a $OUT/${ci}-tg-bf16.log
391
+
if [ -z ${GG_BUILD_NO_BF16} ]; then
392
+
(time ./bin/llama-perplexity --model ${model_bf16} -f ${wiki_test} -ngl 99 -c 1024 -b 512 --chunks 2 ) 2>&1| tee -a $OUT/${ci}-tg-bf16.log
393
+
fi
392
394
(time ./bin/llama-perplexity --model ${model_q8_0} -f ${wiki_test} -ngl 99 -c 1024 -b 512 --chunks 2 ) 2>&1| tee -a $OUT/${ci}-tg-q8_0.log
393
395
(time ./bin/llama-perplexity --model ${model_q4_0} -f ${wiki_test} -ngl 99 -c 1024 -b 512 --chunks 2 ) 2>&1| tee -a $OUT/${ci}-tg-q4_0.log
394
396
(time ./bin/llama-perplexity --model ${model_q4_1} -f ${wiki_test} -ngl 99 -c 1024 -b 512 --chunks 2 ) 2>&1| tee -a $OUT/${ci}-tg-q4_1.log
@@ -400,7 +402,7 @@ function gg_run_qwen3_0_6b {
400
402
(time ./bin/llama-perplexity --model ${model_q5_k} -f ${wiki_test} -ngl 99 -c 1024 -b 512 --chunks 2 ) 2>&1| tee -a $OUT/${ci}-tg-q5_k.log
401
403
(time ./bin/llama-perplexity --model ${model_q6_k} -f ${wiki_test} -ngl 99 -c 1024 -b 512 --chunks 2 ) 2>&1| tee -a $OUT/${ci}-tg-q6_k.log
402
404
403
-
(time ./bin/llama-imatrix --model ${model_bf16} -f ${wiki_test} -ngl 99 -c 1024 -b 512 --chunks 2 ) 2>&1| tee -a $OUT/${ci}-imatrix.log
405
+
(time ./bin/llama-imatrix --model ${model_f16} -f ${wiki_test} -ngl 99 -c 1024 -b 512 --chunks 2 ) 2>&1| tee -a $OUT/${ci}-imatrix.log
404
406
405
407
(time ./bin/llama-save-load-state --model ${model_q4_0} -ngl 10 -c 1024 -fa off ) 2>&1| tee -a $OUT/${ci}-save-load-state.log
406
408
(time ./bin/llama-save-load-state --model ${model_q4_0} -ngl 10 -c 1024 -fa on ) 2>&1| tee -a $OUT/${ci}-save-load-state.log
@@ -421,7 +423,9 @@ function gg_run_qwen3_0_6b {
421
423
}
422
424
423
425
check_ppl "f16" "$(cat $OUT/${ci}-tg-f16.log | grep "^\[1\]")" | tee -a $OUT/${ci}-ppl.log
424
-
check_ppl "bf16" "$(cat $OUT/${ci}-tg-bf16.log | grep "^\[1\]")" | tee -a $OUT/${ci}-ppl.log
426
+
if [ -z ${GG_BUILD_NO_BF16} ]; then
427
+
check_ppl "bf16" "$(cat $OUT/${ci}-tg-bf16.log | grep "^\[1\]")" | tee -a $OUT/${ci}-ppl.log
428
+
fi
425
429
check_ppl "q8_0" "$(cat $OUT/${ci}-tg-q8_0.log | grep "^\[1\]")" | tee -a $OUT/${ci}-ppl.log
426
430
check_ppl "q4_0" "$(cat $OUT/${ci}-tg-q4_0.log | grep "^\[1\]")" | tee -a $OUT/${ci}-ppl.log
427
431
check_ppl "q4_1" "$(cat $OUT/${ci}-tg-q4_1.log | grep "^\[1\]")" | tee -a $OUT/${ci}-ppl.log
0 commit comments