@@ -272,19 +272,19 @@ function gg_run_open_llama_3b_v2 {
272272 (time ./bin/main --model ${model_q5_k} -s 1234 -n 64 --ignore-eos -p " I believe the meaning of life is" ) 2>&1 | tee -a $OUT /${ci} -tg-q5_k.log
273273 (time ./bin/main --model ${model_q6_k} -s 1234 -n 64 --ignore-eos -p " I believe the meaning of life is" ) 2>&1 | tee -a $OUT /${ci} -tg-q6_k.log
274274
275- (time ./bin/perplexity --model ${model_f16} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-f16.log
276- (time ./bin/perplexity --model ${model_q8_0} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q8_0.log
277- (time ./bin/perplexity --model ${model_q4_0} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q4_0.log
278- (time ./bin/perplexity --model ${model_q4_1} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q4_1.log
279- (time ./bin/perplexity --model ${model_q5_0} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q5_0.log
280- (time ./bin/perplexity --model ${model_q5_1} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q5_1.log
281- (time ./bin/perplexity --model ${model_q2_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q2_k.log
282- (time ./bin/perplexity --model ${model_q3_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q3_k.log
283- (time ./bin/perplexity --model ${model_q4_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q4_k.log
284- (time ./bin/perplexity --model ${model_q5_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q5_k.log
285- (time ./bin/perplexity --model ${model_q6_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q6_k.log
286-
287- (time ./bin/imatrix --model ${model_f16} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -imatrix.log
275+ (time ./bin/perplexity --model ${model_f16} -f ${wiki_test_60} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -tg-f16.log
276+ (time ./bin/perplexity --model ${model_q8_0} -f ${wiki_test_60} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -tg-q8_0.log
277+ (time ./bin/perplexity --model ${model_q4_0} -f ${wiki_test_60} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -tg-q4_0.log
278+ (time ./bin/perplexity --model ${model_q4_1} -f ${wiki_test_60} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -tg-q4_1.log
279+ (time ./bin/perplexity --model ${model_q5_0} -f ${wiki_test_60} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -tg-q5_0.log
280+ (time ./bin/perplexity --model ${model_q5_1} -f ${wiki_test_60} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -tg-q5_1.log
281+ (time ./bin/perplexity --model ${model_q2_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -tg-q2_k.log
282+ (time ./bin/perplexity --model ${model_q3_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -tg-q3_k.log
283+ (time ./bin/perplexity --model ${model_q4_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -tg-q4_k.log
284+ (time ./bin/perplexity --model ${model_q5_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -tg-q5_k.log
285+ (time ./bin/perplexity --model ${model_q6_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -tg-q6_k.log
286+
287+ (time ./bin/imatrix --model ${model_f16} -f ${wiki_test_60} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -imatrix.log
288288
289289 (time ./bin/save-load-state --model ${model_q4_0} ) 2>&1 | tee -a $OUT /${ci} -save-load-state.log
290290
@@ -343,17 +343,17 @@ function gg_run_open_llama_3b_v2 {
343343 python3 ../convert-lora-to-ggml.py ${path_lora}
344344
345345 # f16
346- (time ./bin/perplexity --model ${model_f16} -f ${shakespeare} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -ppl-shakespeare-f16.log
347- (time ./bin/perplexity --model ${model_f16} -f ${shakespeare} --lora ${lora_shakespeare} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -ppl-shakespeare-lora-f16.log
346+ (time ./bin/perplexity --model ${model_f16} -f ${shakespeare} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -ppl-shakespeare-f16.log
347+ (time ./bin/perplexity --model ${model_f16} -f ${shakespeare} --lora ${lora_shakespeare} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -ppl-shakespeare-lora-f16.log
348348 compare_ppl " f16 shakespeare" " $( cat $OUT /${ci} -ppl-shakespeare-f16.log | grep " ^\[1\]" ) " " $( cat $OUT /${ci} -ppl-shakespeare-lora-f16.log | grep " ^\[1\]" ) " | tee -a $OUT /${ci} -lora-ppl.log
349349
350350 # q8_0
351- (time ./bin/perplexity --model ${model_q8_0} -f ${shakespeare} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -ppl-shakespeare-q8_0.log
352- (time ./bin/perplexity --model ${model_q8_0} -f ${shakespeare} --lora ${lora_shakespeare} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -ppl-shakespeare-lora-q8_0.log
351+ (time ./bin/perplexity --model ${model_q8_0} -f ${shakespeare} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -ppl-shakespeare-q8_0.log
352+ (time ./bin/perplexity --model ${model_q8_0} -f ${shakespeare} --lora ${lora_shakespeare} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -ppl-shakespeare-lora-q8_0.log
353353 compare_ppl " q8_0 shakespeare" " $( cat $OUT /${ci} -ppl-shakespeare-q8_0.log | grep " ^\[1\]" ) " " $( cat $OUT /${ci} -ppl-shakespeare-lora-q8_0.log | grep " ^\[1\]" ) " | tee -a $OUT /${ci} -lora-ppl.log
354354
355355 # q8_0 + f16 lora-base
356- (time ./bin/perplexity --model ${model_q8_0} -f ${shakespeare} --lora ${lora_shakespeare} --lora-base ${model_f16} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -ppl-shakespeare-lora-q8_0-f16.log
356+ (time ./bin/perplexity --model ${model_q8_0} -f ${shakespeare} --lora ${lora_shakespeare} --lora-base ${model_f16} -c 128 -b 128 --chunks 1 ) 2>&1 | tee -a $OUT /${ci} -ppl-shakespeare-lora-q8_0-f16.log
357357 compare_ppl " q8_0 / f16 base shakespeare" " $( cat $OUT /${ci} -ppl-shakespeare-q8_0.log | grep " ^\[1\]" ) " " $( cat $OUT /${ci} -ppl-shakespeare-lora-q8_0-f16.log | grep " ^\[1\]" ) " | tee -a $OUT /${ci} -lora-ppl.log
358358
359359 set +e
0 commit comments