@@ -196,17 +196,17 @@ function gg_run_open_llama_3b_v2 {
196
196
(time ./bin/main --model ${model_q5_k} -s 1234 -n 64 --ignore-eos -p " I believe the meaning of life is" ) 2>&1 | tee -a $OUT /${ci} -tg-q5_k.log
197
197
(time ./bin/main --model ${model_q6_k} -s 1234 -n 64 --ignore-eos -p " I believe the meaning of life is" ) 2>&1 | tee -a $OUT /${ci} -tg-q6_k.log
198
198
199
- (time ./bin/perplexity --model ${model_f16} -f ${wiki_test_60} -c 128 -b 128 --chunks 3 ) 2>&1 | tee -a $OUT /${ci} -tg-f16.log
200
- (time ./bin/perplexity --model ${model_q8_0} -f ${wiki_test_60} -c 128 -b 128 --chunks 3 ) 2>&1 | tee -a $OUT /${ci} -tg-q8_0.log
201
- (time ./bin/perplexity --model ${model_q4_0} -f ${wiki_test_60} -c 128 -b 128 --chunks 3 ) 2>&1 | tee -a $OUT /${ci} -tg-q4_0.log
202
- (time ./bin/perplexity --model ${model_q4_1} -f ${wiki_test_60} -c 128 -b 128 --chunks 3 ) 2>&1 | tee -a $OUT /${ci} -tg-q4_1.log
203
- (time ./bin/perplexity --model ${model_q5_0} -f ${wiki_test_60} -c 128 -b 128 --chunks 3 ) 2>&1 | tee -a $OUT /${ci} -tg-q5_0.log
204
- (time ./bin/perplexity --model ${model_q5_1} -f ${wiki_test_60} -c 128 -b 128 --chunks 3 ) 2>&1 | tee -a $OUT /${ci} -tg-q5_1.log
205
- (time ./bin/perplexity --model ${model_q2_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 3 ) 2>&1 | tee -a $OUT /${ci} -tg-q2_k.log
206
- (time ./bin/perplexity --model ${model_q3_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 3 ) 2>&1 | tee -a $OUT /${ci} -tg-q3_k.log
207
- (time ./bin/perplexity --model ${model_q4_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 3 ) 2>&1 | tee -a $OUT /${ci} -tg-q4_k.log
208
- (time ./bin/perplexity --model ${model_q5_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 3 ) 2>&1 | tee -a $OUT /${ci} -tg-q5_k.log
209
- (time ./bin/perplexity --model ${model_q6_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 3 ) 2>&1 | tee -a $OUT /${ci} -tg-q6_k.log
199
+ (time ./bin/perplexity --model ${model_f16} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-f16.log
200
+ (time ./bin/perplexity --model ${model_q8_0} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q8_0.log
201
+ (time ./bin/perplexity --model ${model_q4_0} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q4_0.log
202
+ (time ./bin/perplexity --model ${model_q4_1} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q4_1.log
203
+ (time ./bin/perplexity --model ${model_q5_0} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q5_0.log
204
+ (time ./bin/perplexity --model ${model_q5_1} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q5_1.log
205
+ (time ./bin/perplexity --model ${model_q2_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q2_k.log
206
+ (time ./bin/perplexity --model ${model_q3_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q3_k.log
207
+ (time ./bin/perplexity --model ${model_q4_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q4_k.log
208
+ (time ./bin/perplexity --model ${model_q5_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q5_k.log
209
+ (time ./bin/perplexity --model ${model_q6_k} -f ${wiki_test_60} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -tg-q6_k.log
210
210
211
211
function check_ppl {
212
212
qnt=" $1 "
@@ -260,8 +260,8 @@ function gg_run_open_llama_3b_v2 {
260
260
261
261
python3 ../convert-lora-to-ggml.py ${path_lora}
262
262
263
- (time ./bin/perplexity --model ${model_f16} -f ${shakespeare} -c 128 -b 128 --chunks 3 ) 2>&1 | tee -a $OUT /${ci} -ppl-shakespeare-f16.log
264
- (time ./bin/perplexity --model ${model_f16} -f ${shakespeare} --lora ${lora_shakespeare} -c 128 -b 128 --chunks 3 ) 2>&1 | tee -a $OUT /${ci} -ppl-shakespeare-lora-f16.log
263
+ (time ./bin/perplexity --model ${model_f16} -f ${shakespeare} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -ppl-shakespeare-f16.log
264
+ (time ./bin/perplexity --model ${model_f16} -f ${shakespeare} --lora ${lora_shakespeare} -c 128 -b 128 --chunks 2 ) 2>&1 | tee -a $OUT /${ci} -ppl-shakespeare-lora-f16.log
265
265
266
266
compare_ppl " shakespeare" " $( cat $OUT /${ci} -ppl-shakespeare-f16.log | grep " ^\[1\]" ) " " $( cat $OUT /${ci} -ppl-shakespeare-lora-f16.log | grep " ^\[1\]" ) " | tee -a $OUT /${ci} -lora-ppl.log
267
267
0 commit comments