@@ -233,6 +233,38 @@ function gg_run_open_llama_3b_v2 {
233
233
check_ppl " q5_k" " $( cat $OUT /${ci} -tg-q5_k.log | grep " ^\[1\]" ) " | tee -a $OUT /${ci} -ppl.log
234
234
check_ppl " q6_k" " $( cat $OUT /${ci} -tg-q6_k.log | grep " ^\[1\]" ) " | tee -a $OUT /${ci} -ppl.log
235
235
236
+ # lora
237
# Compare two perplexity results and fail when the second one is worse.
#
# Arguments:
#   $1 - label printed at the start of the report line
#   $2 - text containing the reference perplexity
#   $3 - text containing the perplexity under test
# Outputs:
#   one report line on stdout
# Returns:
#   0  when the value from $3 is not higher than the value from $2
#   20 when it is higher, or when either value cannot be extracted
function compare_ppl {
    local qnt="$1"
    local ppl1 ppl2

    # The last decimal number found in each text is the value that is compared.
    # "|| true": a text without any number is reported below instead of
    # tripping errexit/pipefail in the caller.
    ppl1=$(printf '%s\n' "$2" | grep -oE '[0-9]+\.[0-9]+' | tail -n 1) || true
    ppl2=$(printf '%s\n' "$3" | grep -oE '[0-9]+\.[0-9]+' | tail -n 1) || true

    # Without both values the comparison is meaningless; never report OK.
    if [ -z "$ppl1" ] || [ -z "$ppl2" ]; then
        printf ' - %s @ %s %s (FAIL: missing perplexity value)\n' "$qnt" "${ppl1:-n/a}" "${ppl2:-n/a}"
        return 20
    fi

    # Floating-point comparison; awk exits 0 when ppl1 < ppl2.
    if awk -v a="$ppl1" -v b="$ppl2" 'BEGIN { exit !(a + 0 < b + 0) }'; then
        # Printed as "<reference> (FAIL: <tested> > <reference>)" so the
        # inequality shown matches the condition that triggered the failure.
        printf ' - %s @ %s (FAIL: %s > %s)\n' "$qnt" "$ppl1" "$ppl2" "$ppl1"
        return 20
    fi

    printf ' - %s @ %s %s OK\n' "$qnt" "$ppl1" "$ppl2"
    return 0
}
250
+
251
+ path_lora=" ../models-mnt/open-llama/3B-v2/lora"
252
+ path_shakespeare=" ../models-mnt/shakespeare"
253
+
254
+ shakespeare=" ${path_shakespeare} /shakespeare.txt"
255
+ lora_shakespeare=" ${path_lora} /ggml-adapter-model.bin"
256
+
257
+ gg_wget ${path_lora} https://huggingface.co/slaren/open_llama_3b_v2_shakespeare_lora/resolve/main/adapter_config.json
258
+ gg_wget ${path_lora} https://huggingface.co/slaren/open_llama_3b_v2_shakespeare_lora/resolve/main/adapter_model.bin
259
+ gg_wget ${path_shakespeare} https://huggingface.co/slaren/open_llama_3b_v2_shakespeare_lora/resolve/main/shakespeare.txt
260
+
261
+ python3 ../convert-lora-to-ggml.py ${path_lora}
262
+
263
+ (time ./bin/perplexity --model ${model_f16} -f ${shakespeare} -c 128 -b 128 --chunks 3 ) 2>&1 | tee -a $OUT /${ci} -ppl-shakespeare-f16.log
264
+ (time ./bin/perplexity --model ${model_f16} -f ${shakespeare} --lora ${lora_shakespeare} -c 128 -b 128 --chunks 3 ) 2>&1 | tee -a $OUT /${ci} -ppl-shakespeare-lora-f16.log
265
+
266
+ compare_ppl " shakespeare" " $( cat $OUT /${ci} -ppl-shakespeare-f16.log | grep " ^\[1\]" ) " " $( cat $OUT /${ci} -ppl-shakespeare-lora-f16.log | grep " ^\[1\]" ) " | tee -a $OUT /${ci} -lora-ppl.log
267
+
236
268
set +e
237
269
}
238
270
@@ -253,6 +285,7 @@ function gg_sum_open_llama_3b_v2 {
253
285
gg_printf ' - q4_k:\n```\n%s\n```\n' " $( cat $OUT /${ci} -tg-q4_k.log) "
254
286
gg_printf ' - q5_k:\n```\n%s\n```\n' " $( cat $OUT /${ci} -tg-q5_k.log) "
255
287
gg_printf ' - q6_k:\n```\n%s\n```\n' " $( cat $OUT /${ci} -tg-q6_k.log) "
288
+ gg_printf ' - lora:\n%s\n' " $( cat $OUT /${ci} -lora-ppl.log) "
256
289
}
257
290
258
291
# open_llama_7b_v2
0 commit comments