We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 38b16df, commit 01f2224 (Copy full SHA for 01f2224)
convert-falcon-hf-to-gguf.py
@@ -107,6 +107,7 @@ def count_model_parts(dir_model: str) -> int:
107
else:
108
gguf_writer.add_head_count_kv(1)
109
gguf_writer.add_layer_norm_eps(hparams["layer_norm_epsilon"])
110
+gguf_writer.add_file_type(ftype)
111
112
# TOKENIZATION
113
scripts/run-all-ppl.sh
@@ -1,7 +1,7 @@
1
#!/bin/bash
2
3
qnt=(f16 q8_0 q6_k q5_k q5_1 q5_0 q4_k q4_1 q4_0 q3_k q2_k)
4
-args="--no-mmap -ngl 999 -t 8"
+args="-ngl 999 -t 8"
5
6
if [ -z "$1" ]; then
7
echo "usage: $0 <model> [qnt] [args]"
0 commit comments