Skip to content

Commit 443f7d5

Browse files
committed
Call add_tensor before write_* functions
1 parent 550b925 commit 443f7d5

File tree

2 files changed

+22
-6
lines changed

2 files changed

+22
-6
lines changed

convert-generic.py

Lines changed: 10 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -54,14 +54,19 @@
5454
model_instance.set_vocab()
5555

5656
# write model
57-
print("gguf: write header")
58-
model_instance.gguf_writer.write_header_to_file()
59-
print("gguf: write metadata")
60-
model_instance.gguf_writer.write_kv_data_to_file()
6157
if not args.vocab_only:
62-
print("gguf: write tensors")
6358
model_instance.write_tensors()
59+
print("gguf: write header")
60+
model_instance.gguf_writer.write_header_to_file()
61+
print("gguf: write metadata")
62+
model_instance.gguf_writer.write_kv_data_to_file()
63+
print("gguf: write tensors")
6464
model_instance.gguf_writer.write_tensors_to_file()
65+
else:
66+
print("gguf: write header")
67+
model_instance.gguf_writer.write_header_to_file()
68+
print("gguf: write metadata")
69+
model_instance.gguf_writer.write_kv_data_to_file()
6570

6671
model_instance.gguf_writer.close()
6772

model.py

Lines changed: 12 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -190,7 +190,18 @@ def set_gguf_parameters(self):
190190

191191

192192
class GPTNeoXModel(Model):
193-
pass
193+
def set_gguf_parameters(self):
194+
block_count = self.hparams["num_hidden_layers"]
195+
196+
self.gguf_writer.add_name(self.dir_model.name)
197+
self.gguf_writer.add_context_length(self.hparams["max_position_embeddings"])
198+
self.gguf_writer.add_embedding_length(self.hparams["hidden_size"])
199+
self.gguf_writer.add_block_count(block_count)
200+
self.gguf_writer.add_feed_forward_length(self.hparams["intermediate_size"])
201+
self.gguf_writer.add_rope_dimension_count(int(self.hparams["rotary_pct"]*(self.hparams["hidden_size"]//self.hparams["num_attention_heads"])))
202+
self.gguf_writer.add_head_count(self.hparams["num_attention_heads"])
203+
self.gguf_writer.add_parallel_residual(self.hparams["use_parallel_residual"] if "use_parallel_residual" in self.hparams else True)
204+
self.gguf_writer.add_layer_norm_eps(self.hparams["layer_norm_eps"])
194205

195206
class BloomModel(Model):
196207
def set_gguf_parameters(self):

0 commit comments

Comments
 (0)