2 files changed: +22 -6 lines changed
Original file line number | Diff line number | Diff line change
54
54
model_instance.set_vocab()

# Write the GGUF output.
# The header and key/value metadata are always written; tensor conversion and
# tensor data are only produced when a full (non vocab-only) export was
# requested.
if not args.vocab_only:
    # Tensor conversion runs before the header is written.
    # NOTE(review): presumably the writer needs the tensor info before the
    # header is emitted -- confirm against the gguf writer.
    model_instance.write_tensors()

print("gguf: write header")
model_instance.gguf_writer.write_header_to_file()
print("gguf: write metadata")
model_instance.gguf_writer.write_kv_data_to_file()

if not args.vocab_only:
    print("gguf: write tensors")
    model_instance.gguf_writer.write_tensors_to_file()

model_instance.gguf_writer.close()
67
72
Original file line number Diff line number Diff line change @@ -190,7 +190,18 @@ def set_gguf_parameters(self):
190
190
191
191
192
192
class GPTNeoXModel(Model):
    """Model subclass that emits GPT-NeoX hyperparameters as GGUF metadata."""

    def set_gguf_parameters(self):
        """Forward the values in ``self.hparams`` to ``self.gguf_writer``.

        Required keys: ``num_hidden_layers``, ``max_position_embeddings``,
        ``hidden_size``, ``intermediate_size``, ``rotary_pct``,
        ``num_attention_heads`` and ``layer_norm_eps``.  The optional key
        ``use_parallel_residual`` falls back to ``True`` when absent.

        Raises:
            KeyError: if one of the required keys is missing.
        """
        hparams = self.hparams
        writer = self.gguf_writer
        n_layers = hparams["num_hidden_layers"]

        writer.add_name(self.dir_model.name)
        writer.add_context_length(hparams["max_position_embeddings"])
        writer.add_embedding_length(hparams["hidden_size"])
        writer.add_block_count(n_layers)
        writer.add_feed_forward_length(hparams["intermediate_size"])

        # Rotary dimension count is the ``rotary_pct`` fraction of the
        # per-head size, truncated towards zero by ``int``.
        rotary_pct = hparams["rotary_pct"]
        head_size = hparams["hidden_size"] // hparams["num_attention_heads"]
        writer.add_rope_dimension_count(int(rotary_pct * head_size))

        writer.add_head_count(hparams["num_attention_heads"])
        writer.add_parallel_residual(hparams.get("use_parallel_residual", True))
        writer.add_layer_norm_eps(hparams["layer_norm_eps"])
194
205
195
206
class BloomModel (Model ):
196
207
def set_gguf_parameters (self ):
You can’t perform that action at this time.
0 commit comments