File tree Expand file tree Collapse file tree 1 file changed +5
-2
lines changed Expand file tree Collapse file tree 1 file changed +5
-2
lines changed Original file line number Diff line number Diff line change @@ -556,8 +556,11 @@ def set_gguf_parameters(self):
556
556
logger .info (f"gguf: experts used count = { n_experts_used } " )
557
557
558
558
if (head_dim := self .hparams .get ("head_dim" )) is not None :
559
- self .gguf_writer .add_key_length (head_dim )
560
- self .gguf_writer .add_value_length (head_dim )
559
+ # Workaround: AutoConfig reports an incorrect head_dim for DeepSeekV3, so it is not written here (the correct value is set in the DeepSeekV2Model class)
560
+ # https://github.com/huggingface/transformers/blob/19224c3642705c5b6988c9f5f4251f83323d05ae/src/transformers/models/deepseek_v3/configuration_deepseek_v3.py#L210
561
+ if self .hparams .get ("model_type" ) != "deepseek_v3" :
562
+ self .gguf_writer .add_key_length (head_dim )
563
+ self .gguf_writer .add_value_length (head_dim )
561
564
562
565
self .gguf_writer .add_file_type (self .ftype )
563
566
logger .info (f"gguf: file type = { self .ftype } " )
You can’t perform that action at this time.
0 commit comments