Skip to content

Commit 55f6b9f

Browse files
authored
convert : fix duplicate key DeepSeek-R1 conversion error (#14103)
1 parent 3678b83 commit 55f6b9f

File tree

1 file changed

+5
-2
lines changed

1 file changed

+5
-2
lines changed

convert_hf_to_gguf.py

Lines changed: 5 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -556,8 +556,11 @@ def set_gguf_parameters(self):
556 556
logger.info(f"gguf: experts used count = {n_experts_used}")
557 557

558 558
if (head_dim := self.hparams.get("head_dim")) is not None:
559 -
self.gguf_writer.add_key_length(head_dim)
560 -
self.gguf_writer.add_value_length(head_dim)
559 +
# Workaround for incorrect AutoConfig value for DeepSeekV3 (is set correctly in DeepSeekV2Model class)
560 +
# https://github.com/huggingface/transformers/blob/19224c3642705c5b6988c9f5f4251f83323d05ae/src/transformers/models/deepseek_v3/configuration_deepseek_v3.py#L210
561 +
if self.hparams.get("model_type") != "deepseek_v3":
562 +
self.gguf_writer.add_key_length(head_dim)
563 +
self.gguf_writer.add_value_length(head_dim)
561 564

562 565
self.gguf_writer.add_file_type(self.ftype)
563 566
logger.info(f"gguf: file type = {self.ftype}")

0 commit comments

Comments
 (0)