1 file changed: +7 -0 lines changed
Original file line number | Diff line number | Diff line change
@@ -2761,6 +2761,13 @@ def set_gguf_parameters(self):
2761
2761
if (shared_expert_intermediate_size := self .hparams .get ('shared_expert_intermediate_size' )) is not None :
2762
2762
self .gguf_writer .add_expert_shared_feed_forward_length (shared_expert_intermediate_size )
2763
2763
logger .info (f"gguf: expert shared feed forward length = { shared_expert_intermediate_size } " )
2764
+ # YaRN is not enabled by default
2765
+ # To enable it, please refer to this guide: https://huggingface.co/Qwen/Qwen3-30B-A3B#processing-long-texts
2766
+ if self .hparams .get ("rope_scaling" ) is not None and "factor" in self .hparams ["rope_scaling" ]:
2767
+ if self .hparams ["rope_scaling" ].get ("type" ) == "yarn" :
2768
+ self .gguf_writer .add_rope_scaling_type (gguf .RopeScalingType .YARN )
2769
+ self .gguf_writer .add_rope_scaling_factor (self .hparams ["rope_scaling" ]["factor" ])
2770
+ self .gguf_writer .add_rope_scaling_orig_ctx_len (self .hparams ["rope_scaling" ]["original_max_position_embeddings" ])
2764
2771
2765
2772
_experts : list [dict [str , Tensor ]] | None = None
2766
2773
You can’t perform that action at this time.
0 commit comments