From 02ff08507146c516f10eda0d709d1897fc13b20f Mon Sep 17 00:00:00 2001 From: Vaibhavs10 Date: Tue, 17 Jun 2025 16:01:53 +0200 Subject: [PATCH] fix errors in conversion. --- convert_hf_to_gguf.py | 7 +++++-- gguf-py/gguf/constants.py | 1 + 2 files changed, 6 insertions(+), 2 deletions(-) diff --git a/convert_hf_to_gguf.py b/convert_hf_to_gguf.py index ef0501883..ce1500d69 100755 --- a/convert_hf_to_gguf.py +++ b/convert_hf_to_gguf.py @@ -6305,8 +6305,11 @@ class SmolLM3Model(LlamaModel): def set_gguf_parameters(self): super().set_gguf_parameters() - if self.model.config.no_rope_layers is not None: - self.gguf_writer.add_array("smollm3.no_rope_layers", self.model.config.no_rope_layers, gguf.GGUFValueType.INT32) + # if self.model.config.no_rope_layers is not None: + # self.gguf_writer.add_array("smollm3.no_rope_layers", self.model.config.no_rope_layers, gguf.GGUFValueType.INT32) + no_rope_layers = self.hparams.get("no_rope_layers") + if no_rope_layers is not None: + self.gguf_writer.add_array("smollm3.no_rope_layers", no_rope_layers) ###### CONVERSION LOGIC ###### diff --git a/gguf-py/gguf/constants.py b/gguf-py/gguf/constants.py index 054591dcf..70083cd4e 100644 --- a/gguf-py/gguf/constants.py +++ b/gguf-py/gguf/constants.py @@ -2114,6 +2114,7 @@ MODEL_TENSORS: dict[MODEL_ARCH, list[MODEL_TENSOR]] = { MODEL_TENSOR.ATTN_V, MODEL_TENSOR.ATTN_OUT, MODEL_TENSOR.ATTN_ROT_EMBD, + MODEL_TENSOR.FFN_NORM, MODEL_TENSOR.FFN_GATE, MODEL_TENSOR.FFN_DOWN, MODEL_TENSOR.FFN_UP,