From 7dee9ff59ad507304bf43a2682dbe0a89bbc3dce Mon Sep 17 00:00:00 2001 From: Daniel Bevenius Date: Tue, 20 Jan 2026 06:55:24 +0100 Subject: [PATCH] convert : use n_groups instead of hardcoded values in reshape (#18929) * convert : use n_groups instead of hardcoded values in reshape This commit modifies the conversion script for NemotronHModel to use the 'n_groups' hyperparameter, and allow Python to calculate the last dimension, using -1, when reshaping the 'mixer.norm.weight' tensor. * use self.n_group instead of self.hparams["n_groups"] --- convert_hf_to_gguf.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/convert_hf_to_gguf.py b/convert_hf_to_gguf.py index becbad046d..ab015dd2c3 100755 --- a/convert_hf_to_gguf.py +++ b/convert_hf_to_gguf.py @@ -9212,7 +9212,7 @@ class NemotronHModel(GraniteHybridModel): return [(mapped_name, reshaped_data)] if name.endswith("mixer.norm.weight"): - reshaped_data = data_torch.reshape(8, 512) + reshaped_data = data_torch.reshape(self.n_group, -1) mapped_name = self.map_tensor_name(name) return [(mapped_name, reshaped_data)]