convert : fix conversion from FP8 for Deepseek-V3.1-Base

2025-08-19 17:27:59 -04:00 · 2025-08-19 17:27:59 -04:00 · 899398277d
parent 1ae6ab7601
commit 899398277d
1 changed file with 2 additions and 0 deletions
--- a/convert_hf_to_gguf.py
+++ b/convert_hf_to_gguf.py
@@ -254,6 +254,8 @@ class ModelBase:
                    # TODO: make sure it's a list of integers
                    for i, size in enumerate(weight_block_size):
                        scale = scale.repeat_interleave(size, i)
+                # unpad the scale (e.g. when the tensor size isn't a multiple of the block size)
+                scale = scale[tuple(slice(0, size) for size in weight.shape)]

                return weight.float() * scale