From 899398277dc3ee8f3be99be402fdbcbfed813f64 Mon Sep 17 00:00:00 2001
From: Francis Couture-Harpin
Date: Tue, 19 Aug 2025 17:27:59 -0400
Subject: [PATCH] convert : fix conversion from FP8 for Deepseek-V3.1-Base

---
 convert_hf_to_gguf.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/convert_hf_to_gguf.py b/convert_hf_to_gguf.py
index a7c5e210f7..3b30d8c152 100755
--- a/convert_hf_to_gguf.py
+++ b/convert_hf_to_gguf.py
@@ -254,6 +254,8 @@ class ModelBase:
                     # TODO: make sure it's a list of integers
                     for i, size in enumerate(weight_block_size):
                         scale = scale.repeat_interleave(size, i)
+                    # unpad the scale (e.g. when the tensor size isn't a multiple of the block size)
+                    scale = scale[tuple(slice(0, size) for size in weight.shape)]
 
                 return weight.float() * scale
 