convert : fix squeeze for ssm_conv tensors

2025-04-16 03:26:08 +00:00 · 2025-03-25 19:54:18 +02:00 · 2025-03-25 19:54:18 +02:00 · 9c60fc4c78
commit 9c60fc4c78
parent 053b3f9aae
1 changed files with 4 additions and 0 deletions
--- a/convert_hf_to_gguf.py
+++ b/convert_hf_to_gguf.py
@@ -3814,6 +3814,10 @@ class MambaModel(Model):
            logger.debug("A_log --> A ==> " + new_name)
            data_torch = -torch.exp(data_torch)

+        # [4 1 8192 1] -> [4 8192 1 1]
+        if new_name.endswith(".ssm_conv1d"):
+            data_torch = data_torch.squeeze()
+
        # assuming token_embd.weight is seen before output.weight
        if self._tok_embd is not None and new_name == output_name:
            if torch.equal(self._tok_embd, data_torch):