修复了由 MiniCPM 的 GQA 结构导致的模型转换 bug

2024-07-02 15:43:07 +08:00 · 2024-07-02 15:43:07 +08:00 · 47d821a08c
commit 47d821a08c
parent 023b8807e1
1 changed files with 1 additions and 1 deletions
--- a/convert-hf-to-gguf.py
+++ b/convert-hf-to-gguf.py
@@ -1605,7 +1605,7 @@ class MiniCPMModel(Model):

    def _reverse_hf_permute(self, weights: Tensor, n_head: int, n_kv_head: int | None = None) -> Tensor:
        if n_kv_head is not None and n_head != n_kv_head:
-            n_head //= n_kv_head
+            n_head = n_kv_head

        return (
            weights.reshape(n_head, 2, weights.shape[0] // n_head // 2, *weights.shape[1:])