This commit is contained in:
LDLINGLINGLING 2024-07-04 22:48:52 +09:00 committed by GitHub
commit 33099de0b9
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@ -1608,7 +1608,7 @@ class MiniCPMModel(Model):
def _reverse_hf_permute(self, weights: Tensor, n_head: int, n_kv_head: int | None = None) -> Tensor:
if n_kv_head is not None and n_head != n_kv_head:
n_head //= n_kv_head
n_head = n_kv_head
return (
weights.reshape(n_head, 2, weights.shape[0] // n_head // 2, *weights.shape[1:])