From a20a94f566273932e352758424d6cbbb2ec1f73b Mon Sep 17 00:00:00 2001
From: Molly Sophia
Date: Fri, 20 Dec 2024 15:03:34 +0800
Subject: [PATCH] RWKV 6: Fix error in ggml_cuda_op_bin_bcast

Signed-off-by: Molly Sophia
---
 convert_hf_to_gguf.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/convert_hf_to_gguf.py b/convert_hf_to_gguf.py
index 4a0b00f69..5b73aec6d 100755
--- a/convert_hf_to_gguf.py
+++ b/convert_hf_to_gguf.py
@@ -3007,6 +3007,9 @@ class Rwkv6Model(Model):
         if new_name.endswith("time_mix_w2.weight"):
             data_torch = data_torch.permute(0, 2, 1)
 
+        if new_name.endswith("time_mix_decay.weight") or "lerp" in new_name:
+            data_torch = data_torch.squeeze()
+
         rescale_every_n_layers = self.hparams["rescale_every"]
         if rescale_every_n_layers > 0:
             if new_name.endswith("time_mix_output.weight") or new_name.endswith("channel_mix_value.weight"):