From 5eb28c4710b6737063fbc2ec0b9b3cdc1a82a0eb Mon Sep 17 00:00:00 2001
From: Gabe Goodhart
Date: Mon, 23 Sep 2024 11:03:18 -0600
Subject: [PATCH] fix(conversion): Simplify tensor name mapping in conversion

Branch: GraniteMoE

Co-Authored-By: git@compilade.net
Signed-off-by: Gabe Goodhart
---
 convert_hf_to_gguf.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/convert_hf_to_gguf.py b/convert_hf_to_gguf.py
index d62ecb997..1cad8ef54 100755
--- a/convert_hf_to_gguf.py
+++ b/convert_hf_to_gguf.py
@@ -4129,8 +4129,8 @@ class GraniteMoeModel(GraniteModel):
         if name.endswith("block_sparse_moe.input_linear.weight"):
             gate, up = data_torch.chunk(2, dim=-2)
             return [
-                (self.map_tensor_name(f"model.layers.{bid}.block_sparse_moe.input_linear.gate.weight"), gate),
-                (self.map_tensor_name(f"model.layers.{bid}.block_sparse_moe.input_linear.up.weight"), up),
+                (self.format_tensor_name(gguf.MODEL_TENSOR.FFN_GATE_EXP, bid), gate),
+                (self.format_tensor_name(gguf.MODEL_TENSOR.FFN_UP_EXP, bid), up),
             ]
 
         return super().modify_tensors(data_torch, name, bid)