fix(conversion): Simplify tensor name mapping in conversion

Branch: GraniteMoE
Co-Authored-By: git@compilade.net
Signed-off-by: Gabe Goodhart <ghart@us.ibm.com>
2024-09-23 11:03:18 -06:00 · 2024-09-23 11:03:18 -06:00 · 5eb28c4710
commit 5eb28c4710
parent 71bc4c1f93
1 changed file with 2 additions and 2 deletions
--- a/convert_hf_to_gguf.py
+++ b/convert_hf_to_gguf.py
@@ -4129,8 +4129,8 @@ class GraniteMoeModel(GraniteModel):
        if name.endswith("block_sparse_moe.input_linear.weight"):
            gate, up = data_torch.chunk(2, dim=-2)
            return [
-                (self.map_tensor_name(f"model.layers.{bid}.block_sparse_moe.input_linear.gate.weight"), gate),
-                (self.map_tensor_name(f"model.layers.{bid}.block_sparse_moe.input_linear.up.weight"), up),
+                (self.format_tensor_name(gguf.MODEL_TENSOR.FFN_GATE_EXP, bid), gate),
+                (self.format_tensor_name(gguf.MODEL_TENSOR.FFN_UP_EXP, bid), up),
            ]

        return super().modify_tensors(data_torch, name, bid)