From 45e9d164ac749e8e8a2b0e26485b65797ffacbd3 Mon Sep 17 00:00:00 2001 From: Yoshi Suhara Date: Thu, 8 Aug 2024 09:18:59 -0700 Subject: [PATCH] Fix formatting issues --- convert_hf_to_gguf.py | 1 + gguf-py/gguf/constants.py | 4 ++-- src/llama.cpp | 6 +++--- 3 files changed, 6 insertions(+), 5 deletions(-) diff --git a/convert_hf_to_gguf.py b/convert_hf_to_gguf.py index 35011a760..28867d28f 100755 --- a/convert_hf_to_gguf.py +++ b/convert_hf_to_gguf.py @@ -3734,6 +3734,7 @@ class ChatGLMModel(Model): name = name.removeprefix("transformer.") return [(self.map_tensor_name(name), data_torch)] + @Model.register("NemotronForCausalLM") class NemotronModel(Model): model_arch = gguf.MODEL_ARCH.NEMOTRON diff --git a/gguf-py/gguf/constants.py b/gguf-py/gguf/constants.py index 3bd56ac29..63d51d872 100644 --- a/gguf-py/gguf/constants.py +++ b/gguf-py/gguf/constants.py @@ -1081,7 +1081,7 @@ MODEL_TENSORS: dict[MODEL_ARCH, list[MODEL_TENSOR]] = { MODEL_TENSOR.FFN_NORM, MODEL_TENSOR.FFN_DOWN, MODEL_TENSOR.FFN_UP, - ], + ], # TODO } @@ -1125,7 +1125,7 @@ MODEL_TENSOR_SKIP: dict[MODEL_ARCH, list[MODEL_TENSOR]] = { MODEL_ARCH.NEMOTRON: [ MODEL_TENSOR.ROPE_FREQS, MODEL_TENSOR.ATTN_ROT_EMBD, - ], + ], } # diff --git a/src/llama.cpp b/src/llama.cpp index e9c0c8c0e..587b53230 100644 --- a/src/llama.cpp +++ b/src/llama.cpp @@ -1315,7 +1315,7 @@ static const std::map> LLM_TENSOR_NA { LLM_TENSOR_FFN_DOWN, "blk.%d.ffn_down" }, { LLM_TENSOR_FFN_UP, "blk.%d.ffn_up" }, }, - }, + }, { LLM_ARCH_UNKNOWN, { @@ -5262,7 +5262,7 @@ static void llm_load_hparams( case 32: model.type = e_model::MODEL_4B; break; default: model.type = e_model::MODEL_UNKNOWN; } - } break; + } break; default: (void)0; } @@ -7631,7 +7631,7 @@ static bool llm_load_tensors( layer.ffn_down_b = ml.create_tensor(ctx_split, tn(LLM_TENSOR_FFN_DOWN, "bias", i), {n_embd}, llama_model_loader::TENSOR_NOT_REQUIRED); layer.ffn_up_b = ml.create_tensor(ctx_split, tn(LLM_TENSOR_FFN_UP, "bias", i), {n_ff}, llama_model_loader::TENSOR_NOT_REQUIRED); } - } break; + } break; default: throw std::runtime_error("unknown architecture"); }