NVIDIA uses the `LLaMAForCausalLM` string in their `config.json`, e.g. `nvidia/Llama3-ChatQA-2-8B`

This commit is contained in:
Csaba Kecskemeti 2024-09-14 10:48:09 -07:00
parent 822b6322de
commit aaf7f53d46

View file

@ -1487,7 +1487,7 @@ class StableLMModel(Model):
raise ValueError(f"Unprocessed norms: {norms}")
@Model.register("LlamaForCausalLM", "MistralForCausalLM", "MixtralForCausalLM")
@Model.register("LLaMAForCausalLM", "LlamaForCausalLM", "MistralForCausalLM", "MixtralForCausalLM")
class LlamaModel(Model):
model_arch = gguf.MODEL_ARCH.LLAMA