diff --git a/convert-hf-to-gguf.py b/convert-hf-to-gguf.py index 51549ac72..f5ed70eb3 100755 --- a/convert-hf-to-gguf.py +++ b/convert-hf-to-gguf.py @@ -2392,7 +2392,8 @@ class CommandR2Model(Model): # max_position_embeddings = 8192 in config.json but model was actually # trained on 128k context length - self.hparams["max_position_embeddings"] = self.hparams["model_max_length"] + # aya-23 models don't have model_max_length specified + self.hparams["max_position_embeddings"] = self.find_hparam(["model_max_length", "max_position_embeddings"]) def set_gguf_parameters(self): super().set_gguf_parameters()