From da43a545ef4905a5e4f532efff9ecc9c45c82e85 Mon Sep 17 00:00:00 2001 From: wheelspawn Date: Tue, 18 Jun 2024 10:04:58 -0500 Subject: [PATCH] rename normalization layers --- convert-hf-to-gguf.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/convert-hf-to-gguf.py b/convert-hf-to-gguf.py index 0365d57d3..c7a66afae 100755 --- a/convert-hf-to-gguf.py +++ b/convert-hf-to-gguf.py @@ -2197,6 +2197,9 @@ class BertModel(Model): # we are only using BERT for embeddings so we don't need the pooling layer if name in ("embeddings.position_ids", "pooler.dense.weight", "pooler.dense.bias") or "cls." in name: return [] # we don't need these + + name = name.replace("gamma", "weight") + name = name.replace("beta", "bias") try_suffixes = (".weight", ".bias", ".beta", ".gamma") return [(self.map_tensor_name(name, try_suffixes), data_torch)]