py: a bit cleaner
This commit is contained in:
parent
c3a654c0fb
commit
b986af80de
1 changed file with 10 additions and 9 deletions
|
@@ -1734,17 +1734,18 @@ class LlamaModel(Model):
|
||||||
n_kv_head = self.hparams.get("num_key_value_heads")
|
n_kv_head = self.hparams.get("num_key_value_heads")
|
||||||
is_vision_tensor = "vision_tower" in name or "vision_model" in name
|
is_vision_tensor = "vision_tower" in name or "vision_model" in name
|
||||||
|
|
||||||
# For vision model
|
if is_vision_tensor:
|
||||||
if name.startswith("language_model"):
|
if name.startswith("model.text_model"):
|
||||||
name = name.replace("language_model.", "")
|
name = name.replace("text_model.", "") # for SmolVLM
|
||||||
if name.startswith("model.text_model"):
|
else:
|
||||||
name = name.replace("text_model.", "") # for SmolVLM
|
name = name.replace("model.vision_tower.", "")
|
||||||
else:
|
if "post_layernorm" in name and self.vision_arch != gguf.MODEL_ARCH.VISION_IDEFICS3:
|
||||||
name = name.replace("model.vision_tower.", "")
|
return [] # skip post_layernorm
|
||||||
if "post_layernorm" in name and self.vision_arch != gguf.MODEL_ARCH.VISION_IDEFICS3:
|
|
||||||
return [] # skip post_layernorm
|
|
||||||
|
|
||||||
if not is_vision_tensor:
|
if not is_vision_tensor:
|
||||||
|
if name.startswith("language_model"):
|
||||||
|
# language model tensors, remove the prefix
|
||||||
|
name = name.replace("language_model.", "")
|
||||||
if name.endswith(("q_proj.weight", "q_proj.bias")):
|
if name.endswith(("q_proj.weight", "q_proj.bias")):
|
||||||
data_torch = LlamaModel.permute(data_torch, n_head, n_head)
|
data_torch = LlamaModel.permute(data_torch, n_head, n_head)
|
||||||
if name.endswith(("k_proj.weight", "k_proj.bias")):
|
if name.endswith(("k_proj.weight", "k_proj.bias")):
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue