convert : read/write n_head_kv

This commit is contained in:
Georgi Gerganov 2024-05-21 19:40:01 +03:00
parent e9acbce624
commit 92711138f9
No known key found for this signature in database
GPG key ID: 449E073F9DC10735
2 changed files with 4 additions and 3 deletions

View file

@@ -1787,6 +1787,7 @@ class Phi3MiniModel(Model):
n_embd = self.find_hparam(["hidden_size", "n_embd"])
n_head = self.find_hparam(["num_attention_heads", "n_head"])
+n_head_kv = self.find_hparam(["num_key_value_heads", "n_head_kv"])
rms_eps = self.find_hparam(["rms_norm_eps"])
max_pos_embds = self.find_hparam(["n_positions", "max_position_embeddings"])
orig_max_pos_embds = self.find_hparam(["original_max_position_embeddings"])
@@ -1799,7 +1800,7 @@ class Phi3MiniModel(Model):
self.gguf_writer.add_feed_forward_length(self.find_hparam(["intermediate_size"]))
self.gguf_writer.add_block_count(block_count)
self.gguf_writer.add_head_count(n_head)
-self.gguf_writer.add_head_count_kv(n_head)
+self.gguf_writer.add_head_count_kv(n_head_kv)
self.gguf_writer.add_layer_norm_rms_eps(rms_eps)
self.gguf_writer.add_rope_dimension_count(rope_dims)
self.gguf_writer.add_rope_freq_base(self.find_hparam(["rope_theta"]))