llama : add n_expert and n_expert_used to hparams + change quants

This commit is contained in:
Georgi Gerganov 2023-12-10 13:57:54 +02:00
parent d1259b7b35
commit e640cbe055
No known key found for this signature in database
GPG key ID: 449E073F9DC10735
6 changed files with 111 additions and 54 deletions

View file

@@ -38,6 +38,8 @@ class Keys:
FEED_FORWARD_LENGTH = "{arch}.feed_forward_length"
USE_PARALLEL_RESIDUAL = "{arch}.use_parallel_residual"
TENSOR_DATA_LAYOUT = "{arch}.tensor_data_layout"
EXPERT_COUNT = "{arch}.expert_count"
EXPERT_USED_COUNT = "{arch}.expert_used_count"
class Attention:
HEAD_COUNT = "{arch}.attention.head_count"