llama : support for Llama-3_1-Nemotron-51B (#10669)
* conflict resolution
* move comments after bracket to their own line
This commit is contained in:
parent
dab76c92cc
commit
6f0c9e034b
4 changed files with 471 additions and 1 deletion
|
@@ -198,6 +198,7 @@ class TensorNameMap:
|
|||
"transformer.h.{bid}.self_attention.dense", # falcon
|
||||
"h.{bid}.self_attention.dense", # bloom
|
||||
"model.layers.{bid}.self_attn.o_proj", # llama-hf nemotron olmoe olmo2
|
||||
"model.layers.{bid}.self_attn.linear_attn", # deci
|
||||
"layers.{bid}.attention.wo", # llama-pth
|
||||
"encoder.layer.{bid}.attention.output.dense", # bert
|
||||
"transformer.h.{bid}.attn.out_proj", # gpt-j
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue