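Add support for StarCoder2: convert Starcoder2ForCausalLM as the LLAMA architecture and add the mlp.c_fc / mlp.c_proj tensor name mappings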
This commit is contained in:
parent
e743386728
commit
e8e6103f42
2 changed files with 4 additions and 0 deletions
|
@ -249,6 +249,8 @@ class Model:
|
||||||
return gguf.MODEL_ARCH.FALCON
|
return gguf.MODEL_ARCH.FALCON
|
||||||
if arch == "GPTBigCodeForCausalLM":
|
if arch == "GPTBigCodeForCausalLM":
|
||||||
return gguf.MODEL_ARCH.STARCODER
|
return gguf.MODEL_ARCH.STARCODER
|
||||||
|
if arch == "Starcoder2ForCausalLM":
|
||||||
|
return gguf.MODEL_ARCH.LLAMA
|
||||||
if arch == "GPTRefactForCausalLM":
|
if arch == "GPTRefactForCausalLM":
|
||||||
return gguf.MODEL_ARCH.REFACT
|
return gguf.MODEL_ARCH.REFACT
|
||||||
if arch == "PersimmonForCausalLM":
|
if arch == "PersimmonForCausalLM":
|
||||||
|
|
|
@ -210,6 +210,7 @@ class TensorNameMap:
|
||||||
"model.layers.layers.{bid}.mlp.up_proj", # plamo
|
"model.layers.layers.{bid}.mlp.up_proj", # plamo
|
||||||
"model.layers.{bid}.feed_forward.w3", # internlm2
|
"model.layers.{bid}.feed_forward.w3", # internlm2
|
||||||
"encoder.layers.{bid}.mlp.fc11", # nomic-bert
|
"encoder.layers.{bid}.mlp.fc11", # nomic-bert
|
||||||
|
"model.layers.{bid}.mlp.c_fc", # starcoder2
|
||||||
),
|
),
|
||||||
|
|
||||||
MODEL_TENSOR.FFN_UP_EXP: (
|
MODEL_TENSOR.FFN_UP_EXP: (
|
||||||
|
@ -256,6 +257,7 @@ class TensorNameMap:
|
||||||
"model.layers.layers.{bid}.mlp.down_proj", # plamo
|
"model.layers.layers.{bid}.mlp.down_proj", # plamo
|
||||||
"model.layers.{bid}.feed_forward.w2", # internlm2
|
"model.layers.{bid}.feed_forward.w2", # internlm2
|
||||||
"encoder.layers.{bid}.mlp.fc2", # nomic-bert
|
"encoder.layers.{bid}.mlp.fc2", # nomic-bert
|
||||||
|
"model.layers.{bid}.mlp.c_proj", # starcoder2
|
||||||
),
|
),
|
||||||
|
|
||||||
MODEL_TENSOR.FFN_DOWN_EXP: (
|
MODEL_TENSOR.FFN_DOWN_EXP: (
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue