convert : fix grok tensor names
This commit is contained in:
parent
f421b32d5a
commit
c704c778f6
1 changed file with 2 additions and 2 deletions
|
@@ -1351,7 +1351,7 @@ class GrokModel(Model):
|
|||
for wid in ["linear", "linear_1", "linear_v"]:
|
||||
full = True
|
||||
for xid in range(n_experts):
|
||||
ename = f"transformer.decoder_layer.{bid}.moe.{xid}.{wid}"
|
||||
ename = f"transformer.decoder_layer.{bid}.moe.{xid}.{wid}.weight"
|
||||
if ename not in experts:
|
||||
full = False
|
||||
break
|
||||
|
@@ -1360,7 +1360,7 @@ class GrokModel(Model):
|
|||
|
||||
datas = []
|
||||
for xid in range(n_experts):
|
||||
ename = f"transformer.decoder_layer.{bid}.moe.{xid}.{wid}"
|
||||
ename = f"transformer.decoder_layer.{bid}.moe.{xid}.{wid}.weight"
|
||||
datas.append(experts[ename])
|
||||
del experts[ename]
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue