convert : fix grok tensor names
This commit is contained in:
parent
f421b32d5a
commit
c704c778f6
1 changed file with 2 additions and 2 deletions
|
@@ -1351,7 +1351,7 @@ class GrokModel(Model):
|
||||||
for wid in ["linear", "linear_1", "linear_v"]:
|
for wid in ["linear", "linear_1", "linear_v"]:
|
||||||
full = True
|
full = True
|
||||||
for xid in range(n_experts):
|
for xid in range(n_experts):
|
||||||
ename = f"transformer.decoder_layer.{bid}.moe.{xid}.{wid}"
|
ename = f"transformer.decoder_layer.{bid}.moe.{xid}.{wid}.weight"
|
||||||
if ename not in experts:
|
if ename not in experts:
|
||||||
full = False
|
full = False
|
||||||
break
|
break
|
||||||
|
@@ -1360,7 +1360,7 @@ class GrokModel(Model):
|
||||||
|
|
||||||
datas = []
|
datas = []
|
||||||
for xid in range(n_experts):
|
for xid in range(n_experts):
|
||||||
ename = f"transformer.decoder_layer.{bid}.moe.{xid}.{wid}"
|
ename = f"transformer.decoder_layer.{bid}.moe.{xid}.{wid}.weight"
|
||||||
datas.append(experts[ename])
|
datas.append(experts[ename])
|
||||||
del experts[ename]
|
del experts[ename]
|
||||||
|
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue