model: dbrx: fix expert reshape (use [::-1] slice instead of .reverse())

This commit is contained in:
Pierrick HYMBERT 2024-04-07 20:14:43 +02:00
parent e2c919962b
commit 50b4373673

View file

@ -1528,7 +1528,7 @@ class DbrxModel(Model):
for exp_tensor_name in exp_tensor_names.keys(): for exp_tensor_name in exp_tensor_names.keys():
if name.find(exp_tensor_name) != -1 and name.find(".weight") == -1: if name.find(exp_tensor_name) != -1 and name.find(".weight") == -1:
experts = True experts = True
expert_reshape = exp_tensor_names[exp_tensor_name].reverse() expert_reshape = exp_tensor_names[exp_tensor_name][::-1]
break break
old_dtype = data_torch.dtype old_dtype = data_torch.dtype