The wrong input was being fed to the MoE layer: the norm ahead of the MoE feed-forward branch was applied to `cur` instead of `ffn_inp`. This commit corrects that.

Co-authored-by: Megha Agarwal <16129366+megha95@users.noreply.github.com>
This commit is contained in:
Pierrick Hymbert 2024-04-12 21:41:14 +02:00 committed by GitHub
parent 542585fbea
commit ecbfb1b584
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -7165,7 +7165,7 @@ struct llm_build_context {
// feed-forward network
// MoE branch
-cur = llm_build_norm(ctx0, cur, hparams,
+cur = llm_build_norm(ctx0, ffn_inp, hparams,
model.layers[il].attn_out_norm, NULL,
LLM_NORM, cb, il);
cb(cur, "attn_out_norm", il);