llama : fix incorrect Qwen2Moe ffn_moe_out graph callback (#12631)

This commit is contained in:
Sigbjørn Skjæret 2025-03-28 22:13:02 +01:00 committed by GitHub
parent b4ae50810e
commit 3714c3ee1a
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -6323,7 +6323,7 @@ struct llm_build_qwen2moe : public llm_graph_context {
false, 0.0,
LLAMA_EXPERT_GATING_FUNC_TYPE_SOFTMAX,
il);
-cb(cur, "ffn_moe_out", il);
+cb(moe_out, "ffn_moe_out", il);
// FFN shared expert
{