mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-04-16 03:26:08 +00:00
llama : fix incorrect Qwen2Moe ffn_moe_out graph callback (#12631)
This commit is contained in:
parent
b4ae50810e
commit
3714c3ee1a
@@ -6323,7 +6323,7 @@ struct llm_build_qwen2moe : public llm_graph_context {
|
||||
false, 0.0,
|
||||
LLAMA_EXPERT_GATING_FUNC_TYPE_SOFTMAX,
|
||||
il);
|
||||
- cb(cur, "ffn_moe_out", il);
|
||||
+ cb(moe_out, "ffn_moe_out", il);
|
||||
|
||||
// FFN shared expert
|
||||
{
|
||||
|
Loading…
x
Reference in New Issue
Block a user