mirror of https://github.com/ggml-org/llama.cpp.git (synced 2025-06-29 12:35:16 +00:00)
llama : fix incorrect Qwen2Moe ffn_moe_out graph callback (#12631)
@@ -6323,7 +6323,7 @@ struct llm_build_qwen2moe : public llm_graph_context {
                     false, 0.0,
                     LLAMA_EXPERT_GATING_FUNC_TYPE_SOFTMAX,
                     il);
-            cb(cur, "ffn_moe_out", il);
+            cb(moe_out, "ffn_moe_out", il);
 
             // FFN shared expert
             {
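For context: cb attaches a name/debug callback to a tensor in the compute graph. The old call labeled cur, which at this point still holds the input feeding the experts, as ffn_moe_out; the tensor that actually carries the routed-experts output is moe_out, returned by build_moe_ffn. The sketch below shows roughly where the changed line sits. It is an illustration only; the member names and the exact build_moe_ffn parameter list are assumptions inferred from the diff context, not a verbatim excerpt of the repository code.

// Abridged sketch of the FFN section in llm_build_qwen2moe; names and the
// exact build_moe_ffn argument list are assumptions for illustration, not a
// verbatim copy of the repository code.
ggml_tensor * moe_out = build_moe_ffn(cur,
        model.layers[il].ffn_gate_inp,
        model.layers[il].ffn_up_exps,
        model.layers[il].ffn_gate_exps,
        model.layers[il].ffn_down_exps,
        nullptr,
        n_expert, n_expert_used,
        LLM_FFN_SILU, false,
        false, 0.0,
        LLAMA_EXPERT_GATING_FUNC_TYPE_SOFTMAX,
        il);

// The fix: name the routed-experts output. The previous call passed cur,
// which at this point still holds the experts' input, so the ffn_moe_out
// label ended up on the wrong graph node.
cb(moe_out, "ffn_moe_out", il);

// FFN shared expert (details omitted in this sketch): build_ffn() produces
// ffn_shexp from the same input, and the layer output combines both paths:
//     cur = ggml_add(ctx0, moe_out, ffn_shexp);
//     cb(cur, "ffn_out", il);

Since the callback only sets a tensor name, the mislabel mainly affected graph debugging and any tooling that matches tensors by name, not the numerical result of the layer.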
|