llama : deci : support ffn-free with attention (#13296)

2025-06-28 20:25:20 +00:00 · 2025-05-07 12:49:27 +02:00
parent 39e73ae0d6
commit bc4e1128f7
1 changed files with 1 additions and 1 deletions
--- a/src/llama-model.cpp
+++ b/src/llama-model.cpp
@@ -4792,7 +4792,7 @@ struct llm_build_deci : public llm_graph_context {
            }

            // FFN-free layer of Llama-3_1-Nemotron-Ultra-253B
-            if (n_head == 0 && n_ff == 0) {
+            if (n_ff == 0) {
                continue;
            }