llama : deci : support ffn-free with attention (#13296)

This commit is contained in:
Sigbjørn Skjæret
2025-05-07 12:49:27 +02:00
committed by GitHub
parent 39e73ae0d6
commit bc4e1128f7

View File

@@ -4792,7 +4792,7 @@ struct llm_build_deci : public llm_graph_context {
} }
// FFN-free layer of Llama-3_1-Nemotron-Ultra-253B // FFN-free layer of Llama-3_1-Nemotron-Ultra-253B
if (n_head == 0 && n_ff == 0) { if (n_ff == 0) {
continue; continue;
} }