@@ -1050,6 +1050,9 @@ int llama_context::decode(llama_batch & inp_batch) {
     // finalize the batch processing
     kv_guard.commit();
 
+    // set to total number of outputs in the batch, for use in llama_get_logits_ith
+    n_outputs = n_outputs_all;
+
     // set output mappings
     {
         bool sorted_output = true;
@@ -1103,9 +1106,6 @@ int llama_context::decode(llama_batch & inp_batch) {
         }
     }
 
-    // set to total number of outputs in the batch, for use in llama_get_logits_ith
-    n_outputs = n_outputs_all;
-
     // wait for the computation to finish (automatically done when obtaining the model output)
     //synchronize();
 
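The diff hoists the n_outputs = n_outputs_all; assignment (with its comment) from after the output-mapping block up to just after kv_guard.commit(), so the total output count is already set while the mappings are built. Below is a minimal, self-contained sketch of that set-the-count-before-building-the-mapping pattern; it is not llama.cpp's actual API: ctx_t, output_ids, and get_output_row are illustrative stand-ins, with get_output_row playing the role the comment assigns to llama_get_logits_ith (validating an index against n_outputs).

#include <cstdio>
#include <vector>

// Illustrative stand-in for the context object; not llama.cpp's real type.
struct ctx_t {
    int n_outputs = 0;            // total number of outputs in the current batch
    std::vector<int> output_ids;  // batch position -> output row

    // plays the role of llama_get_logits_ith: validate i against n_outputs
    int get_output_row(int i) const {
        if (i < 0 || i >= n_outputs) {
            return -1;  // out of range for this batch
        }
        return output_ids[i];
    }
};

int main() {
    ctx_t ctx;
    const int n_outputs_all = 3;

    // set to total number of outputs in the batch, *before* the mappings are built
    ctx.n_outputs = n_outputs_all;

    // set output mappings (identity here; the real code may sort/reorder)
    ctx.output_ids.resize(n_outputs_all);
    for (int i = 0; i < n_outputs_all; ++i) {
        ctx.output_ids[i] = i;
    }

    std::printf("row for output 2: %d\n", ctx.get_output_row(2));  // prints 2
    return 0;
}

Committing the count first means any index check performed while, or immediately after, the mapping is built sees the final value for this batch rather than a stale count left over from the previous one.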