kv-cache : simplify the interface (#13660)

* kv-cache : simplify the interface

ggml-ci

* context : revert llama_batch_allocr position change

ggml-ci
2025-08-17 21:51:27 -04:00 · 2025-05-21 15:11:13 +03:00
parent b44890df2e
commit 797f2ac062
9 changed files with 89 additions and 153 deletions
--- a/src/llama-batch.cpp
+++ b/src/llama-batch.cpp
@@ -1,5 +1,6 @@
 #include "llama-batch.h"

+#include <cassert>
 #include <cstring>
 #include <algorithm>

@@ -281,9 +282,10 @@ llama_batch_allocr::llama_batch_allocr(struct llama_batch in_batch, llama_pos p0
    batch = in_batch;
    GGML_ASSERT(batch.n_tokens > 0);
    if (!batch.pos) {
+        assert(p0 >= 0);
        pos.resize(batch.n_tokens);
        for (int32_t i = 0; i < batch.n_tokens; i++) {
-            pos[i] = i + p0;
+            pos[i] = p0 + i;
        }
        batch.pos = pos.data();
    }