llama : auto-batch preparation (#13845)

* llama : auto-batch ggml-ci * context : simplify if branching
2025-07-28 21:23:55 -04:00 · 2025-05-31 12:55:57 +03:00
parent 51fa76f172
commit 3f55f781f1
5 changed files with 67 additions and 54 deletions
--- a/src/llama-context.h
+++ b/src/llama-context.h
@@ -50,8 +50,9 @@ struct llama_context {
          llama_kv_cache * get_kv_self();
    const llama_kv_cache * get_kv_self() const;

+    // return true if the KV cache was updated
    // TODO: remove
-    void kv_self_update();
+    bool kv_self_update();

    enum llama_pooling_type pooling_type() const;