Merge branch 'master' into xsn/private_batch_api

2025-08-12 11:27:43 -04:00 · 2025-03-13 15:55:18 +01:00
parent 46596caf6d be7c303410
commit 17f954c8e2
173 changed files with 26425 additions and 16117 deletions
--- a/examples/llama-bench/llama-bench.cpp
+++ b/examples/llama-bench/llama-bench.cpp
@@ -1580,7 +1580,7 @@ int main(int argc, char ** argv) {

        test t(inst, lmodel, ctx);

-        llama_kv_cache_clear(ctx);
+        llama_kv_self_clear(ctx);

        // cool off before the test
        if (params.delay) {
@@ -1620,7 +1620,7 @@ int main(int argc, char ** argv) {
        }

        for (int i = 0; i < params.reps; i++) {
-            llama_kv_cache_clear(ctx);
+            llama_kv_self_clear(ctx);

            uint64_t t_start = get_time_ns();