server : enable KV cache defrag by default (#10233)

ggml-ci
2025-08-19 14:31:06 -04:00 · 2024-11-11 08:38:43 +02:00
parent 4b3a9212b6
commit b141e5f6ef
2 changed files with 12 additions and 10 deletions
--- a/common/common.h
+++ b/common/common.h
@@ -178,7 +178,7 @@ struct common_params {
    float   yarn_beta_fast        = 32.0f; // YaRN low correction dim
    float   yarn_beta_slow        =  1.0f; // YaRN high correction dim
    int32_t yarn_orig_ctx         =     0; // YaRN original context length
-    float   defrag_thold          = -1.0f; // KV cache defragmentation threshold
+    float   defrag_thold          =  0.1f; // KV cache defragmentation threshold

    struct cpu_params cpuparams;
    struct cpu_params cpuparams_batch;