mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-08-25 09:38:35 -04:00
speculative : update default params (#11954)
* speculative : update default params
* speculative : do not discard the last drafted token
This commit is contained in:
@@ -9,7 +9,7 @@ struct common_speculative_params {
     int n_draft = 16;  // max drafted tokens
     int n_reuse = 256;

-    float p_min = 0.9f;  // min probability required to accept a token in the draft
+    float p_min = 0.75f; // min probability required to accept a token in the draft
 };

 struct common_speculative * common_speculative_init(struct llama_context * ctx_dft);
Reference in New Issue
Block a user