fix: Fix wrong bool condition for split equal in hybrid cache

Branch: HybridRecurrentCache
Signed-off-by: Gabe Goodhart <ghart@us.ibm.com>
2025-09-04 06:15:41 -04:00 · 2025-05-28 11:02:54 -06:00
parent 423c89401d
commit 6c6ec0003a
1 changed file with 1 addition and 1 deletion
--- a/src/llama-kv-cache-hybrid-recurrent.cpp
+++ b/src/llama-kv-cache-hybrid-recurrent.cpp
@@ -96,7 +96,7 @@ llama_pos llama_kv_cache_hybrid_recurrent::seq_pos_max(llama_seq_id seq_id) cons
 llama_memory_state_ptr llama_kv_cache_hybrid_recurrent::init_batch(const llama_batch & batch, uint32_t n_ubatch, bool embd_pooled, bool logits_all) {

    // since this includes a recurrent cache, we cannot use split_simple
-    auto sbatch = llama_sbatch(batch, hparams.n_embd, true, logits_all);
+    auto sbatch = llama_sbatch(batch, hparams.n_embd, false, logits_all);

    // follow the recurrent pattern for creating the ubatch splits
    std::vector<llama_ubatch> ubatches;