kv-cache : simplify + fix warning for recurrent models (#12756)

ggml-ci
This commit is contained in:
Georgi Gerganov
2025-04-04 21:48:10 +03:00
committed by GitHub
parent 1be76e4620
commit 3e1d29348b
4 changed files with 80 additions and 173 deletions

View File

@@ -15,7 +15,7 @@ public:
virtual void seq_add (llama_seq_id seq_id, llama_pos p0, llama_pos p1, llama_pos delta) = 0;
virtual void seq_div (llama_seq_id seq_id, llama_pos p0, llama_pos p1, int d) = 0;
-virtual llama_pos seq_pos_max(llama_seq_id seq_id) = 0;
+virtual llama_pos seq_pos_max(llama_seq_id seq_id) const = 0;
virtual bool get_can_edit() const = 0;
};