Mirror of https://github.com/ggml-org/llama.cpp.git, synced 2025-07-20 17:49:18 +00:00
context : add get_ctx_padding()
ggml-ci
@@ -84,8 +84,11 @@ struct llama_context {
             ggml_cgraph * graph,
                    bool   batched);
 
     // max token position across all sequences in the current context
     llama_pos pos_max() const;
+
+    uint32_t get_ctx_padding(const llama_cparams & cparams) const;
+
     void reset();
 
     void prepare_k_shift();
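The hunk above only shows the new declaration of get_ctx_padding(). As a rough sketch of what such a helper typically returns, assuming it follows the KV-cache padding rule that already exists elsewhere in llama.cpp (a coarser padding when flash attention is enabled), the body could look roughly like the following; the names below are illustrative and not taken from this commit:

    // Illustrative sketch only -- the commit above does not show the function body.
    // The values mirror llama.cpp's existing KV-cache padding convention:
    // flash-attention kernels prefer a larger padding to avoid extra runtime
    // boundary checks.
    #include <cstdint>

    struct llama_cparams_sketch {
        bool flash_attn = false; // other context parameters omitted
    };

    inline uint32_t get_ctx_padding_sketch(const llama_cparams_sketch & cparams) {
        return cparams.flash_attn ? 256u : 32u;
    }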