context : do not clear output buffer on reserve (#13152)

Co-authored-by: pockers21 <liyang2@uniontech.com>
2025-08-16 05:02:58 -04:00 · 2025-04-28 06:45:40 -07:00
parent d2b2031e5f
commit fb0471d175
1 changed file with 0 additions and 2 deletions
--- a/src/llama-context.cpp
+++ b/src/llama-context.cpp
@@ -1536,8 +1536,6 @@ int32_t llama_context::output_reserve(int32_t n_outputs) {
    // set all ids as invalid (negative)
    std::fill(output_ids.begin(), output_ids.end(), -1);

-    ggml_backend_buffer_clear(buf_output.get(), 0);
-
    this->n_outputs     = 0;
    this->n_outputs_max = n_outputs_max;