server : fix incorrect usage of llama_get_embeddings() (#14225)

* server : fix incorrect usage of llama_get_embeddings()
  ggml-ci
* cont : fix the fix
  ggml-ci
2025-06-26 11:45:21 +00:00 · 2025-06-16 22:33:27 +03:00
parent 6adc3c3ebc
commit 89fea80d29
2 changed files with 11 additions and 10 deletions
--- a/include/llama.h
+++ b/include/llama.h
@@ -965,6 +965,7 @@ extern "C" {
    LLAMA_API int32_t llama_n_threads_batch(struct llama_context * ctx);

    // Set whether the context outputs embeddings or not
+    // TODO: rename to avoid confusion with llama_get_embeddings()
    LLAMA_API void llama_set_embeddings(struct llama_context * ctx, bool embeddings);

    // Set whether to use causal attention or not