server : fix token duplication when streaming with stop strings (#10997)

2025-06-29 12:35:16 +00:00 · 2024-12-28 15:08:54 +00:00
parent d79d8f39b4
commit 16cdce7b68
1 changed file with 2 additions and 0 deletions
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -1856,6 +1856,8 @@ struct server_context {
                result.text_to_send = slot.generated_text.substr(pos, std::string::npos);
                slot.n_sent_text += result.text_to_send.size();
                // add the token to slot queue and cache
            } else {
                result.text_to_send = "";
            }
            slot.add_token(result);