llama : minor sampling refactor (2) (#9386)

2025-08-12 03:21:10 -04:00 · 2024-09-09 17:10:46 +02:00
parent 38ca6f644b
commit 5fb5e24811
12 changed files with 115 additions and 113 deletions
--- a/examples/batched/batched.cpp
+++ b/examples/batched/batched.cpp
@@ -172,8 +172,6 @@ int main(int argc, char ** argv) {

            const llama_token new_token_id = llama_sampler_sample(smpl, ctx, i_batch[i]);

-            llama_sampler_accept(smpl, new_token_id);
-
            // is it an end of generation? -> mark the stream as finished
            if (llama_token_is_eog(model, new_token_id) || n_cur == n_predict) {
                i_batch[i] = -1;