Mirror of https://github.com/ggml-org/llama.cpp.git (synced 2025-06-27 03:55:20 +00:00)
Server: fix seed for multiple slots (#6835)
* Server: add tests for consistent results
* sampling: separate rng per sampling context
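The second point is the core of the fix: instead of every server slot drawing from the llama_context's single global RNG, each sampling context carries its own RNG seeded per slot, so concurrent requests with different seeds produce independent, reproducible token streams. Below is a minimal standalone sketch of that idea; the struct and member names are illustrative only, not the actual llama.cpp types.

    #include <cstdint>
    #include <random>
    #include <vector>

    // Hypothetical per-slot sampling state: each instance owns its RNG,
    // so sampling in one slot never disturbs the RNG state of another.
    struct sampling_context {
        std::mt19937 rng;  // per-context RNG, seeded independently per slot

        explicit sampling_context(uint32_t seed) : rng(seed) {}

        // Draw one token index from a probability distribution using only
        // this context's RNG.
        int sample(const std::vector<float> & probs) {
            std::discrete_distribution<int> dist(probs.begin(), probs.end());
            return dist(rng);
        }
    };

    int main() {
        // Two server "slots" with distinct seeds sample independently and
        // reproducibly, regardless of how their requests interleave.
        sampling_context slot0(42);
        sampling_context slot1(1337);

        const std::vector<float> probs = {0.1f, 0.2f, 0.3f, 0.4f};
        int t0 = slot0.sample(probs);
        int t1 = slot1.sample(probs);
        (void) t0;
        (void) t1;
        return 0;
    }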
@@ -240,7 +240,6 @@ int main(int argc, char ** argv) {
                 return 1;
             }
             session_tokens.resize(n_token_count_out);
-            llama_set_rng_seed(ctx, params.seed);
             LOG_TEE("%s: loaded a session with prompt size of %d tokens\n", __func__, (int)session_tokens.size());
         }
     }
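This hunk drops the explicit llama_set_rng_seed(ctx, params.seed) call after a saved session is restored: with the seed now applied to the sampling context's own RNG, reseeding the global context RNG at this point is no longer needed.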