rerank : use [SEP] token instead of [BOS] (#9737)

* rerank : use [SEP] token instead of [BOS] ggml-ci
* common : sanity check for non-NULL tokens ggml-ci
* ci : adjust rank score interval ggml-ci
* ci : add shebang to run.sh ggml-ci
2025-06-27 03:55:20 +00:00 · 2024-10-05 15:55:04 +03:00
parent 58b16695e1
commit 8c475b97b8
5 changed files with 45 additions and 16 deletions
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -2027,7 +2027,7 @@ struct server_context {
                                continue;
                            }

-                            // prompt: <s>query</s><s>doc</s>
+                            // prompt: [BOS]query[EOS][SEP]doc[EOS]
                            prompt_tokens.clear();
                            prompt_tokens.push_back(llama_token_bos(model));
                            {
@@ -2035,7 +2035,7 @@ struct server_context {
                                prompt_tokens.insert(prompt_tokens.end(), part.begin(), part.end());
                            }
                            prompt_tokens.push_back(llama_token_eos(model));
-                            prompt_tokens.push_back(llama_token_bos(model));
+                            prompt_tokens.push_back(llama_token_sep(model));
                            {
                                const auto part = tokenize(slot.prompt[1], false);
                                prompt_tokens.insert(prompt_tokens.end(), part.begin(), part.end());