mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-06-28 12:25:03 +00:00
speculative : fix seg fault in certain cases (#12454)
This commit is contained in:
@ -331,11 +331,11 @@ int main(int argc, char ** argv) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
active_seqs.erase(s);
|
active_seqs.erase(s);
|
||||||
for(int i = 0; i < n_seq_dft; i++) {
|
for (int i = 0; i < n_seq_dft; i++) {
|
||||||
if (i == s) {
|
if (i == s) {
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
if (drafts[i].tokens[i_dft] == drafts[s].tokens[i_dft]) {
|
if (drafts[i].active && drafts[i].tokens[i_dft] == drafts[s].tokens[i_dft]) {
|
||||||
// synchronize active status for sequences with the same drafted token
|
// synchronize active status for sequences with the same drafted token
|
||||||
drafts[i].active = drafts[i].active && accept;
|
drafts[i].active = drafts[i].active && accept;
|
||||||
if (!drafts[i].active) {
|
if (!drafts[i].active) {
|
||||||
|
Reference in New Issue
Block a user