mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-04-19 17:12:10 +08:00
speculative : fix seg fault in certain cases (#12454)
This commit is contained in:
parent
99aa304fb9
commit
c6af2161b2
@@ -331,11 +331,11 @@ int main(int argc, char ** argv) {
|
||||
}
|
||||
|
||||
active_seqs.erase(s);
|
||||
for(int i = 0; i < n_seq_dft; i++) {
|
||||
for (int i = 0; i < n_seq_dft; i++) {
|
||||
if (i == s) {
|
||||
continue;
|
||||
}
|
||||
if (drafts[i].tokens[i_dft] == drafts[s].tokens[i_dft]) {
|
||||
if (drafts[i].active && drafts[i].tokens[i_dft] == drafts[s].tokens[i_dft]) {
|
||||
// synchronize active status for sequences with the same drafted token
|
||||
drafts[i].active = drafts[i].active && accept;
|
||||
if (!drafts[i].active) {
|
||||
|
Loading…
x
Reference in New Issue
Block a user