mirror of
https://github.com/ikawrakow/ik_llama.cpp.git
synced 2026-06-28 04:30:15 -05:00
Reset i_last when a low acceptance streak occurs (#1701)
When a low acceptance streak triggers a reset of the speculative map, also reset i_last to zero so that the current context is included when the map is rebuilt.
This commit is contained in:
parent
fb07c1e6e5
commit
0a167082a3
@ -693,6 +693,7 @@ struct common_speculative_state_ngram_mod : public common_speculative_state {
|
||||
|
||||
mod.reset();
|
||||
n_low = 0;
|
||||
i_last = 0;
|
||||
}
|
||||
} else {
|
||||
n_low = 0;
|
||||
@ -1459,4 +1460,4 @@ void mtp_accept_tokens(
|
||||
mtp_update_kv_cache(ctx, accepted_batch, false);
|
||||
|
||||
llama_batch_free(accepted_batch);
|
||||
}
|
||||
}
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user