mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2024-12-28 12:24:35 +00:00
This commit is contained in:
parent
d9fb3b2e01
commit
c8880e786c
@@ -170,7 +170,7 @@ llama_tokens common_speculative_gen_draft(
|
|||||||
for (int i = reuse_i + reuse_n + 1; i < (int) prompt.size(); ++i) {
|
for (int i = reuse_i + reuse_n + 1; i < (int) prompt.size(); ++i) {
|
||||||
result.push_back(prompt[i]);
|
result.push_back(prompt[i]);
|
||||||
|
|
||||||
if (result.size() >= params.n_draft) {
|
if (params.n_draft <= (int) result.size()) {
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
Loading…
Reference in New Issue
Block a user