server : do not speculate during prompt processing

ggml-ci
This commit is contained in:
Georgi Gerganov 2024-12-03 10:58:43 +02:00
parent 642330ac7c
commit 33d7b70c88
No known key found for this signature in database
GPG Key ID: 449E073F9DC10735

View File

@@ -2322,6 +2322,10 @@ struct server_context {
continue;
}
if (slot.state != SLOT_STATE_GENERATING) {
continue;
}
llama_token id = slot.sampled;
struct common_speculative_params params_spec;