server : do not speculate during prompt processing

ggml-ci
2024-12-24 10:24:35 +00:00 · 2024-12-03 10:58:43 +02:00 · 2024-12-03 10:58:43 +02:00 · 33d7b70c88
commit 33d7b70c88
parent 642330ac7c
1 changed files with 4 additions and 0 deletions
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -2322,6 +2322,10 @@ struct server_context {
                    continue;
                }

+                if (slot.state != SLOT_STATE_GENERATING) {
+                    continue;
+                }
+
                llama_token id = slot.sampled;

                struct common_speculative_params params_spec;