server : batch has to be allocated for n_parallel sequences

2024-12-26 11:24:35 +00:00 · 2023-10-20 20:42:45 +03:00 · 2023-10-20 20:42:45 +03:00 · 113dd60005
commit 113dd60005
parent 6b2437e32d
1 changed file with 3 additions and 1 deletion
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -631,7 +631,9 @@ struct llama_server_context
            LOG_TEE(" -> Slot %i - max context: %i\n", slot.id, max_ctx_per_slot);
            slots.push_back(slot);
        }
-        batch = llama_batch_init(n_ctx, 0, 1);
+
+        batch = llama_batch_init(n_ctx, 0, params.n_parallel);
+
        // empty system prompt
        system_prompt = "";
        num_tokens_system = 0;