From 132f55795e51094954f1b1f647f97648be724a3a Mon Sep 17 00:00:00 2001
From: compilade
Date: Mon, 15 Apr 2024 08:56:55 -0400
Subject: [PATCH] llama : fix restoring the number of outputs from state files (#6687)

---
 llama.cpp | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/llama.cpp b/llama.cpp
index cf95cea14..a5ef2fd8f 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -15478,6 +15478,8 @@ size_t llama_state_set_data(struct llama_context * ctx, const uint8_t * src) {
                 GGML_ASSERT((uint32_t) id < ctx->cparams.n_batch);
                 ctx->output_ids[id] = i;
             }
+
+            ctx->n_outputs = n_outputs;
         }
     }
 