From 6556c90171ceb9719aab64214f3d2d456d7b045d Mon Sep 17 00:00:00 2001 From: Georgi Gerganov Date: Wed, 9 Oct 2024 09:12:34 +0300 Subject: [PATCH] server : update slot->prompt after restore --- examples/server/server.cpp | 3 +++ 1 file changed, 3 insertions(+) diff --git a/examples/server/server.cpp b/examples/server/server.cpp index b3773d256..39cc3c6f8 100644 --- a/examples/server/server.cpp +++ b/examples/server/server.cpp @@ -1778,6 +1778,9 @@ struct server_context { } slot->cache_tokens.resize(token_count); + // TODO: maybe detokenize the slot->cache_tokens instead? + slot->prompt = string_format("[restored %d tokens from file]", (int) token_count); + const int64_t t_end = ggml_time_us(); const double t_restore_ms = (t_end - t_start) / 1000.0;