From 3ae86704e698c2003b729b17771d8646462b6b80 Mon Sep 17 00:00:00 2001
From: Georgi Gerganov
Date: Fri, 11 Oct 2024 09:16:00 +0300
Subject: [PATCH] server : update prompt on slot restore (#9800)

---
 examples/server/server.cpp | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/examples/server/server.cpp b/examples/server/server.cpp
index c6e7c140f..314a506a1 100644
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -1778,6 +1778,9 @@ struct server_context {
                     }
                     slot->cache_tokens.resize(token_count);
 
+                    // TODO: maybe detokenize the slot->cache_tokens instead?
+                    slot->prompt = string_format("[restored %d tokens from file]", (int) token_count);
+
                     const int64_t t_end = ggml_time_us();
                     const double t_restore_ms = (t_end - t_start) / 1000.0;
 