server: fixed wrong variable name in timing json (#2579)

* server: fixed wrong variable name in timing json * remove redundant entry
2024-12-24 10:24:35 +00:00 · 2023-08-12 06:35:14 +08:00 · 2023-08-12 06:35:14 +08:00 · 53dc399472
commit 53dc399472
parent 9ca4abed89
1 changed file with 1 addition and 2 deletions
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -1008,7 +1008,7 @@ static json format_timings(llama_server_context &llama)
    assert(timings.n_eval == llama.num_tokens_predicted);
    return json{
-        {"prompt_n", timings.n_eval},
+        {"prompt_n", timings.n_p_eval},
        {"prompt_ms", timings.t_p_eval_ms},
        {"prompt_per_token_ms", timings.t_p_eval_ms / timings.n_p_eval},
        {"prompt_per_second", 1e3 / timings.t_p_eval_ms * timings.n_p_eval},
@@ -1037,7 +1037,6 @@ static json format_final_response(llama_server_context &llama, const std::string
        {"stopped_limit", llama.stopped_limit},
        {"stopping_word", llama.stopping_word},
        {"tokens_cached", llama.n_past},
        {"tokens_predicted", llama.num_tokens_predicted},
        {"timings", format_timings(llama)},
    };