From 53dc399472d5bd35ee739b865e843b1996bd3814 Mon Sep 17 00:00:00 2001 From: Equim Date: Sat, 12 Aug 2023 06:35:14 +0800 Subject: [PATCH] server: fixed wrong variable name in timing json (#2579) * server: fixed wrong variable name in timing json * remove redundant entry --- examples/server/server.cpp | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/examples/server/server.cpp b/examples/server/server.cpp index 637f6d6c2..2340f93ac 100644 --- a/examples/server/server.cpp +++ b/examples/server/server.cpp @@ -1008,7 +1008,7 @@ static json format_timings(llama_server_context &llama) assert(timings.n_eval == llama.num_tokens_predicted); return json{ - {"prompt_n", timings.n_eval}, + {"prompt_n", timings.n_p_eval}, {"prompt_ms", timings.t_p_eval_ms}, {"prompt_per_token_ms", timings.t_p_eval_ms / timings.n_p_eval}, {"prompt_per_second", 1e3 / timings.t_p_eval_ms * timings.n_p_eval}, @@ -1037,7 +1037,6 @@ static json format_final_response(llama_server_context &llama, const std::string {"stopped_limit", llama.stopped_limit}, {"stopping_word", llama.stopping_word}, {"tokens_cached", llama.n_past}, - {"tokens_predicted", llama.num_tokens_predicted}, {"timings", format_timings(llama)}, };