Skip to content

Commit 6028879

Browse files
committed
parallel : print misses on each request
1 parent eed3fd4 commit 6028879

File tree

1 file changed

+2
-4
lines changed

1 file changed

+2
-4
lines changed

examples/parallel/parallel.cpp

Lines changed: 2 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -326,12 +326,10 @@ int main(int argc, char ** argv) {
326 326
327 327   const auto t_main_end = ggml_time_us();
328 328
329     - LOG_TEE("\033[1mClient %3d, seq %4d, prompt %4d t, response %4d t, time %5.2f s, speed: PP %5.2f t/s, TG %5.2f t/s, AVG %5.2f t/s \033[0m: \n\nInput: %s\nResponse: %s\n\n",
    329 + LOG_TEE("\033[1mClient %3d, seq %4d, prompt %4d t, response %4d t, time %5.2f s, cache miss %d \033[0m: \n\nInput: %s\nResponse: %s\n\n",
330 330   client.id, client.seq_id, client.n_prompt, client.n_decoded,
331 331   (t_main_end - client.t_start_prompt) / 1e6,
332     - (double) (client.n_prompt ) / (client.t_start_gen - client.t_start_prompt) * 1e6,
333     - (double) (client.n_decoded ) / (t_main_end - client.t_start_gen) * 1e6,
334     - (double) (client.n_decoded + client.n_prompt) / (t_main_end - client.t_start_prompt) * 1e6,
    332 + n_cache_miss,
335 333   ::trim(client.input).c_str(),
336 334   ::trim(client.response).c_str());
337 335
0 commit comments

Comments
 (0)