Measure eval time only for single-token calls

2023-03-22 07:22:51 +02:00 · 2023-03-22 07:22:51 +02:00 · a9f900b645
commit a9f900b645
parent 71ed3d224d
1 changed file with 5 additions and 2 deletions
--- a/llama.cpp
+++ b/llama.cpp
@@ -836,8 +836,11 @@ static bool llama_eval_internal(
    ggml_free(ctx0);
-    lctx.t_eval_us += ggml_time_us() - t_start_us;
+    // measure the performance only for the single-token evals
-    lctx.n_eval++;
+    if (N == 1) {
+        lctx.t_eval_us += ggml_time_us() - t_start_us;
+        lctx.n_eval++;
+    }
    return true;
 }