Measure eval time only for single-token calls

2023-03-22 07:22:51 +02:00 · 2023-03-22 07:22:51 +02:00 · a9f900b645
commit a9f900b645
parent 71ed3d224d
1 changed file with 5 additions and 2 deletions
--- a/llama.cpp
+++ b/llama.cpp
@@ -836,8 +836,11 @@ static bool llama_eval_internal(

    ggml_free(ctx0);

+    // measure the performance only for the single-token evals
+    if (N == 1) {
        lctx.t_eval_us += ggml_time_us() - t_start_us;
        lctx.n_eval++;
+    }

    return true;
 }