Measure eval time only for single-token calls

This commit is contained in:
Georgi Gerganov 2023-03-22 07:22:51 +02:00
parent 71ed3d224d
commit a9f900b645
No known key found for this signature in database
GPG key ID: 449E073F9DC10735

View file

@@ -836,8 +836,11 @@ static bool llama_eval_internal(
ggml_free(ctx0);
// measure the performance only for the single-token evals
if (N == 1) {
lctx.t_eval_us += ggml_time_us() - t_start_us;
lctx.n_eval++;
}
return true;
}