diff --git a/common/common.h b/common/common.h index 286642db2..5536fd409 100644 --- a/common/common.h +++ b/common/common.h @@ -133,6 +133,7 @@ struct common_params_sampling { bool penalize_nl = false; // consider newlines as a repeatable token bool ignore_eos = false; bool no_perf = false; // disable performance metrics + bool timing_per_token = false; std::vector<std::string> dry_sequence_breakers = {"\n", ":", "\"", "*"}; // default sequence breakers for DRY diff --git a/examples/server/server.cpp b/examples/server/server.cpp index 179cf6192..a18489426 100644 --- a/examples/server/server.cpp +++ b/examples/server/server.cpp @@ -1269,6 +1269,7 @@ struct server_context { {"n_keep", slot.params.n_keep}, {"n_discard", slot.params.n_discard}, {"ignore_eos", slot.params.sampling.ignore_eos}, + {"timing_per_token", slot.params.sampling.timing_per_token}, {"stream", slot.params.stream}, //{"logit_bias", slot.params.sampling.logit_bias}, {"n_probs", slot.params.sampling.n_probs},