From 332003584eb39bbd4465d69666033155e087ef46 Mon Sep 17 00:00:00 2001
From: xaedes
Date: Fri, 19 May 2023 18:41:06 +0200
Subject: [PATCH] sample with non-greedy sampling parameters at the end of training

---
 examples/baby-llama/baby-llama-text.cpp | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/examples/baby-llama/baby-llama-text.cpp b/examples/baby-llama/baby-llama-text.cpp
index 099863bb8..beacf4686 100644
--- a/examples/baby-llama/baby-llama-text.cpp
+++ b/examples/baby-llama/baby-llama-text.cpp
@@ -1712,9 +1712,12 @@ int main(int argc, char ** argv) {
     save_model(&model, fn_chkpt_out);
 
     {
-        int n_gen = 128;
+        int n_gen = 1024;
         int sample_ctx = n_tokens - n_tokens/8;
 
+        sampler.params.temp = 0.2;
+        sampler.params.repeat_penalty = 1.1;
+        sampler.params.mirostat = 2;
         init_sampler(&sampler, lctx);
 
         printf("Generating %d tokens.\n", n_gen);