mirror of
https://github.com/jart/cosmopolitan.git
synced 2025-02-07 06:53:33 +00:00
Make llama.com n_predict be -1 by default
This commit is contained in:
parent
ca19ecf49c
commit
bbfe4fbd11
1 changed file with 1 addition and 1 deletion
2
third_party/ggml/common.h
vendored
2
third_party/ggml/common.h
vendored
|
@@ -22,7 +22,7 @@ struct gpt_params {
|
|||
int32_t seed = -1; // RNG seed
|
||||
int32_t verbose = 0; // Logging verbosity
|
||||
int32_t n_threads = std::min(1, (int)(_getcpucount() * 0.75));
|
||||
-    int32_t n_predict = 128; // new tokens to predict
|
||||
+    int32_t n_predict = -1; // new tokens to predict
|
||||
int32_t n_parts = -1; // amount of model parts (-1 = determine from model dimensions)
|
||||
int32_t n_ctx = 512; // context size
|
||||
int32_t n_batch = 64; // batch size for prompt processing (must be >=32 to use BLAS)
|
||||
|
|
Loading…
Reference in a new issue