llama : better n_batch and n_ubatch comment

2024-03-13 18:09:56 +01:00 · 2024-03-13 18:09:56 +01:00 · 9092883d58
commit 9092883d58
parent 3c38789f5b
1 changed file with 2 additions and 2 deletions
--- a/llama.h
+++ b/llama.h
@@ -234,8 +234,8 @@ extern "C" {
    struct llama_context_params {
        uint32_t seed;              // RNG seed, -1 for random
        uint32_t n_ctx;             // text context, 0 = from model
-        uint32_t n_batch;           // prompt processing maximum batch size (ignored if n_ubatch is not zero)
+        uint32_t n_batch;           // logical maximum batch size that can be submitted to llama_decode
-        uint32_t n_ubatch;          // prompt processing maximum batch size
+        uint32_t n_ubatch;          // physical maximum batch size
        uint32_t n_seq_max;         // max number of sequences (i.e. distinct states for recurrent models)
        uint32_t n_threads;         // number of threads to use for generation
        uint32_t n_threads_batch;   // number of threads to use for batch processing