This commit is contained in:
eiery 2023-04-20 17:06:34 -04:00
parent 4b781c2055
commit c6dfc44a37

View file

@@ -21,7 +21,7 @@ struct gpt_params {
int32_t n_parts = -1; // amount of model parts (-1 = determine from model dimensions)
int32_t n_ctx = 512; // context size
#if defined(GGML_USE_ACCELERATE) || defined(GGML_USE_OPENBLAS) || defined (GGML_USE_CUBLAS)
-int32_t n_batch = 512; // batch size for prompt processing (must be >=32 to use BLAS)
+int32_t n_batch = 512; // batch size for prompt processing (must be >=32 to use BLAS)
#else
int32_t n_batch = 8; // batch size for prompt processing
#endif