parallel : example for serving multiple users in parallel

This commit is contained in:
Georgi Gerganov 2023-09-18 20:30:05 +03:00
parent 1f17ea631c
commit 0161372b9a
No known key found for this signature in database
GPG key ID: 449E073F9DC10735
9 changed files with 262 additions and 13 deletions

View file

@@ -681,7 +681,7 @@ int main(int argc, char ** argv) {
return 1;
}
params.perplexity = true;
params.logits_all = true;
params.n_batch = std::min(params.n_batch, params.n_ctx);
if (params.ppl_stride > 0) {