refact : fix convert script + zero out KV cache to avoid nans

This commit is contained in:
Georgi Gerganov 2023-10-07 11:18:04 +03:00
parent 0e797c2fc5
commit bdbe11719d
No known key found for this signature in database
GPG key ID: 449E073F9DC10735
4 changed files with 28 additions and 78 deletions

View file

@@ -167,7 +167,7 @@ int main(int argc, char ** argv) {
// the max batch size is as large as the context to handle cases where we get very long input prompt from multiple
// users. regardless of the size, the main loop will chunk the batch into a maximum of params.n_batch tokens at a time
-llama_batch batch = llama_batch_init(params.n_ctx, 0);
+llama_batch batch = llama_batch_init(n_ctx, 0);
int32_t n_total_prompt = 0;
int32_t n_total_gen = 0;