Update server.cpp

This commit is contained in:
Maximilian Winter 2024-01-26 22:54:26 +01:00
parent edc2c08943
commit 960cfb003f

View file

@@ -1611,7 +1611,7 @@ struct llama_server_context
std::vector<int32_t> slot_npasts;
for (auto & slot : slots)
{
-slot_npasts.emplace_back(slot.n_past);
+slot_npasts.emplace_back(0);
}
for (int32_t i = 0; i < (int32_t) batch.n_tokens; i += n_batch)