Workaround for recalculating logits in cached prompts

This commit is contained in:
Danny Daemonic 2023-05-27 03:20:03 -07:00
parent bdbda1b17a
commit 573b690e16

View file

@ -360,6 +360,12 @@ int main(int argc, char ** argv) {
}
}
if (i > 0) {
// check if we've used up all the prompt but not all cached tokens
if (embd.size() == i && n_session_consumed < session_tokens.size()) {
// force re-evaluation of the last token to recalculate logits
i--;
n_past--;
}
embd.erase(embd.begin(), embd.begin() + i);
}
}