alternate approach to replace end of text tokens

This commit is contained in:
rabidcopy 2023-03-20 17:45:52 -05:00 committed by GitHub
parent d9284a580c
commit 2479c78bc6
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23

View file

@@ -1001,6 +1001,12 @@ int main(int argc, char ** argv) {
t_sample_us += ggml_time_us() - t_start_sample_us; t_sample_us += ggml_time_us() - t_start_sample_us;
} }
// replace end of text token with newline token when in interactive mode
if (id == EOS_TOKEN_ID && params.interactive) {
id = NEWLINE_TOKEN_ID;
is_interacting = true;
}
// add it to the context // add it to the context
embd.push_back(id); embd.push_back(id);
@@ -1086,12 +1092,12 @@ int main(int argc, char ** argv) {
// end of text token // end of text token
if (embd.back() == EOS_TOKEN_ID) { if (embd.back() == EOS_TOKEN_ID) {
if (params.interactive) { if (params.interactive) {
is_interacting = true; // is_interacting = true;
embd.back() = NEWLINE_TOKEN_ID; // embd.back() = NEWLINE_TOKEN_ID;
last_n_tokens.back() = NEWLINE_TOKEN_ID; // last_n_tokens.back() = NEWLINE_TOKEN_ID;
if (params.antiprompt.size() != 0) { // if (params.antiprompt.size() != 0) {
fprintf(stderr, "\n"); // fprintf(stderr, "\n");
} // }
} else { } else {
fprintf(stderr, " [end of text]\n"); fprintf(stderr, " [end of text]\n");
break; break;