fix instruct mode (#445)
Changes to the EOS behavior in interactive mode and reverse-prompt handling broke instruct mode by erroneously injecting instruct mode's reverse prompt and an extra newline.
commit 863f65e2e3
parent afd220d9c6

1 changed file with 7 additions and 3 deletions
main.cpp

@@ -387,7 +387,7 @@ int main(int argc, char ** argv) {
             }
 
             // replace end of text token with newline token when in interactive mode
-            if (id == llama_token_eos() && params.interactive) {
+            if (id == llama_token_eos() && params.interactive && !params.instruct) {
                 id = llama_token_newline.front();
                 if (params.antiprompt.size() != 0) {
                     // tokenize and inject first reverse prompt

@@ -488,9 +488,13 @@ int main(int argc, char ** argv) {
 
         // end of text token
         if (embd.back() == llama_token_eos()) {
-            fprintf(stderr, " [end of text]\n");
-            break;
+            if (params.instruct) {
+                is_interacting = true;
+            } else {
+                fprintf(stderr, " [end of text]\n");
+                break;
+            }
         }
 
         // In interactive mode, respect the maximum number of tokens and drop back to user input when reached.
         if (params.interactive && remaining_tokens <= 0) {
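To make the net effect easier to read, here is a condensed sketch of the EOS handling as it stands after this patch. It is assembled from the two hunks above, not a verbatim excerpt: the enclosing generation loop, the sampling code, and the reverse-prompt tokenization body are elided, and the identifiers (id, embd, params, is_interacting, llama_token_newline) are those used in main.cpp at this commit.

// Condensed sketch (not a verbatim excerpt) of EOS handling after this patch.

// 1) While sampling: only plain interactive mode swaps EOS for a newline and
//    injects the first reverse prompt. Instruct mode now skips this branch,
//    which is what stopped the erroneous reverse prompt / extra newline.
if (id == llama_token_eos() && params.interactive && !params.instruct) {
    id = llama_token_newline.front();
    if (params.antiprompt.size() != 0) {
        // tokenize and inject first reverse prompt (body elided)
    }
}

// 2) When output ends with EOS: instruct mode returns control to the user
//    instead of printing "[end of text]" and leaving the generation loop.
if (embd.back() == llama_token_eos()) {
    if (params.instruct) {
        is_interacting = true;   // drop back to user input
    } else {
        fprintf(stderr, " [end of text]\n");
        break;                   // terminate generation
    }
}

In other words, instruct mode now treats EOS purely as an end-of-turn signal: generation pauses and waits for the next instruction, with no tokens injected on the model's behalf.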