llm: add back check for empty token cache

2024-04-30 17:38:44 -04:00 · 2024-04-30 17:38:44 -04:00 · fcf4d60eee
parent e33d5c2dbc
commit fcf4d60eee
1 changed file with 1 addition and 1 deletion
--- a/llm/ext_server/server.cpp
+++ b/llm/ext_server/server.cpp
@@ -1032,7 +1032,7 @@ struct llama_server_context
            slot.has_next_token = false;
        }
-        if (llama_token_is_eog(model, result.tok))
+        if (!slot.cache_tokens.empty() && llama_token_is_eog(model, result.tok))
        {
            slot.stopped_eos = true;
            slot.has_next_token = false;