fix(llama.cpp): fix eos without cache (#1852)

commit fa9e330fc6
parent b202bfaaa0
Author: Ettore Di Giacinto
Date:   2024-03-18 18:59:24 +01:00
Committed by: GitHub


@@ -1084,7 +1084,7 @@ struct llama_server_context
         slot.has_next_token = false;
     }
-    if (!slot.cache_tokens.empty() && result.tok == llama_token_eos(model))
+    if (result.tok == llama_token_eos(model))
    {
        slot.stopped_eos = true;
        slot.has_next_token = false;
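
The change drops the `!slot.cache_tokens.empty()` guard: previously, when a slot had no cached tokens (for example, running without a prompt cache), sampling an end-of-sequence token never set `stopped_eos`, so generation did not stop on EOS. The fix checks the sampled token unconditionally.

For illustration, a minimal self-contained sketch of the corrected stopping check. The `Slot` struct and `check_stop` helper here are hypothetical stand-ins for the server's slot handling; only the `cache_tokens`, `stopped_eos`, and `has_next_token` fields and the EOS comparison come from the diff itself.

#include <vector>

struct Slot {
    std::vector<int> cache_tokens;   // may be empty when no prompt cache is kept
    bool stopped_eos    = false;
    bool has_next_token = true;
};

void check_stop(Slot &slot, int sampled_tok, int eos_tok) {
    // Before the fix, this check also required !slot.cache_tokens.empty(),
    // so an empty cache masked the EOS token and generation kept running.
    if (sampled_tok == eos_tok) {
        slot.stopped_eos    = true;
        slot.has_next_token = false;
    }
}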