Commit fcf4d60e authored by jmorganca
Browse files

llm: add back check for empty token cache

parent e33d5c2d
@@ -1032,7 +1032,7 @@ struct llama_server_context
 slot.has_next_token = false;
 }
-if (llama_token_is_eog(model, result.tok))
+if (!slot.cache_tokens.empty() && llama_token_is_eog(model, result.tok))
 {
 slot.stopped_eos = true;
 slot.has_next_token = false;
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment