Unverified Commit 18d9a7e1 authored by Jeffrey Morgan's avatar Jeffrey Morgan Committed by GitHub
Browse files

update llama.cpp submodule to `f364eb6` (#4060)

parent 8488388c
...@@ -1032,7 +1032,7 @@ struct llama_server_context ...@@ -1032,7 +1032,7 @@ struct llama_server_context
slot.has_next_token = false; slot.has_next_token = false;
} }
if (!slot.cache_tokens.empty() && result.tok == llama_token_eos(model)) if (llama_token_is_eog(model, result.tok))
{ {
slot.stopped_eos = true; slot.stopped_eos = true;
slot.has_next_token = false; slot.has_next_token = false;
...@@ -1144,12 +1144,15 @@ struct llama_server_context ...@@ -1144,12 +1144,15 @@ struct llama_server_context
res.result_json = json res.result_json = json
{ {
{"content", tkn.text_to_send},
{"stop", false}, {"stop", false},
{"slot_id", slot.id}, {"slot_id", slot.id},
{"multimodal", multimodal} {"multimodal", multimodal}
}; };
if (!llama_token_is_eog(model, tkn.tok)) {
res.result_json["content"] = tkn.text_to_send;
}
if (slot.sparams.n_probs > 0) if (slot.sparams.n_probs > 0)
{ {
std::vector<completion_token_output> probs_output = {}; std::vector<completion_token_output> probs_output = {};
......
Subproject commit f4ab2a41476600a98067a9474ea8f9e6db41bcfa Subproject commit f364eb6fb5d46118a76fa045f487318de4c24961
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment