Unverified commit cb389c91, authored by Junlong Li and committed by GitHub
Browse files

Fix llava parallelism/fork bug (#315)

parent eddaa2b5
...@@ -73,9 +73,11 @@ class RuntimeEndpoint(BaseBackend): ...@@ -73,9 +73,11 @@ class RuntimeEndpoint(BaseBackend):
assert res.status_code == 200 assert res.status_code == 200
def commit_lazy_operations(self, s: StreamExecutor): def commit_lazy_operations(self, s: StreamExecutor):
data = {"text": s.text_, "sampling_params": {"max_new_tokens": 0}}
self._add_images(s, data)
res = http_request( res = http_request(
self.base_url + "/generate", self.base_url + "/generate",
json={"text": s.text_, "sampling_params": {"max_new_tokens": 0}}, json=data,
auth_token=self.auth_token, auth_token=self.auth_token,
api_key=self.api_key, api_key=self.api_key,
verify=self.verify, verify=self.verify,
......
...@@ -276,6 +276,7 @@ class StreamExecutor: ...@@ -276,6 +276,7 @@ class StreamExecutor:
exes[i].messages_ = list(self.messages_) exes[i].messages_ = list(self.messages_)
exes[i].cur_role = self.cur_role exes[i].cur_role = self.cur_role
exes[i].fork_start_text_pos = len(self.text_) exes[i].fork_start_text_pos = len(self.text_)
exes[i].images_ = list(self.images_)
return exes return exes
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment