Unverified Commit 4837543a authored by PanZezhong1725's avatar PanZezhong1725 Committed by GitHub
Browse files

Merge pull request #15 from InfiniTensor/issue/14

issue/14: 兼容openai协议
parents 897f5741 4fb73db2
......@@ -187,7 +187,7 @@ async def chat_stream(id_, request_data, request: Request):
chunk = json.dumps(
chunk_json(id_, content="", role="assistant"), ensure_ascii=False
)
yield f"{chunk}\n\n"
yield f"data: {chunk}\n\n"
request.app.state.request_queue.sync_q.put(infer_task)
......@@ -203,7 +203,7 @@ async def chat_stream(id_, request_data, request: Request):
chunk_json(id_, finish_reason=infer_task.finish_reason),
ensure_ascii=False,
)
yield f"{chunk}\n\n"
yield f"data: {chunk}\n\n"
break
token = await infer_task.output_queue.async_q.get()
......@@ -213,7 +213,7 @@ async def chat_stream(id_, request_data, request: Request):
.replace("<0x0A>", "\n")
)
chunk = json.dumps(chunk_json(id_, content=content), ensure_ascii=False)
yield f"{chunk}\n\n"
yield f"data: {chunk}\n\n"
except Exception as e:
print(f"[Error] ID : {id_} Exception: {e}")
......@@ -274,8 +274,8 @@ async def chat_completions(request: Request):
chat_stream(id_, data, request), media_type="text/event-stream"
)
else:
return JSONResponse(chat(id_, data))
response = await chat(id_, data, request)
return JSONResponse(content=response)
if __name__ == "__main__":
uvicorn.run(App, host="0.0.0.0", port=8000)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment