Unverified commit 4fd9d490, authored by spike-zhu and committed by GitHub
Browse files

issue/71: support vllm benchmark text completion in InfiniLM

parent 1c710c19
...@@ -98,6 +98,7 @@ def chunk_json(id_, content=None, role=None, finish_reason=None): ...@@ -98,6 +98,7 @@ def chunk_json(id_, content=None, role=None, finish_reason=None):
"choices": [ "choices": [
{ {
"index": 0, "index": 0,
"text": content,
"delta": delta, "delta": delta,
"logprobs": None, "logprobs": None,
"finish_reason": finish_reason, "finish_reason": finish_reason,
...@@ -275,9 +276,15 @@ async def chat(id_, request_data, request: Request): ...@@ -275,9 +276,15 @@ async def chat(id_, request_data, request: Request):
@App.post("/chat/completions") @App.post("/chat/completions")
async def chat_completions(request: Request): async def chat_completions(request: Request):
data = await request.json() data = await request.json()
print('-----------------------------------------')
print(data)
print('-----------------------------------------')
if not data.get("messages"): if not data.get("messages"):
return JSONResponse(content={"error": "No message provided"}, status_code=400) if not data.get("prompt"):
return JSONResponse(content={"error": "No message provided"}, status_code=400)
else:
data['messages'] = [{"role": "user", "content": data.get("prompt")}]
stream = data.get("stream", False) stream = data.get("stream", False)
id_ = f"cmpl-{uuid.uuid4().hex}" id_ = f"cmpl-{uuid.uuid4().hex}"
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment