Unverified commit 32de16ce, authored by Lianmin Zheng, committed by GitHub
Browse files

Fix streaming (#437)

parent 0992d85f
......@@ -20,15 +20,16 @@ class FinishReason(IntEnum):
LENGTH = auto()
STOP_STR = auto()
def to_str(self):
if self == FinishReason.EOS_TOKEN:
@staticmethod
def to_str(reason):
if reason == FinishReason.EOS_TOKEN:
return None
elif self == FinishReason.LENGTH:
elif reason == FinishReason.LENGTH:
return "length"
elif self == FinishReason.STOP_STR:
elif reason == FinishReason.STOP_STR:
return "stop"
else:
raise ValueError(f"Invalid finish reason: {self}")
return None
class Req:
......
......@@ -24,7 +24,7 @@ from sglang.srt.managers.io_struct import (
FlushCacheReq,
TokenizedGenerateReqInput,
)
from sglang.srt.managers.router.infer_batch import Batch, ForwardMode, Req
from sglang.srt.managers.router.infer_batch import Batch, ForwardMode, Req, FinishReason
from sglang.srt.managers.router.model_runner import ModelRunner
from sglang.srt.managers.router.radix_cache import RadixCache
from sglang.srt.managers.router.scheduler import Scheduler
......@@ -615,7 +615,7 @@ class ModelRpcServer:
+ len(req.output_ids)
- req.prompt_tokens,
"completion_tokens_wo_jump_forward": req.completion_tokens_wo_jump_forward,
"finish_reason": req.finish_reason.to_str(),
"finish_reason": FinishReason.to_str(req.finish_reason),
"hit_stop_str": req.hit_stop_str,
}
if req.return_logprob:
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment