Unverified commit 32de16ce, authored by Lianmin Zheng, committed by GitHub
Browse files

Fix streaming (#437)

parent 0992d85f
...@@ -20,15 +20,16 @@ class FinishReason(IntEnum): ...@@ -20,15 +20,16 @@ class FinishReason(IntEnum):
LENGTH = auto() LENGTH = auto()
STOP_STR = auto() STOP_STR = auto()
def to_str(self): @staticmethod
if self == FinishReason.EOS_TOKEN: def to_str(reason):
if reason == FinishReason.EOS_TOKEN:
return None return None
elif self == FinishReason.LENGTH: elif reason == FinishReason.LENGTH:
return "length" return "length"
elif self == FinishReason.STOP_STR: elif reason == FinishReason.STOP_STR:
return "stop" return "stop"
else: else:
raise ValueError(f"Invalid finish reason: {self}") return None
class Req: class Req:
......
...@@ -24,7 +24,7 @@ from sglang.srt.managers.io_struct import ( ...@@ -24,7 +24,7 @@ from sglang.srt.managers.io_struct import (
FlushCacheReq, FlushCacheReq,
TokenizedGenerateReqInput, TokenizedGenerateReqInput,
) )
from sglang.srt.managers.router.infer_batch import Batch, ForwardMode, Req from sglang.srt.managers.router.infer_batch import Batch, ForwardMode, Req, FinishReason
from sglang.srt.managers.router.model_runner import ModelRunner from sglang.srt.managers.router.model_runner import ModelRunner
from sglang.srt.managers.router.radix_cache import RadixCache from sglang.srt.managers.router.radix_cache import RadixCache
from sglang.srt.managers.router.scheduler import Scheduler from sglang.srt.managers.router.scheduler import Scheduler
...@@ -615,7 +615,7 @@ class ModelRpcServer: ...@@ -615,7 +615,7 @@ class ModelRpcServer:
+ len(req.output_ids) + len(req.output_ids)
- req.prompt_tokens, - req.prompt_tokens,
"completion_tokens_wo_jump_forward": req.completion_tokens_wo_jump_forward, "completion_tokens_wo_jump_forward": req.completion_tokens_wo_jump_forward,
"finish_reason": req.finish_reason.to_str(), "finish_reason": FinishReason.to_str(req.finish_reason),
"hit_stop_str": req.hit_stop_str, "hit_stop_str": req.hit_stop_str,
} }
if req.return_logprob: if req.return_logprob:
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment