"vscode:/vscode.git/clone" did not exist on "8e1cae5d668fb809f4470c681562e20aeffceda2"
Unverified commit 5e6c3265, authored by Yanyi Liu, committed by GitHub
Browse files

Support setting `use_thread` in the `run_program` for easier debugging. (#1823)


Co-authored-by: Byron Hsu <byronhsu1230@gmail.com>
parent 680cad20
......@@ -54,7 +54,14 @@ def run_internal(state, program, func_args, func_kwargs, sync):
def run_program(
program, backend, func_args, func_kwargs, default_sampling_para, stream, sync=False
program,
backend,
func_args,
func_kwargs,
default_sampling_para,
stream,
sync=False,
use_thread=True,
):
if hasattr(backend, "endpoint"):
backend = backend.endpoint
......@@ -67,6 +74,7 @@ def run_program(
chat_template=None,
stream=stream,
num_api_spec_tokens=program.num_api_spec_tokens,
use_thread=use_thread,
)
state = ProgramState(stream_executor)
......
......@@ -168,6 +168,7 @@ class SglFunction:
return_text_in_logprobs: Optional[bool] = None,
stream: bool = False,
backend=None,
use_thread: bool = True,
**kwargs,
):
from sglang.lang.interpreter import run_program
......@@ -195,7 +196,15 @@ class SglFunction:
return_text_in_logprobs=return_text_in_logprobs,
)
backend = backend or global_config.default_backend
return run_program(self, backend, args, kwargs, default_sampling_para, stream)
return run_program(
self,
backend,
args,
kwargs,
default_sampling_para,
stream,
use_thread=use_thread,
)
def run_batch(
self,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment