Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
52e1f52f
"tests/python/common/test_subgraph.py" did not exist on "4c5136c8f8ded9087fd3aa75721b45db18e9b069"
Unverified
Commit
52e1f52f
authored
Aug 09, 2025
by
Trevor Morris
Committed by
GitHub
Aug 09, 2025
Browse files
[bugfix] Fix missing args in bench one batch (#8877)
parent
50188092
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
6 additions
and
0 deletions
+6
-0
python/sglang/bench_one_batch.py
python/sglang/bench_one_batch.py
+6
-0
No files found.
python/sglang/bench_one_batch.py
View file @
52e1f52f
...
@@ -61,6 +61,7 @@ from sglang.srt.configs.model_config import ModelConfig
...
@@ -61,6 +61,7 @@ from sglang.srt.configs.model_config import ModelConfig
from
sglang.srt.distributed.parallel_state
import
destroy_distributed_environment
from
sglang.srt.distributed.parallel_state
import
destroy_distributed_environment
from
sglang.srt.entrypoints.engine
import
_set_envs_and_config
from
sglang.srt.entrypoints.engine
import
_set_envs_and_config
from
sglang.srt.hf_transformers_utils
import
get_tokenizer
from
sglang.srt.hf_transformers_utils
import
get_tokenizer
from
sglang.srt.layers.moe.utils
import
DeepEPMode
,
MoeA2ABackend
from
sglang.srt.managers.schedule_batch
import
Req
,
ScheduleBatch
from
sglang.srt.managers.schedule_batch
import
Req
,
ScheduleBatch
from
sglang.srt.managers.scheduler
import
Scheduler
from
sglang.srt.managers.scheduler
import
Scheduler
from
sglang.srt.model_executor.forward_batch_info
import
ForwardBatch
from
sglang.srt.model_executor.forward_batch_info
import
ForwardBatch
...
@@ -300,6 +301,11 @@ def _maybe_prepare_mlp_sync_batch(batch: ScheduleBatch, model_runner):
...
@@ -300,6 +301,11 @@ def _maybe_prepare_mlp_sync_batch(batch: ScheduleBatch, model_runner):
disable_cuda_graph
=
model_runner
.
server_args
.
disable_cuda_graph
,
disable_cuda_graph
=
model_runner
.
server_args
.
disable_cuda_graph
,
spec_algorithm
=
SpeculativeAlgorithm
.
NONE
,
spec_algorithm
=
SpeculativeAlgorithm
.
NONE
,
speculative_num_draft_tokens
=
None
,
speculative_num_draft_tokens
=
None
,
enable_two_batch_overlap
=
model_runner
.
server_args
.
enable_two_batch_overlap
,
enable_deepep_moe
=
MoeA2ABackend
(
model_runner
.
server_args
.
moe_a2a_backend
).
is_deepep
(),
deepep_mode
=
DeepEPMode
(
model_runner
.
server_args
.
deepep_mode
),
require_mlp_tp_gather
=
require_mlp_tp_gather
(
model_runner
.
server_args
),
require_mlp_tp_gather
=
require_mlp_tp_gather
(
model_runner
.
server_args
),
disable_overlap_schedule
=
model_runner
.
server_args
.
disable_overlap_schedule
,
disable_overlap_schedule
=
model_runner
.
server_args
.
disable_overlap_schedule
,
)
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment