Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
8221f9ae
Unverified
Commit
8221f9ae
authored
Oct 15, 2025
by
Liangsheng Yin
Committed by
GitHub
Oct 15, 2025
Browse files
Tiny cleanup some eagle unused codes (#11660)
parent
ab9187a2
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
0 additions
and
9 deletions
+0
-9
python/sglang/srt/speculative/draft_utils.py
python/sglang/srt/speculative/draft_utils.py
+0
-4
python/sglang/srt/speculative/eagle_draft_cuda_graph_runner.py
...n/sglang/srt/speculative/eagle_draft_cuda_graph_runner.py
+0
-1
python/sglang/srt/speculative/eagle_worker.py
python/sglang/srt/speculative/eagle_worker.py
+0
-4
No files found.
python/sglang/srt/speculative/draft_utils.py
View file @
8221f9ae
...
...
@@ -96,7 +96,6 @@ class DraftBackendFactory:
FlashInferMultiStepDraftBackend
,
)
self
.
has_prefill_wrapper_verify
=
True
return
FlashInferMultiStepDraftBackend
(
self
.
draft_model_runner
,
self
.
topk
,
self
.
speculative_num_steps
)
...
...
@@ -105,7 +104,6 @@ class DraftBackendFactory:
FlashInferMLAMultiStepDraftBackend
,
)
self
.
has_prefill_wrapper_verify
=
True
return
FlashInferMLAMultiStepDraftBackend
(
self
.
draft_model_runner
,
self
.
topk
,
self
.
speculative_num_steps
)
...
...
@@ -149,7 +147,6 @@ class DraftBackendFactory:
TRTLLMHAAttnMultiStepDraftBackend
,
)
self
.
has_prefill_wrapper_verify
=
True
return
TRTLLMHAAttnMultiStepDraftBackend
(
self
.
draft_model_runner
,
self
.
topk
,
self
.
speculative_num_steps
)
...
...
@@ -164,7 +161,6 @@ class DraftBackendFactory:
TRTLLMMLAMultiStepDraftBackend
,
)
self
.
has_prefill_wrapper_verify
=
True
return
TRTLLMMLAMultiStepDraftBackend
(
self
.
draft_model_runner
,
self
.
topk
,
self
.
speculative_num_steps
)
...
...
python/sglang/srt/speculative/eagle_draft_cuda_graph_runner.py
View file @
8221f9ae
...
...
@@ -41,7 +41,6 @@ class EAGLEDraftCudaGraphRunner:
# Parse args
self
.
eagle_worker
=
eagle_worker
self
.
model_runner
=
model_runner
=
eagle_worker
.
model_runner
self
.
model_runner
:
EAGLEWorker
self
.
graphs
=
{}
self
.
output_buffers
=
{}
self
.
enable_torch_compile
=
model_runner
.
server_args
.
enable_torch_compile
...
...
python/sglang/srt/speculative/eagle_worker.py
View file @
8221f9ae
...
...
@@ -192,10 +192,6 @@ class EAGLEWorker(TpModelWorker):
def
init_attention_backend
(
self
):
# Create multi-step attn backends and cuda graph runners
self
.
has_prefill_wrapper_verify
=
False
self
.
draft_extend_attn_backend
=
None
draft_backend_factory
=
DraftBackendFactory
(
self
.
server_args
,
self
.
draft_model_runner
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment