Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
24f7cb1e
Unverified
Commit
24f7cb1e
authored
Sep 29, 2025
by
Zhihao Zhang
Committed by
GitHub
Sep 28, 2025
Browse files
[speculative decoding] rename lookahead to ngram (#11010)
Co-authored-by:
a4zhangfei
<
a4zhangfei@qq.com
>
parent
e05555fa
Changes
22
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
4 additions
and
4 deletions
+4
-4
test/srt/run_suite.py
test/srt/run_suite.py
+1
-1
test/srt/test_ngram_speculative_decoding.py
test/srt/test_ngram_speculative_decoding.py
+3
-3
No files found.
test/srt/run_suite.py
View file @
24f7cb1e
...
...
@@ -79,7 +79,7 @@ suites = {
TestFile
(
"test_hidden_states.py"
,
55
),
TestFile
(
"test_hybrid_attn_backend.py"
,
100
),
TestFile
(
"test_standalone_speculative_decoding.py"
,
250
),
TestFile
(
"test_
lookahead
_speculative_decoding.py"
,
250
),
TestFile
(
"test_
ngram
_speculative_decoding.py"
,
250
),
TestFile
(
"test_input_embeddings.py"
,
38
),
TestFile
(
"test_io_struct.py"
,
8
),
TestFile
(
"test_jinja_template_utils.py"
,
1
),
...
...
test/srt/test_
lookahead
_speculative_decoding.py
→
test/srt/test_
ngram
_speculative_decoding.py
View file @
24f7cb1e
...
...
@@ -7,7 +7,7 @@ import requests
from
sglang.srt.utils
import
kill_process_tree
from
sglang.test.few_shot_gsm8k
import
run_eval
as
run_eval_few_shot_gsm8k
from
sglang.test.test_utils
import
(
DEFAULT_
LOOKAHEAD
_SPECULATIVE_TARGET_MODEL_FOR_TEST
,
DEFAULT_
NGRAM
_SPECULATIVE_TARGET_MODEL_FOR_TEST
,
DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH
,
DEFAULT_URL_FOR_TEST
,
CustomTestCase
,
...
...
@@ -23,7 +23,7 @@ DEFAULT_SERVER_ARGS = [
"--cuda-graph-max-bs"
,
"8"
,
"--speculative-algorithm"
,
"
LOOKAHEAD
"
,
"
NGRAM
"
,
"--speculative-num-draft-tokens"
,
"16"
,
"--mem-fraction-static"
,
...
...
@@ -33,7 +33,7 @@ DEFAULT_SERVER_ARGS = [
class
TestStandaloneSpeculativeDecodingBase
(
CustomTestCase
):
model
=
DEFAULT_
LOOKAHEAD
_SPECULATIVE_TARGET_MODEL_FOR_TEST
model
=
DEFAULT_
NGRAM
_SPECULATIVE_TARGET_MODEL_FOR_TEST
base_url
=
DEFAULT_URL_FOR_TEST
accuracy_threshold
=
0.79
# derived tests need to override this
spec_decode_threshold
=
1.8
# derived spec decoding tests need to override this
...
...
Prev
1
2
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment