Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
efb0de2c
Unverified
Commit
efb0de2c
authored
Sep 06, 2025
by
jacky.cheng
Committed by
GitHub
Sep 05, 2025
Browse files
Update wave-lang to 3.7.0 and unify Wave kernel buffer options (#10069)
parent
0f6ac5e2
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
4 additions
and
8 deletions
+4
-8
python/pyproject.toml
python/pyproject.toml
+1
-1
python/sglang/srt/layers/attention/wave_ops/decode_attention.py
.../sglang/srt/layers/attention/wave_ops/decode_attention.py
+2
-4
python/sglang/srt/layers/attention/wave_ops/extend_attention.py
.../sglang/srt/layers/attention/wave_ops/extend_attention.py
+1
-3
No files found.
python/pyproject.toml
View file @
efb0de2c
...
@@ -82,7 +82,7 @@ srt_hip = [
...
@@ -82,7 +82,7 @@ srt_hip = [
"sglang[runtime_common]"
,
"sglang[runtime_common]"
,
"torch"
,
"torch"
,
"petit_kernel==0.0.2"
,
"petit_kernel==0.0.2"
,
"wave-lang==
1.0.1
"
,
"wave-lang==
3.7.0
"
,
]
]
# https://docs.sglang.ai/platforms/cpu_server.html
# https://docs.sglang.ai/platforms/cpu_server.html
...
...
python/sglang/srt/layers/attention/wave_ops/decode_attention.py
View file @
efb0de2c
...
@@ -64,8 +64,7 @@ def get_wave_kernel(
...
@@ -64,8 +64,7 @@ def get_wave_kernel(
subs
=
hyperparams_0
,
subs
=
hyperparams_0
,
canonicalize
=
True
,
canonicalize
=
True
,
run_bench
=
False
,
run_bench
=
False
,
use_buffer_load_ops
=
True
,
use_buffer_ops
=
True
,
use_buffer_store_ops
=
True
,
waves_per_eu
=
2
,
waves_per_eu
=
2
,
dynamic_symbols
=
dynamic_symbols_0
,
dynamic_symbols
=
dynamic_symbols_0
,
wave_runtime
=
True
,
wave_runtime
=
True
,
...
@@ -77,8 +76,7 @@ def get_wave_kernel(
...
@@ -77,8 +76,7 @@ def get_wave_kernel(
subs
=
hyperparams_1
,
subs
=
hyperparams_1
,
canonicalize
=
True
,
canonicalize
=
True
,
run_bench
=
False
,
run_bench
=
False
,
use_buffer_load_ops
=
False
,
use_buffer_ops
=
False
,
use_buffer_store_ops
=
False
,
waves_per_eu
=
4
,
waves_per_eu
=
4
,
dynamic_symbols
=
dynamic_symbols_1
,
dynamic_symbols
=
dynamic_symbols_1
,
wave_runtime
=
True
,
wave_runtime
=
True
,
...
...
python/sglang/srt/layers/attention/wave_ops/extend_attention.py
View file @
efb0de2c
...
@@ -67,11 +67,9 @@ def get_wave_kernel(
...
@@ -67,11 +67,9 @@ def get_wave_kernel(
schedule
=
SchedulingType
.
NONE
,
schedule
=
SchedulingType
.
NONE
,
use_scheduling_barriers
=
False
,
use_scheduling_barriers
=
False
,
dynamic_symbols
=
dynamic_symbols
,
dynamic_symbols
=
dynamic_symbols
,
use_buffer_load_ops
=
True
,
use_buffer_ops
=
True
,
use_buffer_store_ops
=
True
,
waves_per_eu
=
2
,
waves_per_eu
=
2
,
denorm_fp_math_f32
=
"preserve-sign"
,
denorm_fp_math_f32
=
"preserve-sign"
,
gpu_native_math_precision
=
True
,
wave_runtime
=
True
,
wave_runtime
=
True
,
)
)
options
=
set_default_run_config
(
options
)
options
=
set_default_run_config
(
options
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment