Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
b188a89a
"...restful/test_restful_interface_func_turbomind.py" did not exist on "e2d98ddce2d31dcc95c58604d9ddae8232344a1d"
Unverified
Commit
b188a89a
authored
Jul 16, 2025
by
YanbingJiang
Committed by
GitHub
Jul 16, 2025
Browse files
Fix CI xeon test with triton 3.3.1 (#8086)
parent
497efe74
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
11 additions
and
1 deletion
+11
-1
python/sglang/srt/layers/quantization/fp8_kernel.py
python/sglang/srt/layers/quantization/fp8_kernel.py
+11
-1
No files found.
python/sglang/srt/layers/quantization/fp8_kernel.py
View file @
b188a89a
...
...
@@ -29,6 +29,7 @@ from sglang.srt.utils import (
direct_register_custom_op
,
get_device_core_count
,
get_device_name
,
is_cpu
,
is_cuda
,
is_hip
,
log_info_on_rank0
,
...
...
@@ -37,6 +38,7 @@ from sglang.srt.utils import (
_is_hip
=
is_hip
()
_is_cuda
=
is_cuda
()
_is_cpu
=
is_cpu
()
if
_is_cuda
:
from
sgl_kernel
import
(
...
...
@@ -1168,7 +1170,7 @@ def scaled_fp8_quant(
return
output
,
scale
@
triton
.
autotune
(
fp8_autotune
=
triton
.
autotune
(
configs
=
[
triton
.
Config
({
"BLOCK_M"
:
block_m
},
num_warps
=
num_warps
)
for
block_m
in
[
16
,
32
,
64
,
128
]
...
...
@@ -1176,6 +1178,8 @@ def scaled_fp8_quant(
],
key
=
[
"K"
,
"BLOCK_K"
,
"M_ALIGNMENT"
],
)
@
triton
.
jit
def
_per_token_group_quant_fp8_hopper_moe_mn_major
(
a
,
# (M, K):(K, 1)
...
...
@@ -1221,6 +1225,12 @@ def _per_token_group_quant_fp8_hopper_moe_mn_major(
tl
.
store
(
sfa_ptrs
,
inp_amax
/
448.0
,
mask
=
coord_m
<
m
)
if
not
_is_cpu
:
_per_token_group_quant_fp8_hopper_moe_mn_major
=
fp8_autotune
(
_per_token_group_quant_fp8_hopper_moe_mn_major
)
def
per_token_group_quant_fp8_hopper_moe_mn_major
(
A
:
torch
.
Tensor
,
expert_offsets
:
torch
.
Tensor
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment