Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
2dccecf4
Unverified
Commit
2dccecf4
authored
Dec 26, 2024
by
Yineng Zhang
Committed by
GitHub
Dec 26, 2024
Browse files
fix: only enable moe_align_block_size for now (#2590)
parent
75ad0a14
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
2 additions
and
32 deletions
+2
-32
sgl-kernel/pyproject.toml
sgl-kernel/pyproject.toml
+1
-1
sgl-kernel/src/sgl-kernel/__init__.py
sgl-kernel/src/sgl-kernel/__init__.py
+1
-11
sgl-kernel/src/sgl-kernel/ops/__init__.py
sgl-kernel/src/sgl-kernel/ops/__init__.py
+0
-20
No files found.
sgl-kernel/pyproject.toml
View file @
2dccecf4
...
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
...
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
[project]
[project]
name
=
"sgl-kernel"
name
=
"sgl-kernel"
version
=
"0.0.2.post
8
"
version
=
"0.0.2.post
9
"
description
=
"Kernel Library for SGLang"
description
=
"Kernel Library for SGLang"
readme
=
"README.md"
readme
=
"README.md"
requires-python
=
">=3.8"
requires-python
=
">=3.8"
...
...
sgl-kernel/src/sgl-kernel/__init__.py
View file @
2dccecf4
from
.ops
import
(
from
.ops
import
moe_align_block_size
custom_dispose
,
custom_reduce
,
init_custom_reduce
,
moe_align_block_size
,
warp_reduce
,
)
__all__
=
[
__all__
=
[
"warp_reduce"
,
"init_custom_reduce"
,
"custom_dispose"
,
"custom_reduce"
,
"moe_align_block_size"
,
"moe_align_block_size"
,
]
]
sgl-kernel/src/sgl-kernel/ops/__init__.py
View file @
2dccecf4
from
.custom_reduce_cuda
import
all_reduce
as
_all_reduce
from
.custom_reduce_cuda
import
dispose
as
_dispose
from
.custom_reduce_cuda
import
init_custom_ar
as
_init_custom_ar
from
.moe_align_block_size
import
moe_align_block_size
as
_moe_align_block_size
from
.moe_align_block_size
import
moe_align_block_size
as
_moe_align_block_size
from
.warp_reduce_cuda
import
reduce
as
_reduce
def
warp_reduce
(
input_tensor
):
return
_reduce
(
input_tensor
)
def
init_custom_reduce
(
rank_id
,
num_devices
,
buffers
,
barrier_in
,
barrier_out
):
return
_init_custom_ar
(
rank_id
,
num_devices
,
buffers
,
barrier_in
,
barrier_out
)
def
custom_dispose
(
fa
):
_dispose
(
fa
)
def
custom_reduce
(
fa
,
inp
,
out
):
_all_reduce
(
fa
,
inp
,
out
)
def
moe_align_block_size
(
def
moe_align_block_size
(
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment