Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
267cc5ff
Commit
267cc5ff
authored
Jul 21, 2025
by
zhuwenwen
Browse files
update List
parent
b1babea8
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
4 additions
and
4 deletions
+4
-4
vllm/model_executor/layers/fused_moe/fused_moe.py
vllm/model_executor/layers/fused_moe/fused_moe.py
+4
-4
No files found.
vllm/model_executor/layers/fused_moe/fused_moe.py
View file @
267cc5ff
...
...
@@ -1047,7 +1047,7 @@ def try_get_optimal_moe_config(
dtype
:
Optional
[
str
],
M
:
int
,
is_marlin
:
bool
=
False
,
block_shape
:
Optional
[
l
ist
[
int
]]
=
None
,
block_shape
:
Optional
[
L
ist
[
int
]]
=
None
,
use_nn_moe
:
Optional
[
bool
]
=
False
,
)
->
dict
[
str
,
int
]:
from
vllm.model_executor.layers.fused_moe
import
get_config
...
...
@@ -1392,7 +1392,7 @@ def fused_experts(
w2_zp
:
Optional
[
torch
.
Tensor
]
=
None
,
a1_scale
:
Optional
[
torch
.
Tensor
]
=
None
,
a2_scale
:
Optional
[
torch
.
Tensor
]
=
None
,
block_shape
:
Optional
[
l
ist
[
int
]]
=
None
,
block_shape
:
Optional
[
L
ist
[
int
]]
=
None
,
allow_deep_gemm
:
bool
=
False
,
allow_cutlass_block_scaled_grouped_gemm
:
bool
=
False
,
use_nn_moe
:
Optional
[
bool
]
=
False
)
->
torch
.
Tensor
:
...
...
@@ -1796,7 +1796,7 @@ class TritonExperts(mk.FusedMoEPermuteExpertsUnpermute):
use_int8_w8a16
:
bool
=
False
,
use_int4_w4a16
:
bool
=
False
,
per_act_token_quant
:
bool
=
False
,
block_shape
:
Optional
[
l
ist
[
int
]]
=
None
,
block_shape
:
Optional
[
L
ist
[
int
]]
=
None
,
):
super
().
__init__
(
FusedMoEQuantConfig
.
make
(
...
...
@@ -1981,7 +1981,7 @@ def modular_triton_fused_moe(
use_int8_w8a16
:
bool
,
use_int4_w4a16
:
bool
,
per_act_token_quant
:
bool
,
block_shape
:
Optional
[
l
ist
[
int
]]
=
None
,
block_shape
:
Optional
[
L
ist
[
int
]]
=
None
,
)
->
mk
.
FusedMoEModularKernel
:
return
mk
.
FusedMoEModularKernel
(
MoEPrepareAndFinalizeNoEP
(),
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment