Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
c1acd6d7
Unverified
Commit
c1acd6d7
authored
Jul 12, 2025
by
Wentao Ye
Committed by
GitHub
Jul 12, 2025
Browse files
[Refactor] Change the way of import triton (#20774)
Signed-off-by:
yewentao256
<
zhyanwentao@126.com
>
parent
3b3b778d
Changes
5
Show whitespace changes
Inline
Side-by-side
Showing
5 changed files
with
5 additions
and
9 deletions
+5
-9
tests/kernels/moe/test_batched_moe.py
tests/kernels/moe/test_batched_moe.py
+1
-1
vllm/attention/ops/triton_unified_attention.py
vllm/attention/ops/triton_unified_attention.py
+1
-2
vllm/lora/ops/triton_ops/lora_expand_op.py
vllm/lora/ops/triton_ops/lora_expand_op.py
+1
-2
vllm/lora/ops/triton_ops/lora_shrink_op.py
vllm/lora/ops/triton_ops/lora_shrink_op.py
+1
-2
vllm/model_executor/layers/fused_moe/fused_batched_moe.py
vllm/model_executor/layers/fused_moe/fused_batched_moe.py
+1
-2
No files found.
tests/kernels/moe/test_batched_moe.py
View file @
c1acd6d7
...
...
@@ -6,7 +6,6 @@ from typing import Optional
import
pytest
import
torch
import
triton.language
as
tl
from
tests.kernels.moe.utils
import
(
batched_moe
,
make_quantized_test_activations
,
...
...
@@ -18,6 +17,7 @@ from vllm.model_executor.layers.fused_moe.fused_batched_moe import (
invoke_moe_batched_triton_kernel
)
from
vllm.model_executor.layers.fused_moe.fused_moe
import
fused_topk
from
vllm.platforms
import
current_platform
from
vllm.triton_utils
import
tl
MNK_FACTORS
=
[
(
1
,
128
,
128
),
...
...
vllm/attention/ops/triton_unified_attention.py
View file @
c1acd6d7
...
...
@@ -8,10 +8,9 @@
# - Thomas Parnell <tpa@zurich.ibm.com>
import
torch
import
triton
import
triton.language
as
tl
from
vllm.logger
import
init_logger
from
vllm.triton_utils
import
tl
,
triton
logger
=
init_logger
(
__name__
)
...
...
vllm/lora/ops/triton_ops/lora_expand_op.py
View file @
c1acd6d7
...
...
@@ -8,12 +8,11 @@ https://arxiv.org/abs/2310.18547
"""
import
torch
import
triton
import
triton.language
as
tl
from
vllm.lora.ops.triton_ops.kernel_utils
import
do_expand_kernel
from
vllm.lora.ops.triton_ops.utils
import
_get_lora_b_ptr
from
vllm.platforms
import
current_platform
from
vllm.triton_utils
import
tl
,
triton
from
vllm.utils
import
direct_register_custom_op
...
...
vllm/lora/ops/triton_ops/lora_shrink_op.py
View file @
c1acd6d7
...
...
@@ -8,12 +8,11 @@ https://arxiv.org/abs/2310.18547
"""
import
torch
import
triton
import
triton.language
as
tl
from
vllm.lora.ops.triton_ops.kernel_utils
import
do_shrink_kernel
from
vllm.lora.ops.triton_ops.utils
import
_get_lora_a_ptr
from
vllm.platforms
import
current_platform
from
vllm.triton_utils
import
tl
,
triton
from
vllm.utils
import
direct_register_custom_op
...
...
vllm/model_executor/layers/fused_moe/fused_batched_moe.py
View file @
c1acd6d7
...
...
@@ -4,8 +4,6 @@
from
typing
import
Optional
import
torch
import
triton
import
triton.language
as
tl
import
vllm.model_executor.layers.fused_moe.modular_kernel
as
mk
from
vllm.model_executor.layers.fused_moe.config
import
FusedMoEQuantConfig
...
...
@@ -18,6 +16,7 @@ from vllm.model_executor.layers.fused_moe.utils import (
normalize_scales_shape
)
from
vllm.model_executor.layers.quantization.utils.quant_utils
import
(
group_broadcast
)
from
vllm.triton_utils
import
tl
,
triton
@
triton
.
jit
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment