Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
6216b12d
"vscode:/vscode.git/clone" did not exist on "81ecf425f0a645e6d6f1c339ba79ef37e95a9569"
Commit
6216b12d
authored
Jan 19, 2026
by
zhuwenwen
Browse files
remove SUPPORT_MOE_MARLIN_W16A16
parent
1a26d0b6
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
0 additions
and
10 deletions
+0
-10
vllm/platforms/rocm.py
vllm/platforms/rocm.py
+0
-6
vllm/utils/__init__.py
vllm/utils/__init__.py
+0
-4
No files found.
vllm/platforms/rocm.py
View file @
6216b12d
...
@@ -16,12 +16,6 @@ from vllm.utils import cuda_device_count_stateless
...
@@ -16,12 +16,6 @@ from vllm.utils import cuda_device_count_stateless
from
.interface
import
DeviceCapability
,
Platform
,
PlatformEnum
,
_Backend
from
.interface
import
DeviceCapability
,
Platform
,
PlatformEnum
,
_Backend
from
vllm.utils
import
SUPPORT_MOE_MARLIN_W16A16
if
SUPPORT_MOE_MARLIN_W16A16
:
os
.
environ
[
'VLLM_USE_MARLIN_W16A16_MOE'
]
=
'1'
os
.
environ
[
'MOE_NN'
]
=
'0'
if
TYPE_CHECKING
:
if
TYPE_CHECKING
:
from
vllm.config
import
ModelConfig
,
VllmConfig
from
vllm.config
import
ModelConfig
,
VllmConfig
...
...
vllm/utils/__init__.py
View file @
6216b12d
...
@@ -86,10 +86,6 @@ if TYPE_CHECKING:
...
@@ -86,10 +86,6 @@ if TYPE_CHECKING:
logger
=
init_logger
(
__name__
)
logger
=
init_logger
(
__name__
)
GPU_ARCH
=
torch
.
cuda
.
get_device_properties
(
"cuda"
).
gcnArchName
SUPPORT_MOE_MARLIN_W16A16
=
any
(
arch
in
GPU_ARCH
for
arch
in
[
"gfx936"
])
# This value is chosen to have a balance between ITL and TTFT. Note it is
# This value is chosen to have a balance between ITL and TTFT. Note it is
# not optimized for throughput.
# not optimized for throughput.
DEFAULT_MAX_NUM_BATCHED_TOKENS
=
2048
DEFAULT_MAX_NUM_BATCHED_TOKENS
=
2048
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment