Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
a087cda8
Commit
a087cda8
authored
Sep 25, 2024
by
zhuwenwen
Browse files
remove reason of unsupported
parent
2b91ac93
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
9 additions
and
9 deletions
+9
-9
vllm/model_executor/models/__init__.py
vllm/model_executor/models/__init__.py
+6
-6
vllm/platforms/rocm.py
vllm/platforms/rocm.py
+3
-3
No files found.
vllm/model_executor/models/__init__.py
View file @
a087cda8
...
@@ -123,12 +123,12 @@ _ROCM_SWA_REASON = ("Sliding window attention (SWA) is not yet supported in "
...
@@ -123,12 +123,12 @@ _ROCM_SWA_REASON = ("Sliding window attention (SWA) is not yet supported in "
"please use CK flash attention by setting "
"please use CK flash attention by setting "
"`VLLM_USE_TRITON_FLASH_ATTN=0`"
)
"`VLLM_USE_TRITON_FLASH_ATTN=0`"
)
_ROCM_PARTIALLY_SUPPORTED_MODELS
:
Dict
[
str
,
str
]
=
{
_ROCM_PARTIALLY_SUPPORTED_MODELS
:
Dict
[
str
,
str
]
=
{
"Qwen2ForCausalLM"
:
#
"Qwen2ForCausalLM":
_ROCM_SWA_REASON
,
#
_ROCM_SWA_REASON,
"MistralForCausalLM"
:
#
"MistralForCausalLM":
_ROCM_SWA_REASON
,
#
_ROCM_SWA_REASON,
"MixtralForCausalLM"
:
#
"MixtralForCausalLM":
_ROCM_SWA_REASON
,
#
_ROCM_SWA_REASON,
"PaliGemmaForConditionalGeneration"
:
"PaliGemmaForConditionalGeneration"
:
(
"ROCm flash attention does not yet "
(
"ROCm flash attention does not yet "
"fully support 32-bit precision on PaliGemma"
),
"fully support 32-bit precision on PaliGemma"
),
...
...
vllm/platforms/rocm.py
View file @
a087cda8
...
@@ -11,9 +11,9 @@ from .interface import Platform, PlatformEnum
...
@@ -11,9 +11,9 @@ from .interface import Platform, PlatformEnum
logger
=
init_logger
(
__name__
)
logger
=
init_logger
(
__name__
)
if
os
.
environ
.
get
(
"VLLM_WORKER_MULTIPROC_METHOD"
,
None
)
in
[
"fork"
,
None
]:
if
os
.
environ
.
get
(
"VLLM_WORKER_MULTIPROC_METHOD"
,
None
)
in
[
"fork"
,
None
]:
logger
.
warning
(
"`fork` method is not supported by ROCm. "
#
logger.warning("`fork` method is not supported by ROCm. "
"VLLM_WORKER_MULTIPROC_METHOD is overridden to"
#
"VLLM_WORKER_MULTIPROC_METHOD is overridden to"
" `spawn` instead."
)
#
" `spawn` instead.")
os
.
environ
[
"VLLM_WORKER_MULTIPROC_METHOD"
]
=
"spawn"
os
.
environ
[
"VLLM_WORKER_MULTIPROC_METHOD"
]
=
"spawn"
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment