Comment out the ROCm SWA "partially supported" reasons (Qwen2, Mistral, Mixtral) and the `fork` warning

a087cda8 · zhuwenwen · 2b91ac93 · a087cda8 · a087cda8
Commit a087cda8 authored Sep 25, 2024 by zhuwenwen
Hide whitespace changes
Inline Side-by-side

Showing with 9 additions and 9 deletions

vllm/model_executor/models/__init__.py vllm/model_executor/models/__init__.py +6 -6

vllm/platforms/rocm.py vllm/platforms/rocm.py +3 -3

No files found.
--- a/vllm/model_executor/models/__init__.py
+++ b/vllm/model_executor/models/__init__.py
@@ -123,12 +123,12 @@ _ROCM_SWA_REASON = ("Sliding window attention (SWA) is not yet supported in "
                    "please use CK flash attention by setting "
                    "`VLLM_USE_TRITON_FLASH_ATTN=0`")
 _ROCM_PARTIALLY_SUPPORTED_MODELS: Dict[str, str] = {
-    "Qwen2ForCausalLM":
+    # "Qwen2ForCausalLM":
-    _ROCM_SWA_REASON,
+    # _ROCM_SWA_REASON,
-    "MistralForCausalLM":
+    # "MistralForCausalLM":
-    _ROCM_SWA_REASON,
+    # _ROCM_SWA_REASON,
-    "MixtralForCausalLM":
+    # "MixtralForCausalLM":
-    _ROCM_SWA_REASON,
+    # _ROCM_SWA_REASON,
    "PaliGemmaForConditionalGeneration":
    ("ROCm flash attention does not yet "
     "fully support 32-bit precision on PaliGemma"),

--- a/vllm/platforms/rocm.py
+++ b/vllm/platforms/rocm.py
@@ -11,9 +11,9 @@ from .interface import Platform, PlatformEnum
 logger = init_logger(__name__)
 if os.environ.get("VLLM_WORKER_MULTIPROC_METHOD", None) in ["fork", None]:
-    logger.warning("`fork` method is not supported by ROCm. "
+    # logger.warning("`fork` method is not supported by ROCm. "
-                   "VLLM_WORKER_MULTIPROC_METHOD is overridden to"
+    #                "VLLM_WORKER_MULTIPROC_METHOD is overridden to"
-                   " `spawn` instead.")
+    #                " `spawn` instead.")
    os.environ["VLLM_WORKER_MULTIPROC_METHOD"] = "spawn"