Unverified commit 83f74c69, authored by Luka Govedič, committed by GitHub
Browse files

[Fix][ROCm] Enforce eager for all encoder-decoder models on ROCm (#18154)


Signed-off-by: Luka Govedič <lgovedic@redhat.com>
parent 2dff0935
@@ -906,12 +906,17 @@ class ModelConfig:
     def _verify_cuda_graph(self) -> None:
         self.max_seq_len_to_capture = min(self.max_seq_len_to_capture,
                                           self.max_model_len)
+        # CUDAGraph capture not supported for enc-dec models and mllama on ROCm
         ROCM_UNSUPPORTED_MODELS = ['mllama']
-        if (self.hf_config.model_type in ROCM_UNSUPPORTED_MODELS
-                and not self.enforce_eager and current_platform.is_rocm()):
+        unsupported_rocm = (self.hf_config.model_type
+                            in ROCM_UNSUPPORTED_MODELS
+                            or self.is_encoder_decoder)
+
+        if (unsupported_rocm and not self.enforce_eager
+                and current_platform.is_rocm()):
             logger.warning(
                 "CUDA graph is not supported for %s on ROCm yet, fallback "
-                "to the eager mode.", self.hf_config.model_type)
+                "to eager mode.", self.hf_config.model_type)
             self.enforce_eager = True
 
     def _verify_bnb_config(self) -> None:
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment