Unverified commit 180fba65, authored by Divakar Verma, committed by GitHub
Browse files

[ROCm] fix import for on_gfx9 (#32783)


Signed-off-by: Divakar Verma <divakar.verma@amd.com>
parent f9995398
......@@ -913,7 +913,14 @@ class BatchedTritonExperts(mk.FusedMoEPermuteExpertsUnpermute):
activation_key: QuantKey | None,
) -> bool:
p = current_platform
- device_supports_fp8 = (p.is_rocm() and p.rocm.on_gfx9()) or (
+ if p.is_rocm():
+ from vllm.platforms.rocm import on_gfx9
+ is_rocm_on_gfx9 = on_gfx9()
+ else:
+ is_rocm_on_gfx9 = False
+ device_supports_fp8 = is_rocm_on_gfx9 or (
p.is_cuda() and p.has_device_capability((8, 9))
)
......
......@@ -1922,7 +1922,14 @@ class TritonExperts(mk.FusedMoEPermuteExpertsUnpermute):
activation_key: QuantKey | None,
) -> bool:
p = current_platform
- device_supports_fp8 = (p.is_rocm() and p.rocm.on_gfx9()) or (
+ if p.is_rocm():
+ from vllm.platforms.rocm import on_gfx9
+ is_rocm_on_gfx9 = on_gfx9()
+ else:
+ is_rocm_on_gfx9 = False
+ device_supports_fp8 = is_rocm_on_gfx9 or (
p.is_cuda() and p.has_device_capability((8, 9))
)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment