Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
0023cd2b
Unverified
Commit
0023cd2b
authored
Feb 20, 2025
by
Gregory Shtrasberg
Committed by
GitHub
Feb 19, 2025
Browse files
[ROCm] MI300A compile targets deprecation (#13560)
parent
041e2947
Changes
4
Show whitespace changes
Inline
Side-by-side
Showing
4 changed files
with
4 additions
and
7 deletions
+4
-7
CMakeLists.txt
CMakeLists.txt
+1
-1
csrc/quantization/fp8/amd/hip_float8_impl.h
csrc/quantization/fp8/amd/hip_float8_impl.h
+1
-2
csrc/rocm/attention.cu
csrc/rocm/attention.cu
+1
-2
vllm/attention/backends/rocm_flash_attn.py
vllm/attention/backends/rocm_flash_attn.py
+1
-2
No files found.
CMakeLists.txt
View file @
0023cd2b
...
...
@@ -34,7 +34,7 @@ set(PYTHON_SUPPORTED_VERSIONS "3.9" "3.10" "3.11" "3.12")
set
(
CUDA_SUPPORTED_ARCHS
"7.0;7.2;7.5;8.0;8.6;8.7;8.9;9.0"
)
# Supported AMD GPU architectures.
set
(
HIP_SUPPORTED_ARCHS
"gfx906;gfx908;gfx90a;
gfx940;gfx941;
gfx942;gfx1030;gfx1100;gfx1101"
)
set
(
HIP_SUPPORTED_ARCHS
"gfx906;gfx908;gfx90a;gfx942;gfx1030;gfx1100;gfx1101"
)
#
# Supported/expected torch versions for CUDA/ROCm.
...
...
csrc/quantization/fp8/amd/hip_float8_impl.h
View file @
0023cd2b
#pragma once
#if defined(__HIPCC__) && \
(defined(__gfx940__) || defined(__gfx941__) || defined(__gfx942__))
#if defined(__HIPCC__) && defined(__gfx942__)
#define __HIP__MI300__
#endif
...
...
csrc/rocm/attention.cu
View file @
0023cd2b
...
...
@@ -24,8 +24,7 @@
#include "../attention/dtype_fp8.cuh"
#include "../quantization/fp8/amd/quant_utils.cuh"
#if defined(__HIPCC__) && (defined(__gfx90a__) || defined(__gfx940__) || \
defined(__gfx941__) || defined(__gfx942__))
#if defined(__HIPCC__) && (defined(__gfx90a__) || defined(__gfx942__))
#define __HIP__MI300_MI250__
#endif
...
...
vllm/attention/backends/rocm_flash_attn.py
View file @
0023cd2b
...
...
@@ -25,8 +25,7 @@ logger = init_logger(__name__)
_PARTITION_SIZE_ROCM
=
512
_GPU_ARCH
=
torch
.
cuda
.
get_device_properties
(
"cuda"
).
gcnArchName
_ON_NAVI
=
"gfx1"
in
_GPU_ARCH
_ON_MI250_MI300
=
any
(
arch
in
_GPU_ARCH
for
arch
in
[
"gfx90a"
,
"gfx940"
,
"gfx941"
,
"gfx942"
])
_ON_MI250_MI300
=
any
(
arch
in
_GPU_ARCH
for
arch
in
[
"gfx90a"
,
"gfx942"
])
class
ROCmFlashAttentionBackend
(
AttentionBackend
):
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment