Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
6c9837a7
Unverified
Commit
6c9837a7
authored
Jun 29, 2025
by
Huy Do
Committed by
GitHub
Jun 29, 2025
Browse files
Fix cuda_archs_loose_intersection when handling sm_*a (#20207)
Signed-off-by:
Huy Do
<
huydhn@gmail.com
>
parent
6f2f53a8
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
26 additions
and
21 deletions
+26
-21
CMakeLists.txt
CMakeLists.txt
+12
-2
cmake/utils.cmake
cmake/utils.cmake
+14
-19
No files found.
CMakeLists.txt
View file @
6c9837a7
...
...
@@ -562,7 +562,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
"if you intend on running FP8 quantized MoE models on Hopper."
)
else
()
message
(
STATUS
"Not building grouped_mm_c3x as no compatible archs found "
"in CUDA target architectures"
)
"in CUDA target architectures
.
"
)
endif
()
endif
()
...
...
@@ -574,6 +574,16 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
SRCS
"
${
SRCS
}
"
CUDA_ARCHS
"
${
CUTLASS_MOE_DATA_ARCHS
}
"
)
list
(
APPEND VLLM_EXT_SRC
"
${
SRCS
}
"
)
message
(
STATUS
"Building moe_data for archs:
${
CUTLASS_MOE_DATA_ARCHS
}
"
)
else
()
if
(
NOT
${
CMAKE_CUDA_COMPILER_VERSION
}
VERSION_GREATER_EQUAL 12.3 AND CUTLASS_MOE_DATA_ARCHS
)
message
(
STATUS
"Not building moe_data as CUDA Compiler version is "
"not >= 12.3, we recommend upgrading to CUDA 12.3 or later "
"if you intend on running FP8 quantized MoE models on Hopper or Blackwell."
)
else
()
message
(
STATUS
"Not building moe_data as no compatible archs found "
"in CUDA target architectures."
)
endif
()
endif
()
#
...
...
cmake/utils.cmake
View file @
6c9837a7
...
...
@@ -313,21 +313,16 @@ function(cuda_archs_loose_intersection OUT_CUDA_ARCHS SRC_CUDA_ARCHS TGT_CUDA_AR
# if x.0a is in SRC_CUDA_ARCHS and x.0 is in CUDA_ARCHS then we should
# remove x.0a from SRC_CUDA_ARCHS and add x.0a to _CUDA_ARCHS
set
(
_CUDA_ARCHS
)
if
(
"9.0a"
IN_LIST _SRC_CUDA_ARCHS
)
list
(
REMOVE_ITEM _SRC_CUDA_ARCHS
"9.0a"
)
if
(
"9.0"
IN_LIST TGT_CUDA_ARCHS
)
list
(
REMOVE_ITEM _TGT_CUDA_ARCHS
"9.0"
)
set
(
_CUDA_ARCHS
"9.0a"
)
endif
()
endif
()
if
(
"10.0a"
IN_LIST _SRC_CUDA_ARCHS
)
list
(
REMOVE_ITEM _SRC_CUDA_ARCHS
"10.0a"
)
if
(
"10.0"
IN_LIST TGT_CUDA_ARCHS
)
list
(
REMOVE_ITEM _TGT_CUDA_ARCHS
"10.0"
)
set
(
_CUDA_ARCHS
"10.0a"
)
foreach
(
_arch
${
_SRC_CUDA_ARCHS
}
)
if
(
_arch MATCHES
"
\\
a$"
)
list
(
REMOVE_ITEM _SRC_CUDA_ARCHS
"
${
_arch
}
"
)
string
(
REPLACE
"a"
""
_base
"
${
_arch
}
"
)
if
(
"
${
_base
}
"
IN_LIST TGT_CUDA_ARCHS
)
list
(
REMOVE_ITEM _TGT_CUDA_ARCHS
"
${
_base
}
"
)
list
(
APPEND _CUDA_ARCHS
"
${
_arch
}
"
)
endif
()
endif
()
endforeach
()
list
(
SORT _SRC_CUDA_ARCHS COMPARE NATURAL ORDER ASCENDING
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment