"...git@developer.sourcefind.cn:2222/OpenDAS/vllm_cscc.git" did not exist on "28ef9ba399340ea7013df8cd1c359b07acc0a302"
Unverified Commit e123aafd authored by Michael Goin, committed by GitHub
Browse files

Disable GPTQ AllSpark kernels for CUDA Compiler < 12.0 (#14157)


Signed-off-by: mgoin <mgoin64@gmail.com>
parent 5b143d33
...@@ -319,7 +319,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA") ...@@ -319,7 +319,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
# Only build AllSpark kernels if we are building for at least some compatible archs. # Only build AllSpark kernels if we are building for at least some compatible archs.
cuda_archs_loose_intersection(ALLSPARK_ARCHS "8.0;8.6;8.7;8.9" "${CUDA_ARCHS}") cuda_archs_loose_intersection(ALLSPARK_ARCHS "8.0;8.6;8.7;8.9" "${CUDA_ARCHS}")
if (ALLSPARK_ARCHS) if (${CMAKE_CUDA_COMPILER_VERSION} VERSION_GREATER 12.0 AND ALLSPARK_ARCHS)
set(ALLSPARK_SRCS set(ALLSPARK_SRCS
"csrc/quantization/gptq_allspark/allspark_repack.cu" "csrc/quantization/gptq_allspark/allspark_repack.cu"
"csrc/quantization/gptq_allspark/allspark_qgemm_w8a16.cu") "csrc/quantization/gptq_allspark/allspark_qgemm_w8a16.cu")
...@@ -330,7 +330,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA") ...@@ -330,7 +330,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
message(STATUS "Building AllSpark kernels for archs: ${ALLSPARK_ARCHS}") message(STATUS "Building AllSpark kernels for archs: ${ALLSPARK_ARCHS}")
else() else()
message(STATUS "Not building AllSpark kernels as no compatible archs found" message(STATUS "Not building AllSpark kernels as no compatible archs found"
" in CUDA target architectures") " in CUDA target architectures, or CUDA not >= 12.0")
endif() endif()
# The cutlass_scaled_mm kernels for Hopper (c3x, i.e. CUTLASS 3.x) require # The cutlass_scaled_mm kernels for Hopper (c3x, i.e. CUTLASS 3.x) require
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment