Skip to content

Commit e888f73

Browse files
mgoin authored and shreyankg committed
Disable GPTQ AllSpark kernels for CUDA Compiler < 12.0 (vllm-project#14157)
Signed-off-by: mgoin <[email protected]>
1 parent 0dd0e59 commit e888f73

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

CMakeLists.txt

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -319,7 +319,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
319319

320320
# Only build AllSpark kernels if we are building for at least some compatible archs.
321321
cuda_archs_loose_intersection(ALLSPARK_ARCHS "8.0;8.6;8.7;8.9" "${CUDA_ARCHS}")
322-
if (ALLSPARK_ARCHS)
322+
if (${CMAKE_CUDA_COMPILER_VERSION} VERSION_GREATER 12.0 AND ALLSPARK_ARCHS)
323323
set(ALLSPARK_SRCS
324324
"csrc/quantization/gptq_allspark/allspark_repack.cu"
325325
"csrc/quantization/gptq_allspark/allspark_qgemm_w8a16.cu")
@@ -330,7 +330,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
330330
message(STATUS "Building AllSpark kernels for archs: ${ALLSPARK_ARCHS}")
331331
else()
332332
message(STATUS "Not building AllSpark kernels as no compatible archs found"
333-
" in CUDA target architectures")
333+
" in CUDA target architectures, or CUDA not >= 12.0")
334334
endif()
335335

336336
# The cutlass_scaled_mm kernels for Hopper (c3x, i.e. CUTLASS 3.x) require

0 commit comments

Comments
 (0)