Skip to content

Commit 45a1a69

Browse files
authored
[Build] Disable sm_90a in cu11 (#5141)
1 parent 87a658c commit 45a1a69

File tree

1 file changed

+8
-6
lines changed

1 file changed

+8
-6
lines changed

CMakeLists.txt

Lines changed: 8 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -177,7 +177,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
177177
include(FetchContent)
178178
# Turn on CUTLASS_ENABLE_HEADERS_ONLY before CUTLASS is fetched (presumably so
# only its headers are configured -- confirm against CUTLASS's own CMakeLists).
# The name and the value must be separate arguments: `set(NAME=VALUE)` is parsed
# as a variable literally called "NAME=VALUE" with no value, so it sets nothing.
# A non-FORCE cache entry keeps any value the user passed with -D.
set(CUTLASS_ENABLE_HEADERS_ONLY ON CACHE BOOL "Enable only the header library")
179179
FetchContent_Declare(
180-
cutlass
180+
cutlass
181181
GIT_REPOSITORY https://github.com/nvidia/cutlass.git
182182
# CUTLASS 3.5.0
183183
GIT_TAG 7d49e6c7e2f8896c47f586706e67e1fb215529dc
@@ -200,11 +200,13 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
200200
# The CUTLASS kernels for Hopper require sm90a to be enabled.
201201
# This is done via the below gencode option, BUT that creates kernels for both sm90 and sm90a.
202202
# That adds an extra 17MB to the compiled binary, so instead we enable it only for the source file that needs it.
203-
set_source_files_properties(
204-
"csrc/quantization/cutlass_w8a8/scaled_mm_dq_c3x.cu"
205-
PROPERTIES
206-
COMPILE_FLAGS
207-
"-gencode arch=compute_90a,code=sm_90a")
203+
# nvcc only accepts the sm_90a target from CUDA 12.0 onwards, so every 11.x
# toolkit must skip the flag. Comparing against a bare "11" would still let
# 11.1-11.8 through, because e.g. 11.8 is greater than 11.
if(CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL 12.0)
204+
set_source_files_properties(
205+
"csrc/quantization/cutlass_w8a8/scaled_mm_dq_c3x.cu"
206+
PROPERTIES
207+
COMPILE_FLAGS
208+
"-gencode arch=compute_90a,code=sm_90a")
209+
endif()
208210

209211
endif()
210212

0 commit comments

Comments
 (0)