File tree 1 file changed +8
-6
lines changed
1 file changed +8
-6
lines changed Original file line number Diff line number Diff line change @@ -177,7 +177,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
177
177
include (FetchContent)
178
178
set(CUTLASS_ENABLE_HEADERS_ONLY ON CACHE BOOL "Enable only the header library")  # name and value must be separate arguments; "NAME=VALUE" only unsets a variable literally called "CUTLASS_ENABLE_HEADERS_ONLY=ON"
179
179
FetchContent_Declare(
180
- cutlass
180
+ cutlass
181
181
GIT_REPOSITORY https://github.com/nvidia/cutlass.git
182
182
# CUTLASS 3.5.0
183
183
GIT_TAG 7d49e6c7e2f8896c47f586706e67e1fb215529dc
@@ -200,11 +200,13 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
200
200
# The CUTLASS kernels for Hopper require sm90a to be enabled.
201
201
# This is done via the below gencode option, BUT that creates kernels for both sm90 and sm90a.
202
202
# That adds an extra 17MB to compiled binary, so instead we selectively enable it.
203
- set_source_files_properties (
204
- "csrc/quantization/cutlass_w8a8/scaled_mm_dq_c3x.cu"
205
- PROPERTIES
206
- COMPILE_FLAGS
207
- "-gencode arch=compute_90a,code=sm_90a" )
203
+ if (CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL 12.0)  # sm_90a is only accepted by nvcc 12.0+; "VERSION_GREATER 11" also matched 11.x releases such as 11.8
204
+ set_source_files_properties (
205
+ "csrc/quantization/cutlass_w8a8/scaled_mm_dq_c3x.cu"
206
+ PROPERTIES
207
+ COMPILE_FLAGS
208
+ "-gencode arch=compute_90a,code=sm_90a" )
209
+ endif ()
208
210
209
211
endif ()
210
212
You can’t perform that action at this time.
0 commit comments