@@ -285,15 +285,15 @@ endif()
285
285
286
286
message (STATUS "Enabling C extension." )
287
287
define_gpu_extension_target(
288
- _C
289
- DESTINATION vllm
290
- LANGUAGE ${VLLM_GPU_LANG}
291
- SOURCES ${VLLM_EXT_SRC}
292
- COMPILE_FLAGS ${VLLM_GPU_FLAGS}
293
- ARCHITECTURES ${VLLM_GPU_ARCHES}
294
- INCLUDE_DIRECTORIES ${CUTLASS_INCLUDE_DIR}
295
- USE_SABI 3
296
- WITH_SOABI)
288
+ _C
289
+ DESTINATION vllm
290
+ LANGUAGE ${VLLM_GPU_LANG}
291
+ SOURCES ${VLLM_EXT_SRC}
292
+ COMPILE_FLAGS ${VLLM_GPU_FLAGS}
293
+ ARCHITECTURES ${VLLM_GPU_ARCHES}
294
+ INCLUDE_DIRECTORIES ${CUTLASS_INCLUDE_DIR}
295
+ USE_SABI 3
296
+ WITH_SOABI)
297
297
298
298
# If CUTLASS is compiled on NVCC >= 12.5, it by default uses
299
299
# cudaGetDriverEntryPointByVersion as a wrapper to avoid directly calling the
@@ -325,11 +325,6 @@ define_gpu_extension_target(
325
325
USE_SABI 3
326
326
WITH_SOABI)
327
327
328
- # vllm-flash-attn currently only supported on CUDA
329
- if (NOT VLLM_TARGET_DEVICE STREQUAL "cuda" )
330
- return ()
331
- endif ()
332
-
333
328
if (VLLM_GPU_LANG STREQUAL "HIP" )
334
329
#
335
330
# _rocm_C extension
@@ -349,6 +344,11 @@ if(VLLM_GPU_LANG STREQUAL "HIP")
349
344
WITH_SOABI)
350
345
endif ()
351
346
347
+ # vllm-flash-attn currently only supported on CUDA
348
+ if (NOT VLLM_TARGET_DEVICE STREQUAL "cuda" )
349
+ return ()
350
+ endif ()
351
+
352
352
#
353
353
# Build vLLM flash attention from source
354
354
#
@@ -357,7 +357,7 @@ endif()
357
357
# They should be identical but if they aren't, this is a massive footgun.
358
358
#
359
359
# The vllm-flash-attn install rules are nested under vllm to make sure the library gets installed in the correct place.
360
- # To only install vllm-flash-attn, use --component vllm-flash-attn_c .
360
+ # To only install vllm-flash-attn, use --component vllm_flash_attn_c .
361
361
# If no component is specified, vllm-flash-attn is still installed.
362
362
363
363
# If VLLM_FLASH_ATTN_SRC_DIR is set, vllm-flash-attn is installed from that directory instead of downloading.
0 commit comments