File tree Expand file tree Collapse file tree 1 file changed +5
-5
lines changed Original file line number Diff line number Diff line change @@ -286,10 +286,6 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
286286 list (APPEND VLLM_GPU_FLAGS "-DENABLE_SCALED_MM_C3X=1" )
287287 message (STATUS "Building scaled_mm_c3x for archs: ${SCALED_MM_3X_ARCHS} " )
288288 else ()
289- # clear SCALED_MM_3X_ARCHS so the scaled_mm_c2x kernels know we didn't
290- # build any 3x kernels
291- set (SCALED_MM_3X_ARCHS)
292-
293289 if (NOT ${CMAKE_CUDA_COMPILER_VERSION} VERSION_GREATER 12.0 AND SCALED_MM_3X_ARCHS)
294290 message (STATUS "Not building scaled_mm_c3x as CUDA Compiler version is "
295291 "not >= 12.0, we recommend upgrading to CUDA 12.0 or "
@@ -299,13 +295,17 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
299295 message (STATUS "Not building scaled_mm_c3x as no compatible archs found "
300296 "in CUDA target architectures" )
301297 endif ()
298+
299+ # clear SCALED_MM_3X_ARCHS so the scaled_mm_c2x kernels know we didn't
300+ # build any 3x kernels
301+ set (SCALED_MM_3X_ARCHS)
302302 endif ()
303303
304304 #
305305 # For the cutlass_scaled_mm kernels we want to build the c2x (CUTLASS 2.x)
306306 # kernels for the remaining archs that are not already built for 3x.
307307 cuda_archs_loose_intersection(SCALED_MM_2X_ARCHS
308- "7.5;8.0;8.6;8.9;9.0;9.0a " "${CUDA_ARCHS} " )
308+ "7.5;8.0;8.6;8.9;9.0" "${CUDA_ARCHS} " )
309309 # subtract out the archs that are already built for 3x
310310 list (REMOVE_ITEM SCALED_MM_2X_ARCHS ${SCALED_MM_3X_ARCHS} )
311311 if (SCALED_MM_2X_ARCHS)
You can’t perform that action at this time.
0 commit comments