File tree Expand file tree Collapse file tree 1 file changed +3
-3
lines changed Expand file tree Collapse file tree 1 file changed +3
-3
lines changed Original file line number Diff line number Diff line change @@ -308,7 +308,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
308
308
# Keep building Marlin for 9.0 as there are some group sizes and shapes that
309
309
# are not supported by Machete yet.
310
310
# 9.0 for latest bf16 atomicAdd PTX
311
- cuda_archs_loose_intersection (MARLIN_ARCHS "8.0;9.0+PTX" "${CUDA_ARCHS} " )
311
+ cuda_archs_loose_intersection (MARLIN_ARCHS "8.0;8.7;9.0+PTX" "${CUDA_ARCHS} " )
312
312
if (MARLIN_ARCHS )
313
313
314
314
#
@@ -454,7 +454,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
454
454
# kernels for the remaining archs that are not already built for 3x.
455
455
# (Build 8.9 for FP8)
456
456
cuda_archs_loose_intersection (SCALED_MM_2X_ARCHS
457
- "7.5;8.0;8.9+PTX" "${CUDA_ARCHS} " )
457
+ "7.5;8.0;8.7;8.9+PTX" "${CUDA_ARCHS} " )
458
458
# subtract out the archs that are already built for 3x
459
459
list (REMOVE_ITEM SCALED_MM_2X_ARCHS ${SCALED_MM_3X_ARCHS} )
460
460
if (SCALED_MM_2X_ARCHS )
@@ -684,7 +684,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
684
684
685
685
list (APPEND VLLM_MOE_EXT_SRC "${VLLM_MOE_WNA16_SRC} " )
686
686
# 9.0 for latest bf16 atomicAdd PTX
687
- cuda_archs_loose_intersection (MARLIN_MOE_ARCHS "8.0;9.0+PTX" "${CUDA_ARCHS} " )
687
+ cuda_archs_loose_intersection (MARLIN_MOE_ARCHS "8.0;8.7;9.0+PTX" "${CUDA_ARCHS} " )
688
688
if (MARLIN_MOE_ARCHS )
689
689
690
690
#
You can’t perform that action at this time.
0 commit comments