From 3bce859017bc040c5469fdf45e4a1ccfb65d77ed Mon Sep 17 00:00:00 2001
From: Huy Do
Date: Sat, 14 Jun 2025 02:58:07 -0700
Subject: [PATCH] Only build CUTLASS MoE kernels on Hopper

Signed-off-by: Huy Do
---
 CMakeLists.txt | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index bd389823fbb2..d75f0d321247 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -542,10 +542,10 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
 
   # CUTLASS MoE kernels
 
-  # The MoE kernel cutlass_moe_mm requires CUDA 12.3 or later (and only works
+  # The MoE kernel cutlass_moe_mm requires CUDA 12.3 or later (and ONLY works
   # on Hopper). get_cutlass_(pplx_)moe_mm_data should only be compiled
   # if it's possible to compile MoE kernels that use its output.
-  cuda_archs_loose_intersection(SCALED_MM_ARCHS "9.0a;10.0a" "${CUDA_ARCHS}")
+  cuda_archs_loose_intersection(SCALED_MM_ARCHS "9.0a" "${CUDA_ARCHS}")
   if(${CMAKE_CUDA_COMPILER_VERSION} VERSION_GREATER_EQUAL 12.3 AND SCALED_MM_ARCHS)
     set(SRCS "csrc/quantization/cutlass_w8a8/moe/grouped_mm_c3x.cu"
              "csrc/quantization/cutlass_w8a8/moe/moe_data.cu")