Skip to content

Commit cbd34e8

Browse files
huydhn and yangw-dev
authored and committed
Only build CUTLASS MoE kernels on Hopper (vllm-project#19648)
Signed-off-by: Yang Wang <[email protected]>
1 parent 303a886 commit cbd34e8

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

CMakeLists.txt

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -542,10 +542,10 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
542542

543543
# CUTLASS MoE kernels
544544

545-
# The MoE kernel cutlass_moe_mm requires CUDA 12.3 or later (and only works
545+
# The MoE kernel cutlass_moe_mm requires CUDA 12.3 or later (and ONLY works
546546
# on Hopper). get_cutlass_(pplx_)moe_mm_data should only be compiled
547547
# if it's possible to compile MoE kernels that use its output.
548-
cuda_archs_loose_intersection(SCALED_MM_ARCHS "9.0a;10.0a" "${CUDA_ARCHS}")
548+
cuda_archs_loose_intersection(SCALED_MM_ARCHS "9.0a" "${CUDA_ARCHS}")
549549
if(${CMAKE_CUDA_COMPILER_VERSION} VERSION_GREATER_EQUAL 12.3 AND SCALED_MM_ARCHS)
550550
set(SRCS "csrc/quantization/cutlass_w8a8/moe/grouped_mm_c3x.cu"
551551
"csrc/quantization/cutlass_w8a8/moe/moe_data.cu")

0 commit comments

Comments
 (0)