File tree Expand file tree Collapse file tree 1 file changed +14
-3
lines changed Expand file tree Collapse file tree 1 file changed +14
-3
lines changed Original file line number Diff line number Diff line change @@ -419,9 +419,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
419
419
if (${CMAKE_CUDA_COMPILER_VERSION} VERSION_GREATER 12.8 AND FP4_ARCHS )
420
420
set (SRCS
421
421
"csrc/quantization/fp4/nvfp4_quant_kernels.cu"
422
- "csrc/quantization/fp4/nvfp4_scaled_mm_kernels.cu"
423
- "csrc/quantization/cutlass_w8a8/c3x/scaled_mm_sm100_fp8.cu"
424
- )
422
+ "csrc/quantization/fp4/nvfp4_scaled_mm_kernels.cu" )
425
423
set_gencode_flags_for_srcs (
426
424
SRCS "${SRCS} "
427
425
CUDA_ARCHS "${FP4_ARCHS} " )
@@ -434,6 +432,19 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
434
432
set (FP4_ARCHS )
435
433
endif ()
436
434
435
+ # FP8 Blackwell archs: add the SM100 FP8 scaled-mm source only when BLACKWELL_ARCHS is non-empty and the CUDA compiler version is greater than 12.8.
# NOTE(review): BLACKWELL_ARCHS is presumably the overlap of "10.0;10.1;12.0" with CUDA_ARCHS - confirm against cuda_archs_loose_intersection.
# NOTE(review): the FP4 block earlier in this file calls set_gencode_flags_for_srcs before appending; this block does not - confirm that is intended.
436
+ cuda_archs_loose_intersection (BLACKWELL_ARCHS "10.0;10.1;12.0" "${CUDA_ARCHS} " )
437
+ if (${CMAKE_CUDA_COMPILER_VERSION} VERSION_GREATER 12.8 AND BLACKWELL_ARCHS )
438
+ set (SRCS
439
+ "csrc/quantization/cutlass_w8a8/c3x/scaled_mm_sm100_fp8.cu"
440
+ )
441
+ list (APPEND VLLM_EXT_SRC "${SRCS} " )
442
+ message (STATUS "Building FP8 for archs: ${BLACKWELL_ARCHS} " )
443
+ else ()
444
+ # Unset BLACKWELL_ARCHS (set() with no value) because the FP8 kernel source was not added.
445
+ set (BLACKWELL_ARCHS )
446
+ endif ()
447
+
437
448
#
438
449
# Machete kernels
439
450
You can’t perform that action at this time.
0 commit comments