Skip to content

Commit fadb1a8

Browse files
committed
fix: add SM90 guard for FP8 Blockscale GEMM
Signed-off-by: Zihua Wu <[email protected]>
1 parent c27e130 commit fadb1a8

File tree

1 file changed

+8
-0
lines changed

1 file changed

+8
-0
lines changed

cpp/tensorrt_llm/kernels/cutlass_kernels/fp8_blockscale_gemm/fp8_blockscale_gemm.cu

+8
Original file line number | Diff line number | Diff line change
@@ -25,6 +25,14 @@ template <typename ElementA, typename ElementB, typename ElementD>
2525
// Default constructor of the FP8 block-scale GEMM runner.
//
// Emits a debug log entry carrying this function's decorated signature, then
// checks the SM version reported by tensorrt_llm::common::getSMVersion().
// Any value other than 90 aborts construction via TLLM_THROW, so a runner
// object cannot be created on an unsupported device.
//
// NOTE(review): presumably getSMVersion() reports the currently active CUDA
// device as major * 10 + minor -- confirm against its definition.
CutlassFp8BlockScaleGemmRunner<ElementA, ElementB, ElementD>::CutlassFp8BlockScaleGemmRunner()
2626
{
2727
TLLM_LOG_DEBUG(__PRETTY_FUNCTION__);
// Read the SM version once; it is used for both the check and the error text.
28+
int sm = tensorrt_llm::common::getSMVersion();
// Exact match on 90: every other SM version, lower or higher, is rejected.
29+
if (sm != 90)
30+
{
// The message is a printf-style format; `sm` fills the single %d placeholder.
31+
TLLM_THROW(
32+
"FP8 Blockscale GEMM kernels are only supported on SM90 architectures, but current device compute "
33+
"capability is %d.",
34+
sm);
35+
}
2836
}
2937

3038
template <typename ElementA, typename ElementB, typename ElementD>

0 commit comments

Comments
 (0)