diff --git a/csrc/quantization/cutlass_w8a8/scaled_mm_c2x.cu b/csrc/quantization/cutlass_w8a8/scaled_mm_c2x.cu index d26c43de522c9..aac4900f933a7 100644 --- a/csrc/quantization/cutlass_w8a8/scaled_mm_c2x.cu +++ b/csrc/quantization/cutlass_w8a8/scaled_mm_c2x.cu @@ -4,7 +4,8 @@ #include "scaled_mm_c2x.cuh" #include "scaled_mm_c2x_sm80_dispatch.cuh" -#include "scaled_mm_c2x_sm89_dispatch.cuh" +#include "scaled_mm_c2x_sm89_fp8_dispatch.cuh" +#include "scaled_mm_c2x_sm89_int8_dispatch.cuh" /* This file defines quantized GEMM operations using the CUTLASS 2.x API, for @@ -98,25 +99,17 @@ template