diff --git a/torchao/csrc/cuda/activation24/sparse_gemm.cu b/torchao/csrc/cuda/activation24/sparse_gemm.cu index f837bcc3aa..48b4c6e687 100644 --- a/torchao/csrc/cuda/activation24/sparse_gemm.cu +++ b/torchao/csrc/cuda/activation24/sparse_gemm.cu @@ -95,10 +95,10 @@ struct SparseRowwiseKernel { float, ElementOut, cutlass::layout::RowMajor, - 1, + 8, ElementOut, cutlass::layout::RowMajor, - 1, + 8, cutlass::epilogue::TmaWarpSpecializedCooperative, EpilogueEVT>::CollectiveOp; @@ -172,10 +172,10 @@ struct SparseRowwiseKernel { float, ElementOut, cutlass::layout::RowMajor, - 1, + 8, ElementOut, cutlass::layout::RowMajor, - 1, + 8, cutlass::epilogue::TmaWarpSpecializedCooperative, EpilogueEVT>::CollectiveOp;