We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 9fa6fa7 commit 2025b75Copy full SHA for 2025b75
torchao/csrc/cuda/activation24/sparse_gemm.cu
@@ -95,10 +95,10 @@ struct SparseRowwiseKernel<cutlass::float_e4m3_t> {
95
float,
96
ElementOut,
97
cutlass::layout::RowMajor,
98
- 1,
+ 8,
99
100
101
102
cutlass::epilogue::TmaWarpSpecializedCooperative,
103
EpilogueEVT>::CollectiveOp;
104
@@ -172,10 +172,10 @@ struct SparseRowwiseKernel<cutlass::bfloat16_t> {
172
173
174
175
176
177
178
179
180
181
0 commit comments