Skip to content

Commit bd7e2e0

Browse files
committed
fix wmma tf32 fragment sizes for a and b
1 parent afea816 commit bd7e2e0

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

src/device/intrinsics/wmma.jl

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -43,7 +43,7 @@ const map_frag_sizes = Dict(
 "a.f16.m8n32k16" => 8,
 "a.f16.m32n8k16" => 8,
 
-"a.tf32.m16n16k8" => 8,
+"a.tf32.m16n16k8" => 4,
 # B
 "b.u8.m16n16k16" => 2,
 "b.u8.m8n32k16" => 4,
@@ -57,7 +57,7 @@ const map_frag_sizes = Dict(
 "b.f16.m8n32k16" => 8,
 "b.f16.m32n8k16" => 8,
 
-"b.tf32.m16n16k8" => 8,
+"b.tf32.m16n16k8" => 4,
 # C
 "c.s32.m16n16k16" => 8,
 "c.s32.m8n32k16" => 8,

0 commit comments

Comments
 (0)