We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4aefa90, commit fd05b19 (Copy full SHA for fd05b19)
src/device/intrinsics/wmma.jl
@@ -43,7 +43,7 @@ const map_frag_sizes = Dict(
43
"a.f16.m8n32k16" => 8,
44
"a.f16.m32n8k16" => 8,
45
46
- "a.tf32.m16n16k8" => 8,
+ "a.tf32.m16n16k8" => 4,
47
# B
48
"b.u8.m16n16k16" => 2,
49
"b.u8.m8n32k16" => 4,
@@ -57,7 +57,7 @@ const map_frag_sizes = Dict(
57
"b.f16.m8n32k16" => 8,
58
"b.f16.m32n8k16" => 8,
59
60
- "b.tf32.m16n16k8" => 8,
+ "b.tf32.m16n16k8" => 4,
61
# C
62
"c.s32.m16n16k16" => 8,
63
"c.s32.m8n32k16" => 8,
0 commit comments