We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 7efb6ac, commit 53badac (Copy full SHA for 53badac)
ggml/src/ggml-cuda/mmf.cuh
@@ -36,7 +36,7 @@ static __global__ void mul_mat_f(
36
return;
37
}
38
39
- constexpr int I_preferred = I_16_supported ? 16 : 32; // For Turing MMA both work butr 16 is ~1% faster.
+ constexpr int I_preferred = I_16_supported ? 16 : 32; // For Turing MMA both work but 16 is ~1% faster.
40
41
typedef tile<I_preferred, 8, T> tile_A;
42
typedef tile<8, 8, T> tile_B;
0 commit comments