We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ad4dce8, commit 30c25ee (Copy full SHA for 30c25ee)
shaders/stensor/linalg/gemm.slang
@@ -26,8 +26,6 @@ void gemm_fast(
26
) {
27
let local_id = local_id.y;
28
29
- out[0] = 1.0;
30
-
31
for (var k = 0u; k < shape_m2.ncols; k += 4u) {
32
var sum = float4x4(0.0);
33
src/linalg/contiguous.rs
@@ -112,8 +112,8 @@ mod test {
112
&backend,
113
&mut shapes,
114
&mut pass,
115
- gpu_tensor.as_view().transposed(),
116
&gpu_output,
+ gpu_tensor.as_view().transposed(),
117
)
118
.unwrap();
119
drop(pass); // Ensure the pass is ended before the encoder is borrowed again.
0 commit comments