Skip to content

Commit 979b25d

Browse files
committed
added improved matmul function
added fixed bench, added more tests for matmul
1 parent cb7a00d commit 979b25d

File tree

4 files changed

+594
-215
lines changed

4 files changed

+594
-215
lines changed

README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -174,9 +174,9 @@ We welcome contributions to Katana! Please see our [Contributing Guidelines](CON
174 174

175 175
## TODO
176 176
- Full SIMD Ops Set (soon!)
177+
- Autograd capability/Graph Compiler
177 178
- Extended usage guide
178 179
- More ML Ops and tests
179-
- Autograd capability/Graph Compiler
180 180
- CUDA/GPU support
181 181

182 182
## List of ops to be added soon:

src/bench.zig

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,6 @@ const Tensor = tensormod.Tensor;
4 4
const ops = @import("ops.zig");
5 5
const matmul = ops.matmul;
6 6
const T = ops.Tile;
7-
const V = ops.Vec;
8 7

9 8
pub fn calculateGflops(allocator: std.mem.Allocator, M: usize, N: usize, K: usize, iterations: usize) !f64 {
10 9
const shape_a = [_]usize{ M, K };
@@ -70,7 +69,7 @@ pub fn main() !void {
70 69
const iterations = 5;
71 70

72 71
try std.io.getStdOut().writer().print("\nRunning MatMul Benchmark\n", .{});
73-
try std.io.getStdOut().writer().print("T = {d} \nV = {d} \n", .{ T, V });
72+
try std.io.getStdOut().writer().print("T = {d} \n", .{T});
74 73
try std.io.getStdOut().writer().print("Number of threads = {d}\n", .{try std.Thread.getCpuCount()});
75 74

76 75
for (sizes) |size| {

0 commit comments

Comments
 (0)