Skip to content

Commit 5bfe5cb

Browse files
committed
Add new gemm tuned cfg
1 parent 6db3b52 commit 5bfe5cb

File tree

1 file changed

+8
-0
lines changed

1 file changed

+8
-0
lines changed

benchmarks/triton_kernels_benchmark/gemm_benchmark.py

Lines changed: 8 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -98,10 +98,18 @@ def matmul_kernel_with_block_pointers(
9898
triton.Config(
9999
{'BLOCK_SIZE_M': 256, 'BLOCK_SIZE_N': 128, 'BLOCK_SIZE_K': 32, 'GROUP_SIZE_M': 4, 'grf_mode': 'large'},
100100
num_stages=s, num_warps=32) for s in [2]
101+
] + [
102+
triton.Config(
103+
{'BLOCK_SIZE_M': 128, 'BLOCK_SIZE_N': 1024, 'BLOCK_SIZE_K': 16, 'GROUP_SIZE_M': 1, 'grf_mode': 'large'},
104+
num_stages=s, num_warps=32) for s in [2]
101105
] + [
102106
triton.Config(
103107
{'BLOCK_SIZE_M': 64, 'BLOCK_SIZE_N': 128, 'BLOCK_SIZE_K': 32, 'GROUP_SIZE_M': 4, 'grf_mode': 'large'},
104108
num_stages=s, num_warps=32) for s in [2]
109+
] + [
110+
triton.Config(
111+
{'BLOCK_SIZE_M': 16, 'BLOCK_SIZE_N': 1024, 'BLOCK_SIZE_K': 64, 'GROUP_SIZE_M': 32, 'grf_mode': 'large'},
112+
num_stages=s, num_warps=32) for s in [2, 3]
105113
] + [
106114
triton.Config(
107115
{'BLOCK_SIZE_M': 8, 'BLOCK_SIZE_N': 512, 'BLOCK_SIZE_K': 64, 'GROUP_SIZE_M': 1, 'grf_mode': 'large'},

0 commit comments

Comments (0)