Skip to content

Commit c0b7415

Browse files
Fallback performance experiment
Signed-off-by: Whitney Tsang <[email protected]>
1 parent 2d1ba45 commit c0b7415

File tree

3 files changed

+9
-9
lines changed

3 files changed

+9
-9
lines changed

benchmarks/triton_kernels_benchmark/gemm_tensor_desc_benchmark.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -25,11 +25,11 @@ def matmul_kernel_with_tensor_descriptors(
2525
# Pointers to matrices
2626
a_ptr, b_ptr, c_ptr,
2727
# Matrix dimensions
28-
M: tl.constexpr, N: tl.constexpr, K: tl.constexpr,
28+
M, N, K,
2929
# Stride variables
30-
stride_am: tl.constexpr, stride_ak: tl.constexpr, #
31-
stride_bk: tl.constexpr, stride_bn: tl.constexpr, #
32-
stride_cm: tl.constexpr, stride_cn: tl.constexpr,
30+
stride_am, stride_ak, #
31+
stride_bk, stride_bn, #
32+
stride_cm, stride_cn,
3333
# Meta-parameters
3434
BLOCK_SIZE_M: tl.constexpr, BLOCK_SIZE_N: tl.constexpr, BLOCK_SIZE_K: tl.constexpr, GROUP_SIZE_M: tl.constexpr):
3535
pid = tl.program_id(axis=0)

benchmarks/triton_kernels_benchmark/gemm_tensor_of_ptr_benchmark.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -25,11 +25,11 @@ def matmul_kernel(
2525
# Pointers to matrices
2626
a_ptr, b_ptr, c_ptr,
2727
# Matrix dimensions
28-
M: tl.constexpr, N: tl.constexpr, K: tl.constexpr,
28+
M, N, K,
2929
# Stride variables
30-
stride_am: tl.constexpr, stride_ak: tl.constexpr, #
31-
stride_bk: tl.constexpr, stride_bn: tl.constexpr, #
32-
stride_cm: tl.constexpr, stride_cn: tl.constexpr,
30+
stride_am, stride_ak, #
31+
stride_bk, stride_bn, #
32+
stride_cm, stride_cn,
3333
# Meta-parameters
3434
BLOCK_SIZE_M: tl.constexpr, BLOCK_SIZE_N: tl.constexpr, BLOCK_SIZE_K: tl.constexpr, GROUP_SIZE_M: tl.constexpr):
3535
pid = tl.program_id(axis=0)

third_party/intel/backend/compiler.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -207,7 +207,7 @@ def make_ttir(cls, mod, metadata, opt):
207207
pm = ir.pass_manager(mod.context)
208208
pm.enable_debug()
209209
passes.common.add_inliner(pm)
210-
intel.passes.ttir.add_convert_tdesc_to_block_pointer(pm)
210+
#intel.passes.ttir.add_convert_tdesc_to_block_pointer(pm)
211211
passes.ttir.add_rewrite_tensor_descriptor_to_pointer(pm)
212212
passes.common.add_cse(pm)
213213
passes.common.add_licm(pm)

0 commit comments

Comments
 (0)