Skip to content

Commit 5924ac3

Browse files
committed
[XPU] Conditionally add elementwise optimization pass to the pipeline
Conditionally add `-tritonintelgpu-optimize-elementwise-parallelism` to the pipeline.

Signed-off-by: victor-eds <[email protected]>
1 parent 96a664f commit 5924ac3

File tree

2 files changed

+5
-1
lines changed

2 files changed

+5
-1
lines changed

third_party/intel/backend/compiler.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -251,8 +251,9 @@ def make_ttgir(mod, metadata, opt, properties):
251251
passes.common.add_cse(pm)
252252
passes.ttgpuir.add_prefetch(pm)
253253
passes.ttgpuir.add_optimize_dot_operands(pm, True)
254-
if os.getenv("TRITON_INTEL_OPTIMIZE_REDUCTION_LOCALITY", "0") == 1:
254+
if os.getenv("TRITON_INTEL_OPTIMIZE_REDUCTION_LOCALITY", "0") == "1":
255255
intel.passes.ttgpuir.add_optimize_reduction_locality(pm)
256+
intel.passes.ttgpuir.add_optimize_elementwise_parallelism(pm)
256257
intel.passes.ttgpuir.add_remove_layout_conversions(pm)
257258
intel.passes.ttgpuir.add_reduce_data_duplication(pm)
258259
passes.ttgpuir.add_reorder_instructions(pm)

third_party/intel/triton_xpu.cc

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -100,6 +100,9 @@ void init_triton_intel_passes_ttgpuir(py::module &&m) {
100100
gpu::intel::createTritonIntelGPUMaterializeBlockPointer);
101101
ADD_PASS_WRAPPER_0("add_optimize_reduction_locality",
102102
gpu::intel::createTritonIntelGPUOptimizeReductionLocality);
103+
ADD_PASS_WRAPPER_0(
104+
"add_optimize_elementwise_parallelism",
105+
gpu::intel::createTritonIntelGPUOptimizeElementwiseParallelism);
103106
}
104107

105108
void init_triton_intel(py::module &&m) {

0 commit comments

Comments
 (0)