Skip to content

Commit d2e9b1b

Browse files
committed
TEST
1 parent 793a3ae commit d2e9b1b

File tree

1 file changed

+5
-1
lines changed

1 file changed

+5
-1
lines changed

third_party/intel/lib/TritonIntelGPUTransforms/OptimizeElementwiseParallelism.cpp

Lines changed: 5 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -104,8 +104,12 @@ bool optimizationDoesNotWorsenRegisterPressure(
104 104
if (auto convertLayout = dyn_cast<ConvertLayoutOp>(owner))
105 105
return convertLayout.getResult().getType() == newType;
106 106

107+
// Broadcasted in source.
108+
if (isa<ExpandDimsOp>(owner))
109+
return true;
110+
107 111
// Allow for loop optimizations.
108-
if (auto yield = dyn_cast<scf::YieldOp>(owner))
112+
if (isa<scf::YieldOp>(owner))
109 113
return true;
110 114

111 115
// Only allow candidates. Check only operation constraints. We do not have

0 commit comments

Comments
 (0)