Fix pre-commit

etiotto · etiotto · commit 703450600b12 · 2025-10-28T19:44:48.000Z
Signed-off-by: Ettore Tiotto &lt;ettore.tiotto@intel.com&gt;
diff --git a/test/Triton/Intel/RemoveMasks/unnecessary-masks.mlir b/test/Triton/Intel/RemoveMasks/unnecessary-masks.mlir
@@ -2,59 +2,59 @@
 
 module {
   tt.func public @test1(%in_ptr0: !tt.ptr<f16> {tt.divisibility = 16 : i32}, %in_ptr1: !tt.ptr<f16> {tt.divisibility = 16 : i32}) {
-    %cst = arith.constant dense<0.000000e+00> : tensor<32x32xf16> 
-    %c576_i32 = arith.constant 576 : i32 
-    %c0_i32 = arith.constant 0 : i32 
-    %cst_4 = arith.constant dense<9216> : tensor<32x1xi32> 
-    %cst_5 = arith.constant dense<16> : tensor<1x32xi32> 
-    %cst_6 = arith.constant dense<576> : tensor<1x32xi32> 
-    %cst_7 = arith.constant dense<0xFF800000> : tensor<32x32xf32> 
-    %cst_8 = arith.constant dense<16> : tensor<32x1xi32> 
-    %c32_i32 = arith.constant 32 : i32 
-    %0 = tt.get_program_id x : i32 
-    %1 = arith.muli %0, %c32_i32 : i32 
-    %2 = tt.make_range {end = 32 : i32, start = 0 : i32} : tensor<32xi32> 
-    %3 = tt.expand_dims %2 {axis = 1 : i32} : tensor<32xi32> -> tensor<32x1xi32> 
-    %4 = tt.splat %1 : i32 -> tensor<32x1xi32> 
-    %5 = arith.addi %4, %3 : tensor<32x1xi32> 
-    %6 = tt.expand_dims %2 {axis = 0 : i32} : tensor<32xi32> -> tensor<1x32xi32> 
-    %7 = arith.remsi %5, %cst_8 : tensor<32x1xi32> 
-    %8 = arith.divsi %5, %cst_8 : tensor<32x1xi32> 
-    %9 = tt.splat %in_ptr1 : !tt.ptr<f16> -> tensor<32x1x!tt.ptr<f16>> 
-    %10 = tt.addptr %9, %7 : tensor<32x1x!tt.ptr<f16>>, tensor<32x1xi32> 
-    %11 = tt.load %10 evictionPolicy = evict_last : tensor<32x1x!tt.ptr<f16>> 
-    %12 = arith.extf %11 : tensor<32x1xf16> to tensor<32x1xf32> 
-    %13 = tt.broadcast %7 : tensor<32x1xi32> -> tensor<32x32xi32> 
-    %14 = arith.muli %8, %cst_4 : tensor<32x1xi32> 
-    %15 = tt.broadcast %14 : tensor<32x1xi32> -> tensor<32x32xi32> 
-    %16 = tt.splat %in_ptr0 : !tt.ptr<f16> -> tensor<32x32x!tt.ptr<f16>> 
-    %17 = tt.broadcast %12 : tensor<32x1xf32> -> tensor<32x32xf32> 
+    %cst = arith.constant dense<0.000000e+00> : tensor<32x32xf16>
+    %c576_i32 = arith.constant 576 : i32
+    %c0_i32 = arith.constant 0 : i32
+    %cst_4 = arith.constant dense<9216> : tensor<32x1xi32>
+    %cst_5 = arith.constant dense<16> : tensor<1x32xi32>
+    %cst_6 = arith.constant dense<576> : tensor<1x32xi32>
+    %cst_7 = arith.constant dense<0xFF800000> : tensor<32x32xf32>
+    %cst_8 = arith.constant dense<16> : tensor<32x1xi32>
+    %c32_i32 = arith.constant 32 : i32
+    %0 = tt.get_program_id x : i32
+    %1 = arith.muli %0, %c32_i32 : i32
+    %2 = tt.make_range {end = 32 : i32, start = 0 : i32} : tensor<32xi32>
+    %3 = tt.expand_dims %2 {axis = 1 : i32} : tensor<32xi32> -> tensor<32x1xi32>
+    %4 = tt.splat %1 : i32 -> tensor<32x1xi32>
+    %5 = arith.addi %4, %3 : tensor<32x1xi32>
+    %6 = tt.expand_dims %2 {axis = 0 : i32} : tensor<32xi32> -> tensor<1x32xi32>
+    %7 = arith.remsi %5, %cst_8 : tensor<32x1xi32>
+    %8 = arith.divsi %5, %cst_8 : tensor<32x1xi32>
+    %9 = tt.splat %in_ptr1 : !tt.ptr<f16> -> tensor<32x1x!tt.ptr<f16>>
+    %10 = tt.addptr %9, %7 : tensor<32x1x!tt.ptr<f16>>, tensor<32x1xi32>
+    %11 = tt.load %10 evictionPolicy = evict_last : tensor<32x1x!tt.ptr<f16>>
+    %12 = arith.extf %11 : tensor<32x1xf16> to tensor<32x1xf32>
+    %13 = tt.broadcast %7 : tensor<32x1xi32> -> tensor<32x32xi32>
+    %14 = arith.muli %8, %cst_4 : tensor<32x1xi32>
+    %15 = tt.broadcast %14 : tensor<32x1xi32> -> tensor<32x32xi32>
+    %16 = tt.splat %in_ptr0 : !tt.ptr<f16> -> tensor<32x32x!tt.ptr<f16>>
+    %17 = tt.broadcast %12 : tensor<32x1xf32> -> tensor<32x32xf32>
     %_tmp5 = scf.for %r0_offset = %c0_i32 to %c576_i32 step %c32_i32 iter_args(%_tmp5_9 = %cst_7) -> (tensor<32x32xf32>)  : i32 {
-      %44 = tt.splat %r0_offset : i32 -> tensor<1x32xi32> 
-      %45 = arith.addi %44, %6 : tensor<1x32xi32> 
-      %46 = arith.cmpi slt, %45, %cst_6 : tensor<1x32xi32> 
-      %47 = arith.muli %45, %cst_5 : tensor<1x32xi32> 
-      %48 = tt.broadcast %47 : tensor<1x32xi32> -> tensor<32x32xi32> 
-      %49 = arith.addi %13, %48 : tensor<32x32xi32> 
-      %50 = arith.addi %49, %15 : tensor<32x32xi32> 
-      %51 = tt.addptr %16, %50 : tensor<32x32x!tt.ptr<f16>>, tensor<32x32xi32> 
-      %52 = tt.broadcast %46 : tensor<1x32xi1> -> tensor<32x32xi1> 
-      %53 = tt.load %51, %52, %cst evictionPolicy = evict_last : tensor<32x32x!tt.ptr<f16>> 
-      %54 = arith.extf %53 : tensor<32x32xf16> to tensor<32x32xf32> 
-      %55 = arith.addf %54, %17 : tensor<32x32xf32> 
-      %mask = arith.cmpf ogt, %_tmp5_9, %55 : tensor<32x32xf32> 
-      %56 = arith.cmpf une, %_tmp5_9, %_tmp5_9 : tensor<32x32xf32> 
-      %mask_10 = arith.ori %mask, %56 : tensor<32x32xi1> 
-      %57 = arith.select %mask_10, %_tmp5_9, %55 : tensor<32x32xi1>, tensor<32x32xf32> 
-      %58 = arith.select %52, %57, %_tmp5_9 : tensor<32x32xi1>, tensor<32x32xf32> 
-      scf.yield %58 : tensor<32x32xf32> 
-    } 
+      %44 = tt.splat %r0_offset : i32 -> tensor<1x32xi32>
+      %45 = arith.addi %44, %6 : tensor<1x32xi32>
+      %46 = arith.cmpi slt, %45, %cst_6 : tensor<1x32xi32>
+      %47 = arith.muli %45, %cst_5 : tensor<1x32xi32>
+      %48 = tt.broadcast %47 : tensor<1x32xi32> -> tensor<32x32xi32>
+      %49 = arith.addi %13, %48 : tensor<32x32xi32>
+      %50 = arith.addi %49, %15 : tensor<32x32xi32>
+      %51 = tt.addptr %16, %50 : tensor<32x32x!tt.ptr<f16>>, tensor<32x32xi32>
+      %52 = tt.broadcast %46 : tensor<1x32xi1> -> tensor<32x32xi1>
+      %53 = tt.load %51, %52, %cst evictionPolicy = evict_last : tensor<32x32x!tt.ptr<f16>>
+      %54 = arith.extf %53 : tensor<32x32xf16> to tensor<32x32xf32>
+      %55 = arith.addf %54, %17 : tensor<32x32xf32>
+      %mask = arith.cmpf ogt, %_tmp5_9, %55 : tensor<32x32xf32>
+      %56 = arith.cmpf une, %_tmp5_9, %_tmp5_9 : tensor<32x32xf32>
+      %mask_10 = arith.ori %mask, %56 : tensor<32x32xi1>
+      %57 = arith.select %mask_10, %_tmp5_9, %55 : tensor<32x32xi1>, tensor<32x32xf32>
+      %58 = arith.select %52, %57, %_tmp5_9 : tensor<32x32xi1>, tensor<32x32xf32>
+      scf.yield %58 : tensor<32x32xf32>
+    }
     tt.return
   }
   // CHECK: tt.func public @test1([[PARAM_0_:%.+]]: !tt.ptr<f16> {tt.divisibility = 16 : i32}, [[PARAM_1_:%.+]]: !tt.ptr<f16> {tt.divisibility = 16 : i32}) {
   // CHECK:   scf.for
   // CHECK:     [[PTR:%.+]] = tt.addptr {{.*}} : tensor<32x32x!tt.ptr<f16>>, tensor<32x32xi32>
-  // CHECK:     [[LOAD:%.+]] = tt.load [[PTR]] evictionPolicy = evict_last : tensor<32x32x!tt.ptr<f16>>  
+  // CHECK:     [[LOAD:%.+]] = tt.load [[PTR]] evictionPolicy = evict_last : tensor<32x32x!tt.ptr<f16>>
   // CHECK:     arith.extf [[LOAD]] : tensor<32x32xf16> to tensor<32x32xf32>
   // CHECK:     [[ORI:%.+]] = arith.ori {{.*}} : tensor<32x32xi1>
   // CHECK:     [[SEL:%.+]] = arith.select [[ORI]], {{.*}}, {{.*}} : tensor<32x32xi1>, tensor<32x32xf32>