
Commit 3ecb49e

bump-llvm[bot], github-actions[bot], and makslevental authored
[LLVM] Bump to 75aa01b89 (#257)
Bump LLVM to llvm/llvm-project@75aa01b89

Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com>
Co-authored-by: Maksim Levental <[email protected]>
1 parent c272020 commit 3ecb49e

File tree

3 files changed (+17, -17 lines)


projects/eudsl-python-extras/examples/cuda_matmul_opt.py

Lines changed: 10 additions & 10 deletions
@@ -415,7 +415,7 @@ def sgemm_shared_mem_1d_block_tiling[
     inner_row_B = tid / BN

     thread_results = memref.alloca((TM,), dtype)
-    linalg.fill(0, thread_results)
+    linalg.fill(0.0, thread_results)

     for bk_idx in range_(0, K, BK):
         # Move blocktile to beginning of A's row and B's column
@@ -483,13 +483,13 @@ def sgemm_shared_mem_2d_block_tiling[
     stride_B = num_threads_blocktile // BN

     thread_results = memref.alloca((TM, TN), dtype)
-    linalg.fill(0, thread_results)
+    linalg.fill(0.0, thread_results)

     reg_M = memref.alloca((TM,), dtype)
-    linalg.fill(0, reg_M)
+    linalg.fill(0.0, reg_M)

     reg_N = memref.alloca((TN,), dtype)
-    linalg.fill(0, reg_N)
+    linalg.fill(0.0, reg_N)

     for bk_idx in range_(0, K, BK):
         A_ = A[c_row : c_row + BM, bk_idx : bk_idx + BK]
@@ -579,13 +579,13 @@ def sgemm_shared_mem_2d_block_tiling_vectorize[
     inner_row_B = tid / (BN // VECTOR_WIDTH)

     thread_results = memref.alloca((TM, TN), dtype)
-    linalg.fill(0, thread_results)
+    linalg.fill(0.0, thread_results)

     reg_M = memref.alloca((TM,), dtype)
-    linalg.fill(0, reg_M)
+    linalg.fill(0.0, reg_M)

     reg_N = memref.alloca((TN,), dtype)
-    linalg.fill(0, reg_N)
+    linalg.fill(0.0, reg_N)

     for bk_idx in range_(0, K, BK):
         A_ = A[c_row : c_row + BM, bk_idx : bk_idx + BK]
@@ -708,13 +708,13 @@ def sgemm_warp_tiling[

     # allocate thread-local cache for results in registerfile
     thread_results = memref.alloca((WMITER * TM, WNITER * TN), dtype)
-    linalg.fill(0, thread_results)
+    linalg.fill(0.0, thread_results)

     reg_M = memref.alloca((WMITER, TM), dtype)
-    linalg.fill(0, reg_M)
+    linalg.fill(0.0, reg_M)

     reg_N = memref.alloca((WNITER, TN), dtype)
-    linalg.fill(0, reg_N)
+    linalg.fill(0.0, reg_N)

     for bk_idx in range_(0, K, BK):
         A_ = A[c_row : c_row + BM, bk_idx : bk_idx + BK]
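
The change in this file is uniform: every `linalg.fill(0, buf)` becomes `linalg.fill(0.0, buf)`. The Python bindings evidently derive the `arith.constant` type from the literal, so an integer `0` yields an `i32` constant even when `dtype` is a floating-point type, and after this LLVM bump that element-type mismatch in `linalg.fill` is rejected. A minimal sketch of the distinction, assuming `dtype = T.f32()` and an illustrative tile size (not code from this commit):

    TM = 8                                # illustrative per-thread tile size
    dtype = T.f32()                       # assumed float element type
    thread_results = memref.alloca((TM,), dtype)
    linalg.fill(0.0, thread_results)      # float literal -> f32 constant, matches memref<8xf32>
    # linalg.fill(0, thread_results)      # int literal -> i32 constant; mismatches f32 elements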

projects/eudsl-python-extras/tests/dialect/test_transform.py

Lines changed: 6 additions & 6 deletions
@@ -702,7 +702,7 @@ def matmul_i8_i8(
     B: T.tensor(K, N, T.i8()),
 ):
     empty = tensor.empty(M, N, T.i8())
-    filled = linalg_dialect.fill(arith.constant(0), outs=[empty])
+    filled = linalg_dialect.fill(arith.constant(0, type=T.i8()), outs=[empty])
     return linalg.matmul(A, B, filled)

 @module(attrs={"transform.target_tag": StringAttr.get("payload")})
@@ -856,8 +856,8 @@ def main(variant_op: any_op_t()):
 module attributes {transform.target_tag = "payload"} {
   func.func @matmul_i8_i8(%arg0: tensor<16x256xi8>, %arg1: tensor<256x256xi8>) -> tensor<16x256xi8> {
     %0 = tensor.empty() : tensor<16x256xi8>
-    %c0_i32 = arith.constant 0 : i32
-    %1 = linalg.fill ins(%c0_i32 : i32) outs(%0 : tensor<16x256xi8>) -> tensor<16x256xi8>
+    %c0_i8 = arith.constant 0 : i8
+    %1 = linalg.fill ins(%c0_i8 : i8) outs(%0 : tensor<16x256xi8>) -> tensor<16x256xi8>
     %2 = linalg.matmul {cast = #linalg.type_fn<cast_signed>} ins(%arg0, %arg1 : tensor<16x256xi8>, tensor<256x256xi8>) outs(%1 : tensor<16x256xi8>) -> tensor<16x256xi8>
     return %2 : tensor<16x256xi8>
   }
@@ -924,7 +924,7 @@ def matmul_i8_i8(
     B: T.tensor(K, N, T.i8()),
 ):
     empty = tensor.empty(M, N, T.i8())
-    filled = linalg_dialect.fill(arith.constant(0), outs=[empty])
+    filled = linalg_dialect.fill(arith.constant(0, type=T.i8()), outs=[empty])
     return linalg.matmul(A, B, filled)

 @module(attrs={"transform.target_tag": StringAttr.get("payload")})
@@ -997,13 +997,13 @@ def main(variant_op: any_op_t()):
 module {
   module attributes {transform.target_tag = "payload"} {
     func.func @matmul_i8_i8(%arg0: tensor<16x256xi8>, %arg1: tensor<256x256xi8>) -> tensor<16x256xi8> {
-      %c0_i32 = arith.constant 0 : i32
+      %c0_i8 = arith.constant 0 : i8
       %0 = tensor.empty() : tensor<16x256xi8>
       %1 = tensor.empty() : tensor<1x4x16x64xi8>
       %pack = linalg.pack %arg0 inner_dims_pos = [0, 1] inner_tiles = [16, 64] into %1 : tensor<16x256xi8> -> tensor<1x4x16x64xi8>
       %2 = tensor.empty() : tensor<4x1x64x64xi8>
       %3 = tensor.empty() : tensor<1x1x16x64xi8>
-      %4 = linalg.fill ins(%c0_i32 : i32) outs(%3 : tensor<1x1x16x64xi8>) -> tensor<1x1x16x64xi8>
+      %4 = linalg.fill ins(%c0_i8 : i8) outs(%3 : tensor<1x1x16x64xi8>) -> tensor<1x1x16x64xi8>
       %5 = scf.forall (%arg2, %arg3) in (1, 4) shared_outs(%arg4 = %0) -> (tensor<16x256xi8>) {
         %6 = affine.apply #map(%arg3)
         %extracted_slice = tensor.extract_slice %arg1[0, %6] [256, 64] [1, 1] : tensor<256x256xi8> to tensor<256x64xi8>
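
The test fix is the same type-inference issue on the integer side: `arith.constant(0)` with no explicit type defaults to `i32` (the old expected IR reads `%c0_i32 = arith.constant 0 : i32`), while the tensor being filled has `i8` elements. Passing `type=T.i8()` produces the `i8` constant the updated IR expects, since `linalg.fill` evidently now requires the scalar to match the output element type. A minimal sketch of the two spellings, reusing only calls that appear in this diff:

    c_default = arith.constant(0)               # lowers to: %c0_i32 = arith.constant 0 : i32
    c_i8 = arith.constant(0, type=T.i8())       # lowers to: %c0_i8 = arith.constant 0 : i8
    empty = tensor.empty(16, 256, T.i8())
    filled = linalg_dialect.fill(c_i8, outs=[empty])  # i8 scalar matches tensor<16x256xi8>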

third_party/llvm-project

Submodule llvm-project updated 44 files
