@@ -545,9 +545,9 @@ module attributes {transform.with_named_sequence} {
545545!type = memref <2 x 32 x f32 >
546546!type1d = memref <32 x f32 >
547547
548- // CHECK-DAG: #[[$MAPBLIN:.*]] = affine_map<(d0, d1, d2) -> (d0 + d1 * 12 + d2 * 108)>
549- // CHECK-DAG: #[[$MAPBX:.*]] = affine_map<(d0, d1, d2) -> ((d0 + d1 * 12 + d2 * 108) mod 7)>
550- // CHECK-DAG: #[[$MAPBY:.*]] = affine_map<(d0, d1, d2) -> ((d0 + d1 * 12 + d2 * 108) floordiv 7)>
548+ // CHECK-DAG: #[[$MAPBLIN:.*]] = affine_map<()[s0, s1, s2] -> (s0 + s1 * 12 + s2 * 108)>
549+ // CHECK-DAG: #[[$MAPBX:.*]] = affine_map<()[s0, s1, s2] -> ((s0 + s1 * 12 + s2 * 108) mod 7)>
550+ // CHECK-DAG: #[[$MAPBY:.*]] = affine_map<()[s0, s1, s2] -> ((s0 + s1 * 12 + s2 * 108) floordiv 7)>
551551
552552// CHECK-LABEL: func.func @block_linear_existing_launch(
553553// CHECK-SAME: %[[ARGX:[0-9a-z]+]]: memref<2x32xf32>
@@ -566,9 +566,9 @@ func.func @block_linear_existing_launch(
566566// CHECK-DAG: %[[BIDX:.*]] = gpu.block_id x
567567// CHECK-DAG: %[[BIDY:.*]] = gpu.block_id y
568568// CHECK-DAG: %[[BIDZ:.*]] = gpu.block_id z
569- // CHECK-DAG: %[[BIDLIN:.*]] = affine.apply #[[$MAPBLIN]](%[[BIDX]], %[[BIDY]], %[[BIDZ]])
570- // CHECK-DAG: %[[BLX:.*]] = affine.apply #[[$MAPBX]](%[[BIDX]], %[[BIDY]], %[[BIDZ]])
571- // CHECK-DAG: %[[BLY:.*]] = affine.apply #[[$MAPBY]](%[[BIDX]], %[[BIDY]], %[[BIDZ]])
569+ // CHECK-DAG: %[[BIDLIN:.*]] = affine.apply #[[$MAPBLIN]]()[%[[BIDX]], %[[BIDY]], %[[BIDZ]]]
570+ // CHECK-DAG: %[[BLX:.*]] = affine.apply #[[$MAPBX]]()[%[[BIDX]], %[[BIDY]], %[[BIDZ]]]
571+ // CHECK-DAG: %[[BLY:.*]] = affine.apply #[[$MAPBY]]()[%[[BIDX]], %[[BIDY]], %[[BIDZ]]]
572572// CHECK-DAG: %[[CMPLIN:.*]] = arith.cmpi ult, %[[BIDLIN]], %[[C63]] : index
573573// CHECK: scf.if %[[CMPLIN]]
574574// CHECK: memref.load %[[ARGX]][%[[BLX]], %[[BLY]]]
@@ -600,8 +600,8 @@ module attributes {transform.with_named_sequence} {
600600!type = memref <2 x 32 x f32 >
601601!type1d = memref <32 x f32 >
602602
603- // CHECK-DAG: #[[$MAPBX:.*]] = affine_map<(d0) -> (d0 mod 7)>
604- // CHECK-DAG: #[[$MAPBY:.*]] = affine_map<(d0, d1, d2) -> (d1 + d2 * 9 + d0 floordiv 7)>
603+ // CHECK-DAG: #[[$MAPBX:.*]] = affine_map<()[s0] -> (s0 mod 7)>
604+ // CHECK-DAG: #[[$MAPBY:.*]] = affine_map<()[s0, s1, s2] -> (s1 + s2 * 9 + s0 floordiv 7)>
605605
606606// CHECK-LABEL: func.func @block_linear_generate_launch(
607607// CHECK-SAME: %[[ARGX:[0-9a-z]+]]: memref<2x32xf32>
@@ -620,8 +620,8 @@ func.func @block_linear_generate_launch(
620620// CHECK-DAG: %[[BIDX:.*]] = gpu.block_id x
621621// CHECK-DAG: %[[BIDY:.*]] = gpu.block_id y
622622// CHECK-DAG: %[[BIDZ:.*]] = gpu.block_id z
623- // CHECK-DAG: %[[BLX:.*]] = affine.apply #[[$MAPBX]](%[[BIDX]])
624- // CHECK-DAG: %[[BLY:.*]] = affine.apply #[[$MAPBY]](%[[BIDX]], %[[BIDY]], %[[BIDZ]])
623+ // CHECK-DAG: %[[BLX:.*]] = affine.apply #[[$MAPBX]]()[%[[BIDX]]]
624+ // CHECK-DAG: %[[BLY:.*]] = affine.apply #[[$MAPBY]]()[%[[BIDX]], %[[BIDY]], %[[BIDZ]]]
625625// CHECK: memref.load %[[ARGX]][%[[BLX]], %[[BLY]]]
626626// CHECK: memref.load %[[ARGY]][%[[BLX]], %[[BLY]]]
627627 scf.forall (%i , %j ) in (%c7 , %c9 ) {
@@ -647,7 +647,7 @@ module attributes {transform.with_named_sequence} {
647647#map = affine_map <(d0 ) -> (d0 * 128 )>
648648#map1 = affine_map <(d0 ) -> (d0 * 32 )>
649649
650- // CHECK-DAG: #[[$MAPB:.*]] = affine_map<(d0) -> (d0 * 128)>
650+ // CHECK-DAG: #[[$MAPB:.*]] = affine_map<()[s0] -> (s0 * 128)>
651651// CHECK-DAG: #[[$MAPW:.*]] = affine_map<()[s0, s1, s2] -> (s2 * 32 + ((s0 + s1 * 4) floordiv 32) * 32)>
652652
653653// CHECK-LABEL: func.func @simple_fill(
@@ -660,7 +660,7 @@ func.func @simple_fill(%arg0: memref<128xf32>) -> memref<128xf32> {
660660// CHECK: gpu.launch
661661 scf.forall (%arg1 ) in (1 ) {
662662// CHECK: %[[BIDX:.*]] = gpu.block_id x
663- // CHECK: %[[BLX:.*]] = affine.apply #[[$MAPB]](%[[BIDX]])
663+ // CHECK: %[[BLX:.*]] = affine.apply #[[$MAPB]]()[%[[BIDX]]]
664664 %0 = affine.apply #map (%arg1 )
665665 %subview = memref.subview %arg0 [%0 ] [128 ] [1 ] : memref <128 xf32 > to memref <128 xf32 , strided <[1 ], offset : ?>>
666666 scf.forall (%arg2 ) in (4 ) {
0 commit comments