@@ -10,7 +10,7 @@ module attributes {"ttg.num-warps" = 4 : i32} {
10
10
// CHECK-LABEL: @two_consumers
11
11
tt.func @two_consumers (%lb: i32 , %ub: i32 , %step: i32 ) {
12
12
// CHECK: [[C0:%.*]] = arith.constant 0 : i32
13
- // CHECK-NEXT: [[ABUF:%.*]] = ttg.local_alloc : () -> !ttg.memdesc<2x1xi32 , {{.*}}>
13
+ // CHECK-NEXT: [[ABUF:%.*]] = ttg.local_alloc : () -> !ttg.memdesc<1x1xi32 , {{.*}}>
14
14
// CHECK-NEXT: [[AREF:%.*]] = nvws.aref.create [[ABUF]]
15
15
scf.for %i = %lb to %ub step %step iter_args () -> () : i32 {
16
16
%0 = " op_a" () {ttg.partition = 0 } : () -> !ty
@@ -40,7 +40,7 @@ tt.func @two_consumers(%lb: i32, %ub: i32, %step: i32) {
40
40
// CHECK-LABEL: @distance_one
41
41
tt.func @distance_one (%lb: i32 , %ub: i32 , %step: i32 ) {
42
42
// CHECK: [[C0:%.*]] = arith.constant 0 : i32
43
- // CHECK: [[ABUF:%.*]] = ttg.local_alloc : () -> !ttg.memdesc<2x1xi32 , {{.*}}>
43
+ // CHECK: [[ABUF:%.*]] = ttg.local_alloc : () -> !ttg.memdesc<1x1xi32 , {{.*}}>
44
44
// CHECK-NEXT: [[AREF:%.*]] = nvws.aref.create [[ABUF]]
45
45
%cst = arith.constant dense <0 > : !ty
46
46
// CHECK: scf.for [[IV:%.*]] = [[LB:%.*]] to [[UB:%.*]] step [[STEP:%.*]] iter_args([[K:%.*]] = {{.*}})
@@ -63,9 +63,9 @@ tt.func @distance_one(%lb: i32, %ub: i32, %step: i32) {
63
63
}
64
64
65
65
tt.func @complex_case (%lb: i32 , %ub: i32 , %step: i32 ) {
66
- // CHECK: [[ABUF1:%.*]] = ttg.local_alloc : () -> !ttg.memdesc<2x1xi32 , {{.*}}>
66
+ // CHECK: [[ABUF1:%.*]] = ttg.local_alloc : () -> !ttg.memdesc<1x1xi32 , {{.*}}>
67
67
// CHECK-NEXT: [[AREF1:%.*]] = nvws.aref.create [[ABUF1]]
68
- // CHECK-NEXT: [[ABUF2:%.*]] = ttg.local_alloc : () -> !ttg.memdesc<2x1xi32 , {{.*}}>
68
+ // CHECK-NEXT: [[ABUF2:%.*]] = ttg.local_alloc : () -> !ttg.memdesc<1x1xi32 , {{.*}}>
69
69
// CHECK-NEXT: [[AREF2:%.*]] = nvws.aref.create [[ABUF2]]
70
70
%cst = arith.constant dense <0 > : !ty
71
71
// CHECK: scf.for [[IV:%.*]] = [[LB:%.*]] to [[UB:%.*]] step [[STEP:%.*]] iter_args([[K:%.*]] = {{.*}}, [[L:%.*]] = {{.*}})
0 commit comments