Skip to content

Commit 2af05fa

Browse files
committed
Update tests
1 parent b4908bd commit 2af05fa

File tree

1 file changed

+16
-12
lines changed

1 file changed

+16
-12
lines changed

mlir/test/Dialect/AMDGPU/amdgpu-fold-memrefs.mlir

Lines changed: 16 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -54,18 +54,20 @@ func.func @subview_folding_offset(%offset_i: index, %offset_j: index) {
5454
// CHECK: func @test_expand_shape
5555
// CHECK-SAME: %[[ARG0:.*]]: index, %[[ARG1:.*]]: index
5656
func.func @test_expand_shape(%offset_i: index, %offset_j: index) {
57-
// CHECK: %[[LOCAL:.*]] = memref.alloc() : memref<64x64xf16, 3>
57+
// CHECK: %[[LOCAL:.*]] = memref.alloc() : memref<4096xf16, 3>
5858
// CHECK: %[[MEM:.*]] = memref.alloc() : memref<8192xf16>
5959
// CHECK: %[[C0:.*]] = arith.constant 0 : index
60-
// CHECK: %[[IDX:.*]] = affine.linearize_index [%[[ARG0]], %[[ARG1]]] by (64, 128) : index
61-
// CHECK: amdgpu.gather_to_lds %[[MEM]][%[[IDX]]], %[[LOCAL]][%[[C0]], %[[C0]]]
62-
// CHECK-SAME: vector<8xf16>, memref<8192xf16>, memref<64x64xf16, 3>
60+
// CHECK: %[[IDXM:.*]] = affine.linearize_index [%[[ARG0]], %[[ARG1]]] by (64, 128) : index
61+
// CHECK: %[[IDXL:.*]] = affine.linearize_index [%[[C0]], %[[C0]]] by (64, 64) : index
62+
// CHECK: amdgpu.gather_to_lds %[[MEM]][%[[IDXM]]], %[[LOCAL]][%[[IDXL]]]
63+
// CHECK-SAME: vector<8xf16>, memref<8192xf16>, memref<4096xf16, 3>
6364

64-
%alloc = memref.alloc() : memref<64x64xf16, #gpu_lds_addrspace>
65+
%alloc = memref.alloc() : memref<4096xf16, #gpu_lds_addrspace>
6566
%mem = memref.alloc() : memref<8192xf16>
66-
%expand = memref.expand_shape %mem [[0, 1]] output_shape [64, 128] : memref<8192xf16> into memref<64x128xf16>
67+
%expand_mem = memref.expand_shape %mem [[0, 1]] output_shape [64, 128] : memref<8192xf16> into memref<64x128xf16>
68+
%expand_alloc = memref.expand_shape %alloc [[0, 1]] output_shape [64, 64] : memref<4096xf16, #gpu_lds_addrspace> into memref<64x64xf16, #gpu_lds_addrspace>
6769
%c0 = arith.constant 0 : index
68-
amdgpu.gather_to_lds %expand[%offset_i, %offset_j], %alloc[%c0, %c0]
70+
amdgpu.gather_to_lds %expand_mem[%offset_i, %offset_j], %expand_alloc[%c0, %c0]
6971
: vector<8xf16>, memref<64x128xf16>, memref<64x64xf16, #gpu_lds_addrspace>
7072
func.return
7173
}
@@ -80,15 +82,17 @@ func.func @test_collapse_shape(%offset_i: index, %offset_j: index) {
8082
// CHECK: %[[LOCAL:.*]] = memref.alloc() : memref<64x64xf16, 3>
8183
// CHECK: %[[MEM:.*]] = memref.alloc() : memref<64x128xf16>
8284
// CHECK: %[[C0:.*]] = arith.constant 0 : index
83-
// CHECK: %[[INDICES:.*]]:2 = affine.delinearize_index %[[ARG0]] into (64, 128) : index, index
84-
// CHECK: amdgpu.gather_to_lds %[[MEM]][%[[INDICES]]#0, %[[INDICES]]#1], %[[LOCAL]][%[[C0]], %[[C0]]]
85+
// CHECK: %[[INDICES_MEM:.*]]:2 = affine.delinearize_index %[[ARG0]] into (64, 128) : index, index
86+
// CHECK: %[[INDICES_LDS:.*]]:2 = affine.delinearize_index %[[ARG1]] into (64, 64) : index, index
87+
// CHECK: amdgpu.gather_to_lds %[[MEM]][%[[INDICES_MEM]]#0, %[[INDICES_MEM]]#1], %[[LOCAL]][%[[INDICES_LDS]]#0, %[[INDICES_LDS]]#1]
8588
// CHECK-SAME: vector<8xf16>, memref<64x128xf16>, memref<64x64xf16, 3>
8689

8790
%alloc = memref.alloc() : memref<64x64xf16, #gpu_lds_addrspace>
91+
%collapse_alloc = memref.collapse_shape %alloc [[0, 1]] : memref<64x64xf16, #gpu_lds_addrspace> into memref<4096xf16, #gpu_lds_addrspace>
8892
%mem = memref.alloc() : memref<64x128xf16>
89-
%collapse = memref.collapse_shape %mem [[0, 1]] : memref<64x128xf16> into memref<8192xf16>
93+
%collapse_mem = memref.collapse_shape %mem [[0, 1]] : memref<64x128xf16> into memref<8192xf16>
9094
%c0 = arith.constant 0 : index
91-
amdgpu.gather_to_lds %collapse[%offset_i], %alloc[%c0, %c0]
92-
: vector<8xf16>, memref<8192xf16>, memref<64x64xf16, #gpu_lds_addrspace>
95+
amdgpu.gather_to_lds %collapse_mem[%offset_i], %collapse_alloc[%offset_j]
96+
: vector<8xf16>, memref<8192xf16>, memref<4096xf16, #gpu_lds_addrspace>
9397
func.return
9498
}

0 commit comments

Comments
 (0)