Skip to content

Commit 4259f63

Browse files
committed
Add negative checks: a `not mlir-opt` RUN line with CHECK-OLD error expectations for a non-gfx950 chipset.
1 parent fa30258 commit 4259f63

File tree

1 file changed

+18
-11
lines changed

1 file changed

+18
-11
lines changed
Lines changed: 18 additions & 11 deletions
Original file line number | Diff line number | Diff line change
@@ -1,32 +1,39 @@
11
// RUN: mlir-opt %s -convert-amdgpu-to-rocdl=chipset=gfx950 | FileCheck %s
2-
3-
#gpu_lds_addrspace = 3
4-
#amdgpu_fat_buffer_addrspace = 7
2+
// RUN: not mlir-opt %s --split-input-file -convert-amdgpu-to-rocdl=chipset=gfx945 2>&1 | FileCheck %s --check-prefix=CHECK-OLD
53

64
// CHECK-LABEL: func @transpose_load_to_rocdl_4xf16
7-
func.func @transpose_load_to_rocdl_4xf16(%idx1 : index, %idx2 : index, %wgmem : memref<128x72xf16, #gpu_lds_addrspace>) -> vector<4xf16> {
5+
func.func @transpose_load_to_rocdl_4xf16(%idx1 : index, %idx2 : index, %wgmem : memref<128x72xf16, 3>) -> vector<4xf16> {
86
// CHECK: rocdl.ds.read.tr16.b64
9-
%0 = amdgpu.transpose_load %wgmem[%idx1, %idx2] : memref<128x72xf16, #gpu_lds_addrspace> -> vector<4xf16>
7+
// CHECK-OLD: error: 'amdgpu.transpose_load' op Non-gfx950 chipset not supported
8+
%0 = amdgpu.transpose_load %wgmem[%idx1, %idx2] : memref<128x72xf16, 3> -> vector<4xf16>
109
return %0 : vector<4xf16>
1110
}
1211

12+
// -----
13+
1314
// CHECK-LABEL: func @transpose_load_to_rocdl_8xi8
14-
func.func @transpose_load_to_rocdl_8xi8(%idx1 : index, %idx2 : index, %wgmem : memref<128x128xi8, #gpu_lds_addrspace>) -> vector<8xi8> {
15+
func.func @transpose_load_to_rocdl_8xi8(%idx1 : index, %idx2 : index, %wgmem : memref<128x128xi8, 3>) -> vector<8xi8> {
1516
// CHECK: rocdl.ds.read.tr8.b64
16-
%0 = amdgpu.transpose_load %wgmem[%idx1, %idx2] : memref<128x128xi8, #gpu_lds_addrspace> -> vector<8xi8>
17+
// CHECK-OLD: error: 'amdgpu.transpose_load' op Non-gfx950 chipset not supported
18+
%0 = amdgpu.transpose_load %wgmem[%idx1, %idx2] : memref<128x128xi8, 3> -> vector<8xi8>
1719
return %0 : vector<8xi8>
1820
}
1921

22+
// -----
23+
2024
// CHECK-LABEL: func @transpose_load_to_rocdl_16xi4
21-
func.func @transpose_load_to_rocdl_16xi4(%idx1 : index, %idx2 : index, %wgmem : memref<128x16xi4, #gpu_lds_addrspace>) -> vector<16xi4> {
25+
func.func @transpose_load_to_rocdl_16xi4(%idx1 : index, %idx2 : index, %wgmem : memref<128x16xi4, 3>) -> vector<16xi4> {
2226
// CHECK: rocdl.ds.read.tr4.b64
23-
%0 = amdgpu.transpose_load %wgmem[%idx1, %idx2] : memref<128x16xi4, #gpu_lds_addrspace> -> vector<16xi4>
27+
// CHECK-OLD: error: 'amdgpu.transpose_load' op Non-gfx950 chipset not supported
28+
%0 = amdgpu.transpose_load %wgmem[%idx1, %idx2] : memref<128x16xi4, 3> -> vector<16xi4>
2429
return %0 : vector<16xi4>
2530
}
2631

32+
// -----
33+
2734
// CHECK-LABEL: func @transpose_load_to_rocdl_3xi32
28-
func.func @transpose_load_to_rocdl_3xi32(%idx1 : index, %idx2 : index, %wgmem : memref<128x32xi32, #gpu_lds_addrspace>) -> vector<3xi32> {
35+
func.func @transpose_load_to_rocdl_3xi32(%idx1 : index, %idx2 : index, %wgmem : memref<128x32xi32, 3>) -> vector<3xi32> {
2936
// CHECK: rocdl.ds.read.tr6.b96
30-
%0 = amdgpu.transpose_load %wgmem[%idx1, %idx2] : memref<128x32xi32, #gpu_lds_addrspace> -> vector<3xi32>
37+
%0 = amdgpu.transpose_load %wgmem[%idx1, %idx2] : memref<128x32xi32, 3> -> vector<3xi32>
3138
return %0 : vector<3xi32>
3239
}

0 commit comments

Comments
 (0)