Skip to content

Commit 1a40d6c

Browse files
committed
update again
1 parent b483701 commit 1a40d6c

File tree

2 files changed

+9
-9
lines changed

2 files changed

+9
-9
lines changed

mlir/include/mlir/Dialect/AMDGPU/IR/AMDGPU.td

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -795,7 +795,7 @@ def AMDGPU_GatherToLDSOp :
795 795   Note: only enabled for gfx942 and later.
796 796   }];
797 797   let assemblyFormat = [{
798     - $src `[` $srcIndices `]` `,` $dst `[` $dstIndices `]` attr-dict `:` type($src) `,` type($dst)
    798 + $src `[` $srcIndices `]` `,` $dst `[` $dstIndices `]` attr-dict `:` $transferType `,` type($src) `,` type($dst)
799 799   }];
800 800   let hasVerifier = 1;
801 801   }

mlir/test/Conversion/AMDGPUToROCDL/load_lds.mlir

Lines changed: 8 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -39,8 +39,8 @@ func.func @global_load_to_rocdl_f32(%global : memref<128x72xf32, #gpu_global_add
39 39   // CHECK: %[[C0:.*]] = llvm.mlir.constant(0 : i32) : i32
40 40   // CHECK: %[[C0_2:.*]] = llvm.mlir.constant(0 : i32) : i32
41 41   // CHECK: rocdl.global.load.lds %[[GLOBAL_PTR]], %[[LDS_PTR]], %[[C4]], %[[C0]], %[[C0_2]]
42    - amdgpu.gather_to_lds %global[%c12, %c0], %alloc[%c32, %c0] {transferType = f32}
43    - : memref<128x72xf32, #gpu_global_addrspace>, memref<64x64xf32, #gpu_lds_addrspace>
   42 + amdgpu.gather_to_lds %global[%c12, %c0], %alloc[%c32, %c0]
   43 + : f32, memref<128x72xf32, #gpu_global_addrspace>, memref<64x64xf32, #gpu_lds_addrspace>
44 44   func.return
45 45   }
46 46

@@ -80,8 +80,8 @@ func.func @global_load_to_rocdl_i8(%global : memref<128x72xi8, #gpu_global_addrs
80 80   %c12 = arith.constant 12 : index
81 81   %c32 = arith.constant 32 : index
82 82   %alloc = memref.alloc() : memref<64x64xi8, #gpu_lds_addrspace>
83    - amdgpu.gather_to_lds %global[%c12, %c0], %alloc[%c32, %c0] {transferType = i8}
84    - : memref<128x72xi8, #gpu_global_addrspace>, memref<64x64xi8, #gpu_lds_addrspace>
   83 + amdgpu.gather_to_lds %global[%c12, %c0], %alloc[%c32, %c0]
   84 + : i8, memref<128x72xi8, #gpu_global_addrspace>, memref<64x64xi8, #gpu_lds_addrspace>
85 85   func.return
86 86   }
87 87

@@ -121,8 +121,8 @@ func.func @global_load_to_rocdl_vec(%global : memref<128x72xi16, #gpu_global_add
121 121   %c12 = arith.constant 12 : index
122 122   %c32 = arith.constant 32 : index
123 123   %alloc = memref.alloc() : memref<64x128xi16, #gpu_lds_addrspace>
124     - amdgpu.gather_to_lds %global[%c12, %c0], %alloc[%c32, %c0] {transferType = vector<2 x i16>}
125     - : memref<128x72xi16, #gpu_global_addrspace>, memref<64x128xi16, #gpu_lds_addrspace>
    124 + amdgpu.gather_to_lds %global[%c12, %c0], %alloc[%c32, %c0]
    125 + : vector<2 x i16>, memref<128x72xi16, #gpu_global_addrspace>, memref<64x128xi16, #gpu_lds_addrspace>
126 126   func.return
127 127   }
128 128

@@ -145,7 +145,7 @@ func.func @global_load_to_rocdl_dynamic_indices(%global : memref<512xi32, #gpu_g
145 145   // CHECK: rocdl.global.load.lds %[[GLOBAL_PTR]], %[[LDS_PTR]], %[[C4]], %[[C0]], %[[C0_2]]
146 146   %alloc = memref.alloc() : memref<4x64xi32, #gpu_lds_addrspace>
147 147   %c0 = arith.constant 0 : index
148     - amdgpu.gather_to_lds %global[%src_idx], %alloc[%dst_idx, %c0] {transferType = i32}
149     - : memref<512xi32, #gpu_global_addrspace>, memref<4x64xi32, #gpu_lds_addrspace>
    148 + amdgpu.gather_to_lds %global[%src_idx], %alloc[%dst_idx, %c0]
    149 + : i32, memref<512xi32, #gpu_global_addrspace>, memref<4x64xi32, #gpu_lds_addrspace>
150 150   func.return
151 151   }

0 commit comments

Comments
 (0)