@@ -214,47 +214,36 @@ func.func @tma_load_multicast5d(%tmaDescriptor: !llvm.ptr, %dest : !llvm.ptr<3>,
214
214
215
215
// CHECK-LABEL: @tma_store_1d
216
216
func.func @tma_store_1d (%tmaDescriptor: !llvm.ptr , %src : !llvm.ptr <3 >, %crd0: i32 , %p : i1 ) {
217
- // CHECK: llvm.inline_asm has_side_effects asm_dialect = att "cp.async.bulk.tensor.1d.global.shared::cta.bulk_group [$0, {$2} ], [$1];", "l,r,r"
218
- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ] : !llvm.ptr , !llvm.ptr <3 >, i32
219
217
// CHECK: llvm.inline_asm has_side_effects asm_dialect = att "@$3 cp.async.bulk.tensor.1d.global.shared::cta.bulk_group [$0, {$2} ], [$1];", "l,r,r,b"
220
- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >, i32 , i1
218
+ nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >
221
219
return
222
220
}
223
221
224
222
// CHECK-LABEL: @tma_store_2d
225
223
func.func @tma_store_2d (%tmaDescriptor: !llvm.ptr , %src : !llvm.ptr <3 >, %crd0: i32 , %crd1: i32 , %p : i1 ) {
226
- // CHECK: llvm.inline_asm has_side_effects asm_dialect = att "cp.async.bulk.tensor.2d.global.shared::cta.bulk_group [$0, {$2, $3} ], [$1];", "l,r,r,r"
227
- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ] : !llvm.ptr , !llvm.ptr <3 >, i32 , i32
228
224
// CHECK: llvm.inline_asm has_side_effects asm_dialect = att "@$4 cp.async.bulk.tensor.2d.global.shared::cta.bulk_group [$0, {$2, $3} ], [$1];", "l,r,r,r,b"
229
- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >, i32 , i32 , i1
225
+ nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >
230
226
return
231
227
}
232
228
233
229
// CHECK-LABEL: @tma_store_3d
234
230
func.func @tma_store_3d (%tmaDescriptor: !llvm.ptr , %src : !llvm.ptr <3 >, %crd0: i32 , %crd1: i32 , %crd2: i32 , %p : i1 ) {
235
- // CHECK: llvm.inline_asm has_side_effects asm_dialect = att "cp.async.bulk.tensor.3d.global.shared::cta.bulk_group [$0, {$2, $3, $4} ], [$1];", "l,r,r,r,r"
236
- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ] : !llvm.ptr , !llvm.ptr <3 >, i32 , i32 , i32
237
231
// CHECK: llvm.inline_asm has_side_effects asm_dialect = att "@$5 cp.async.bulk.tensor.3d.global.shared::cta.bulk_group [$0, {$2, $3, $4} ], [$1];", "l,r,r,r,r,b"
238
- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >, i32 , i32 , i32 , i1
232
+ nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >
239
233
return
240
234
}
241
235
242
236
// CHECK-LABEL: @tma_store_4d
243
237
func.func @tma_store_4d (%tmaDescriptor: !llvm.ptr , %src : !llvm.ptr <3 >, %crd0: i32 , %crd1: i32 , %crd2: i32 , %crd3: i32 , %p : i1 ) {
244
- // CHECK: llvm.inline_asm has_side_effects asm_dialect = att "cp.async.bulk.tensor.4d.global.shared::cta.bulk_group [$0, {$2, $3, $4, $5} ], [$1];", "l,r,r,r,r,r"
245
- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ,%crd3 ] : !llvm.ptr , !llvm.ptr <3 >, i32 , i32 , i32 , i32
246
238
// CHECK: llvm.inline_asm has_side_effects asm_dialect = att "@$6 cp.async.bulk.tensor.4d.global.shared::cta.bulk_group [$0, {$2, $3, $4, $5} ], [$1];", "l,r,r,r,r,r,b"
247
- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ,%crd3 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >, i32 , i32 , i32 , i32 , i1
239
+ nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ,%crd3 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >
248
240
return
249
241
}
250
242
251
243
// CHECK-LABEL: @tma_store_5d
252
244
func.func @tma_store_5d (%tmaDescriptor: !llvm.ptr , %src : !llvm.ptr <3 >, %crd0: i32 , %crd1: i32 , %crd2: i32 , %crd3: i32 , %crd4: i32 , %p : i1 ) {
253
- // CHECK-NEXT: llvm.inline_asm has_side_effects asm_dialect = att "cp.async.bulk.tensor.5d.global.shared::cta.bulk_group [$0, {$2, $3, $4, $5, $6} ], [$1];", "l,r,r,r,r,r,r"
254
- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ,%crd3 ,%crd4 ] : !llvm.ptr , !llvm.ptr <3 >, i32 , i32 , i32 , i32 , i32
255
-
256
245
// CHECK-NEXT: llvm.inline_asm has_side_effects asm_dialect = att "@$7 cp.async.bulk.tensor.5d.global.shared::cta.bulk_group [$0, {$2, $3, $4, $5, $6} ], [$1];", "l,r,r,r,r,r,r,b"
257
- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ,%crd3 ,%crd4 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >, i32 , i32 , i32 , i32 , i32 , i1
246
+ nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ,%crd3 ,%crd4 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >
258
247
return
259
248
}
260
249
0 commit comments