@@ -308,6 +308,7 @@ func.func @_QPtest_type() {
308308// CHECK-LABEL: func.func @_QPtest_type()
309309// CHECK: fir.call @_FortranACUFDataTransferPtrPtr(%{{.*}}, %{{.*}}, %c12{{.*}}, %c0{{.*}}, %{{.*}}, %{{.*}}) : (!fir.llvm_ptr<i8>, !fir.llvm_ptr<i8>, i64, i32, !fir.ref<i8>, i32) -> none
310310
311+
311312func.func @_QPtest_array_type() {
312313 %c10 = arith.constant 10 : index
313314 %0 = cuf.alloc !fir.array<10x!fir.type<_QMbarTcmplx{id:i32,c:complex<f32>}>> {bindc_name = "a", data_attr = #cuf.cuda<device>, uniq_name = "_QFtest_array_typeEa"} -> !fir.ref<!fir.array<10x!fir.type<_QMbarTcmplx{id:i32,c:complex<f32>}>>>
@@ -326,5 +327,41 @@ func.func @_QPtest_array_type() {
326327// CHECK: fir.call @_FortranACUFMemAlloc(%[[CONV_BYTES]], %c0{{.*}}, %{{.*}}, %{{.*}}) : (i64, i32, !fir.ref<i8>, i32) -> !fir.llvm_ptr<i8>
327328// CHECK: %[[BYTES:.*]] = arith.muli %c10{{.*}}, %c12{{.*}} : i64
328329// CHECK: fir.call @_FortranACUFDataTransferPtrPtr(%{{.*}}, %{{.*}}, %[[BYTES]], %c0{{.*}}, %{{.*}}, %{{.*}}) : (!fir.llvm_ptr<i8>, !fir.llvm_ptr<i8>, i64, i32, !fir.ref<i8>, i32) -> none
330+ // Scalar i32 host_device transfer into a device array declared with a fir.shape_shift; the CHECK below expects the DescDescNoRealloc runtime entry point.
331+ func.func @_QPshape_shift() {
332+ %c0_i32 = arith.constant 0 : i32
333+ %c11 = arith.constant 11 : index
334+ %c10 = arith.constant 10 : index
335+ %0 = cuf.alloc !fir.array<10xi32> {bindc_name = "cdev", data_attr = #cuf.cuda<device>, uniq_name = "_QFshape_shiftEcdev"} -> !fir.ref<!fir.array<10xi32>>
336+ %1 = fir.shape_shift %c11, %c10 : (index, index) -> !fir.shapeshift<1>
337+ %2:2 = hlfir.declare %0(%1) {data_attr = #cuf.cuda<device>, uniq_name = "_QFshape_shiftEcdev"} : (!fir.ref<!fir.array<10xi32>>, !fir.shapeshift<1>) -> (!fir.box<!fir.array<10xi32>>, !fir.ref<!fir.array<10xi32>>)
338+ cuf.data_transfer %c0_i32 to %2#1, %1 : !fir.shapeshift<1> {transfer_kind = #cuf.cuda_transfer<host_device>} : i32, !fir.ref<!fir.array<10xi32>>
339+ cuf.free %2#1 : !fir.ref<!fir.array<10xi32>> {data_attr = #cuf.cuda<device>}
340+ return
341+ }
342+
343+ // CHECK-LABEL: func.func @_QPshape_shift()
344+ // CHECK: fir.call @_FortranACUFDataTransferDescDescNoRealloc
345+ // Host array to device array host_device transfer where only the device side carries a fir.shape_shift; the CHECKs below expect a PtrPtr call whose byte count is the converted %c10 multiplied by %c4.
346+ func.func @_QPshape_shift2() {
347+ %c11 = arith.constant 11 : index
348+ %c10 = arith.constant 10 : index
349+ %0 = fir.alloca !fir.array<10xi32> {bindc_name = "ahost", uniq_name = "_QFshape_shift2Eahost"}
350+ %1 = fir.shape %c10 : (index) -> !fir.shape<1>
351+ %2:2 = hlfir.declare %0(%1) {uniq_name = "_QFshape_shift2Eahost"} : (!fir.ref<!fir.array<10xi32>>, !fir.shape<1>) -> (!fir.ref<!fir.array<10xi32>>, !fir.ref<!fir.array<10xi32>>)
352+ %3 = cuf.alloc !fir.array<10xi32> {bindc_name = "cdev", data_attr = #cuf.cuda<device>, uniq_name = "_QFshape_shift2Ecdev"} -> !fir.ref<!fir.array<10xi32>>
353+ %4 = fir.shape_shift %c11, %c10 : (index, index) -> !fir.shapeshift<1>
354+ %5:2 = hlfir.declare %3(%4) {data_attr = #cuf.cuda<device>, uniq_name = "_QFshape_shift2Ecdev"} : (!fir.ref<!fir.array<10xi32>>, !fir.shapeshift<1>) -> (!fir.box<!fir.array<10xi32>>, !fir.ref<!fir.array<10xi32>>)
355+ cuf.data_transfer %2#0 to %5#1, %4 : !fir.shapeshift<1> {transfer_kind = #cuf.cuda_transfer<host_device>} : !fir.ref<!fir.array<10xi32>>, !fir.ref<!fir.array<10xi32>>
356+ cuf.free %5#1 : !fir.ref<!fir.array<10xi32>> {data_attr = #cuf.cuda<device>}
357+ return
358+ }
359+
360+ // CHECK-LABEL: func.func @_QPshape_shift2()
361+ // CHECK: %[[C10:.*]] = fir.convert %c10{{.*}} : (index) -> i64
362+ // CHECK: %[[BYTES:.*]] = arith.muli %[[C10]], %c4{{.*}} : i64
363+ // CHECK: fir.call @_FortranACUFDataTransferPtrPtr(%{{.*}}, %{{.*}}, %[[BYTES]], %{{.*}}, %{{.*}}, %{{.*}}) : (!fir.llvm_ptr<i8>, !fir.llvm_ptr<i8>, i64, i32, !fir.ref<i8>, i32) -> none
364+
365+
329366
330367} // end of module
0 commit comments