|
| 1 | +!RUN: %flang_fc1 -emit-hlfir -ffast-math -fopenmp -fopenmp-version=60 %s -o - | FileCheck %s |
| 2 | + |
| 3 | +subroutine f00(x, y) |
| 4 | + implicit none |
| 5 | + real :: x, y |
| 6 | + |
| 7 | + !$omp atomic update |
| 8 | + x = ((x + 1) + y) + 2 |
| 9 | +end |
| 10 | + |
| 11 | +!CHECK-LABEL: func.func @_QPf00 |
| 12 | +!CHECK: %[[X:[0-9]+]]:2 = hlfir.declare %arg0 |
| 13 | +!CHECK: %[[Y:[0-9]+]]:2 = hlfir.declare %arg1 |
| 14 | +!CHECK: %cst = arith.constant 1.000000e+00 : f32 |
| 15 | +!CHECK: %[[LOAD_Y:[0-9]+]] = fir.load %[[Y]]#0 : !fir.ref<f32> |
| 16 | +!CHECK: %[[Y_1:[0-9]+]] = arith.addf %cst, %[[LOAD_Y]] fastmath<fast> : f32 |
| 17 | +!CHECK: %cst_0 = arith.constant 2.000000e+00 : f32 |
| 18 | +!CHECK: %[[Y_1_2:[0-9]+]] = arith.addf %[[Y_1]], %cst_0 fastmath<fast> : f32 |
| 19 | +!CHECK: omp.atomic.update memory_order(relaxed) %[[X]]#0 : !fir.ref<f32> { |
| 20 | +!CHECK: ^bb0(%[[ARG:arg[0-9]+]]: f32): |
| 21 | +!CHECK: %[[ARG_P:[0-9]+]] = arith.addf %[[ARG]], %[[Y_1_2]] fastmath<fast> : f32 |
| 22 | +!CHECK: omp.yield(%[[ARG_P]] : f32) |
| 23 | +!CHECK: } |
| 24 | + |
| 25 | + |
| 26 | +subroutine f01(x, y, z) |
| 27 | + implicit none |
| 28 | + complex :: x, y, z |
| 29 | + |
| 30 | + !$omp atomic update |
| 31 | + x = (x + y) + z |
| 32 | +end |
| 33 | + |
| 34 | +!CHECK-LABEL: func.func @_QPf01 |
| 35 | +!CHECK: %[[X:[0-9]+]]:2 = hlfir.declare %arg0 |
| 36 | +!CHECK: %[[Y:[0-9]+]]:2 = hlfir.declare %arg1 |
| 37 | +!CHECK: %[[Z:[0-9]+]]:2 = hlfir.declare %arg2 |
| 38 | +!CHECK: %[[LOAD_Y:[0-9]+]] = fir.load %[[Y]]#0 : !fir.ref<complex<f32>> |
| 39 | +!CHECK: %[[LOAD_Z:[0-9]+]] = fir.load %[[Z]]#0 : !fir.ref<complex<f32>> |
| 40 | +!CHECK: %[[Y_Z:[0-9]+]] = fir.addc %[[LOAD_Y]], %[[LOAD_Z]] {fastmath = #arith.fastmath<fast>} : complex<f32> |
| 41 | +!CHECK: omp.atomic.update memory_order(relaxed) %[[X]]#0 : !fir.ref<complex<f32>> { |
| 42 | +!CHECK: ^bb0(%[[ARG:arg[0-9]+]]: complex<f32>): |
| 43 | +!CHECK: %[[ARG_P:[0-9]+]] = fir.addc %[[ARG]], %[[Y_Z]] {fastmath = #arith.fastmath<fast>} : complex<f32> |
| 44 | +!CHECK: omp.yield(%[[ARG_P]] : complex<f32>) |
| 45 | +!CHECK: } |
| 46 | + |
| 47 | + |
| 48 | +subroutine f02(x, y) |
| 49 | + implicit none |
| 50 | + complex :: x |
| 51 | + real :: y |
| 52 | + |
| 53 | + !$omp atomic update |
| 54 | + x = (real(x) + y) + 1 |
| 55 | +end |
| 56 | + |
| 57 | +!CHECK-LABEL: func.func @_QPf02 |
| 58 | +!CHECK: %[[X:[0-9]+]]:2 = hlfir.declare %arg0 |
| 59 | +!CHECK: %[[Y:[0-9]+]]:2 = hlfir.declare %arg1 |
| 60 | +!CHECK: %[[LOAD_Y:[0-9]+]] = fir.load %[[Y]]#0 : !fir.ref<f32> |
| 61 | +!CHECK: %cst = arith.constant 1.000000e+00 : f32 |
| 62 | +!CHECK: %[[Y_1:[0-9]+]] = arith.addf %[[LOAD_Y]], %cst fastmath<fast> : f32 |
| 63 | +!CHECK: omp.atomic.update memory_order(relaxed) %[[X]]#0 : !fir.ref<complex<f32>> { |
| 64 | +!CHECK: ^bb0(%[[ARG:arg[0-9]+]]: complex<f32>): |
| 65 | +!CHECK: %[[ARG_X:[0-9]+]] = fir.extract_value %[[ARG]], [0 : index] : (complex<f32>) -> f32 |
| 66 | +!CHECK: %[[ARG_P:[0-9]+]] = arith.addf %[[ARG_X]], %[[Y_1]] fastmath<fast> : f32 |
| 67 | +!CHECK: %cst_0 = arith.constant 0.000000e+00 : f32 |
| 68 | +!CHECK: %[[CPLX:[0-9]+]] = fir.undefined complex<f32> |
| 69 | +!CHECK: %[[CPLX_I:[0-9]+]] = fir.insert_value %[[CPLX]], %[[ARG_P]], [0 : index] : (complex<f32>, f32) -> complex<f32> |
| 70 | +!CHECK: %[[CPLX_R:[0-9]+]] = fir.insert_value %[[CPLX_I]], %cst_0, [1 : index] : (complex<f32>, f32) -> complex<f32> |
| 71 | +!CHECK: omp.yield(%[[CPLX_R]] : complex<f32>) |
| 72 | +!CHECK: } |
| 73 | + |
| 74 | + |
| 75 | +subroutine f03(x, a, b, c) |
| 76 | + implicit none |
| 77 | + real(kind=4) :: x |
| 78 | + real(kind=8) :: a, b, c |
| 79 | + |
| 80 | + !$omp atomic update |
| 81 | + x = ((b + a) + x) + c |
| 82 | +end |
| 83 | + |
| 84 | +!CHECK-LABEL: func.func @_QPf03 |
| 85 | +!CHECK: %[[A:[0-9]+]]:2 = hlfir.declare %arg1 |
| 86 | +!CHECK: %[[B:[0-9]+]]:2 = hlfir.declare %arg2 |
| 87 | +!CHECK: %[[C:[0-9]+]]:2 = hlfir.declare %arg3 |
| 88 | +!CHECK: %[[X:[0-9]+]]:2 = hlfir.declare %arg0 |
| 89 | +!CHECK: %[[LOAD_B:[0-9]+]] = fir.load %[[B]]#0 : !fir.ref<f64> |
| 90 | +!CHECK: %[[LOAD_A:[0-9]+]] = fir.load %[[A]]#0 : !fir.ref<f64> |
| 91 | +!CHECK: %[[A_B:[0-9]+]] = arith.addf %[[LOAD_B]], %[[LOAD_A]] fastmath<fast> : f64 |
| 92 | +!CHECK: %[[LOAD_C:[0-9]+]] = fir.load %[[C]]#0 : !fir.ref<f64> |
| 93 | +!CHECK: %[[A_B_C:[0-9]+]] = arith.addf %[[A_B]], %[[LOAD_C]] fastmath<fast> : f64 |
| 94 | +!CHECK: omp.atomic.update memory_order(relaxed) %[[X]]#0 : !fir.ref<f32> { |
| 95 | +!CHECK: ^bb0(%[[ARG:arg[0-9]+]]: f32): |
| 96 | +!CHECK: %[[ARG_8:[0-9]+]] = fir.convert %[[ARG]] : (f32) -> f64 |
| 97 | +!CHECK: %[[ARG_P:[0-9]+]] = arith.addf %[[ARG_8]], %[[A_B_C]] fastmath<fast> : f64 |
| 98 | +!CHECK: %[[ARG_4:[0-9]+]] = fir.convert %[[ARG_P]] : (f64) -> f32 |
| 99 | +!CHECK: omp.yield(%[[ARG_4]] : f32) |
| 100 | +!CHECK: } |
0 commit comments