| ! RUN: bbc -emit-fir -hlfir=false -fopenmp --force-byref-reduction -o - %s 2>&1 | FileCheck %s |
| ! RUN: %flang_fc1 -emit-fir -flang-deprecated-no-hlfir -fopenmp -mmlir --force-byref-reduction -o - %s 2>&1 | FileCheck %s |
| |
| !CHECK: omp.declare_reduction @max_byref_f32 : !fir.ref<f32> |
| !CHECK-SAME: init { |
| !CHECK: %[[MINIMUM_VAL:.*]] = arith.constant -3.40282347E+38 : f32 |
| !CHECK: %[[REF:.*]] = fir.alloca f32 |
| !CHECK: fir.store %[[MINIMUM_VAL]] to %[[REF]] : !fir.ref<f32> |
| !CHECK: omp.yield(%[[REF]] : !fir.ref<f32>) |
| !CHECK: combiner |
| !CHECK: ^bb0(%[[ARG0:.*]]: !fir.ref<f32>, %[[ARG1:.*]]: !fir.ref<f32>): |
| !CHECK: %[[LD0:.*]] = fir.load %[[ARG0]] : !fir.ref<f32> |
| !CHECK: %[[LD1:.*]] = fir.load %[[ARG1]] : !fir.ref<f32> |
| !CHECK: %[[RES:.*]] = arith.maxnumf %[[LD0]], %[[LD1]] {{.*}}: f32 |
| !CHECK: fir.store %[[RES]] to %[[ARG0]] : !fir.ref<f32> |
| !CHECK: omp.yield(%[[ARG0]] : !fir.ref<f32>) |
| |
| !CHECK-LABEL: omp.declare_reduction @max_byref_i32 : !fir.ref<i32> |
| !CHECK-SAME: init { |
| !CHECK: %[[MINIMUM_VAL:.*]] = arith.constant -2147483648 : i32 |
| !CHECK: fir.store %[[MINIMUM_VAL]] to %[[REF]] : !fir.ref<i32> |
| !CHECK: omp.yield(%[[REF]] : !fir.ref<i32>) |
| !CHECK: combiner |
| !CHECK: ^bb0(%[[ARG0:.*]]: !fir.ref<i32>, %[[ARG1:.*]]: !fir.ref<i32>): |
| !CHECK: %[[LD0:.*]] = fir.load %[[ARG0]] : !fir.ref<i32> |
| !CHECK: %[[LD1:.*]] = fir.load %[[ARG1]] : !fir.ref<i32> |
| !CHECK: %[[RES:.*]] = arith.maxsi %[[LD0]], %[[LD1]] : i32 |
| !CHECK: fir.store %[[RES]] to %[[ARG0]] : !fir.ref<i32> |
| !CHECK: omp.yield(%[[ARG0]] : !fir.ref<i32>) |
| |
| !CHECK-LABEL: @_QPreduction_max_int |
| !CHECK-SAME: %[[Y_BOX:.*]]: !fir.box<!fir.array<?xi32>> |
| !CHECK: %[[X_REF:.*]] = fir.alloca i32 {bindc_name = "x", uniq_name = "_QFreduction_max_intEx"} |
| !CHECK: omp.parallel |
| !CHECK: omp.wsloop byref reduction(@max_byref_i32 %[[X_REF]] -> %[[PRV:.+]] : !fir.ref<i32>) for |
| !CHECK: %[[LPRV:.+]] = fir.load %[[PRV]] : !fir.ref<i32> |
| !CHECK: %[[Y_I_REF:.*]] = fir.coordinate_of %[[Y_BOX]] |
| !CHECK: %[[Y_I:.*]] = fir.load %[[Y_I_REF]] : !fir.ref<i32> |
| !CHECK: %[[RES:.+]] = arith.cmpi sgt, %[[LPRV]], %[[Y_I]] : i32 |
| !CHECK: %[[SEL:.+]] = arith.select %[[RES]], %[[LPRV]], %[[Y_I]] |
| !CHECK: fir.store %[[SEL]] to %[[PRV]] : !fir.ref<i32> |
| !CHECK: omp.terminator |
| |
| !CHECK-LABEL: @_QPreduction_max_real |
| !CHECK-SAME: %[[Y_BOX:.*]]: !fir.box<!fir.array<?xf32>> |
| !CHECK: %[[X_REF:.*]] = fir.alloca f32 {bindc_name = "x", uniq_name = "_QFreduction_max_realEx"} |
| !CHECK: omp.parallel |
| !CHECK: omp.wsloop byref reduction(@max_byref_f32 %[[X_REF]] -> %[[PRV:.+]] : !fir.ref<f32>) for |
| !CHECK: %[[LPRV:.+]] = fir.load %[[PRV]] : !fir.ref<f32> |
| !CHECK: %[[Y_I_REF:.*]] = fir.coordinate_of %[[Y_BOX]] |
| !CHECK: %[[Y_I:.*]] = fir.load %[[Y_I_REF]] : !fir.ref<f32> |
| !CHECK: %[[RES:.+]] = arith.cmpf ogt, %[[Y_I]], %[[LPRV]] {{.*}} : f32 |
| !CHECK: omp.yield |
| !CHECK: omp.terminator |
| |
| subroutine reduction_max_int(y) |
| integer :: x, y(:) |
| x = 0 |
| !$omp parallel |
| !$omp do reduction(max:x) |
| do i=1, 100 |
| x = max(x, y(i)) |
| end do |
| !$omp end do |
| !$omp end parallel |
| print *, x |
| end subroutine |
| |
| subroutine reduction_max_real(y) |
| real :: x, y(:) |
| x = 0.0 |
| !$omp parallel |
| !$omp do reduction(max:x) |
| do i=1, 100 |
| x = max(y(i), x) |
| end do |
| !$omp end do |
| !$omp end parallel |
| print *, x |
| |
| !$omp parallel |
| !$omp do reduction(max:x) |
| do i=1, 100 |
| !CHECK-NOT: omp.reduction |
| if (y(i) .gt. x) x = y(i) |
| end do |
| !$omp end do |
| !$omp end parallel |
| print *, x |
| end subroutine |