Upstreams further parts of the `do concurrent` to OpenMP conversion pass from AMD's fork. This PR extends the pass by adding support for mapping `do concurrent` loops to the device.

PR stack:
- https://github.com/llvm/llvm-project/pull/155754
- https://github.com/llvm/llvm-project/pull/155987 ◀️
- https://github.com/llvm/llvm-project/pull/155992
- https://github.com/llvm/llvm-project/pull/155993
- https://github.com/llvm/llvm-project/pull/157638
- https://github.com/llvm/llvm-project/pull/156610
- https://github.com/llvm/llvm-project/pull/156837
84 lines
3.6 KiB
Fortran
84 lines
3.6 KiB
Fortran
! Tests mapping of a basic `do concurrent` loop to
|
|
! `!$omp target teams distribute parallel do`.
|
|
|
|
! RUN: %flang_fc1 -emit-hlfir -fopenmp -fdo-concurrent-to-openmp=device %s -o - \
|
|
! RUN: | FileCheck %s
|
|
! RUN: bbc -emit-hlfir -fopenmp -fdo-concurrent-to-openmp=device %s -o - \
|
|
! RUN: | FileCheck %s
|
|
|
|
! Minimal program containing a single `do concurrent` loop that stores each
! index value into the matching element of `a`. The FileCheck directives
! embedded below describe the IR expected from the lit run lines at the top of
! this file, which pass `-fdo-concurrent-to-openmp=device`.
program do_concurrent_basic
|
|
implicit none
|
|
integer :: a(10)
|
|
integer :: i
|
|
|
|
! Expected first: the host-side alloca and declare for the loop variable `i`.
! CHECK: %[[I_ORIG_ALLOC:.*]] = fir.alloca i32 {bindc_name = "i"}
|
|
! CHECK: %[[I_ORIG_DECL:.*]]:2 = hlfir.declare %[[I_ORIG_ALLOC]]
|
|
|
|
! Then the host-side address, shape and declare for the array `a`; the shape
! operand is captured as A_EXTENT and reused by the map-bounds directives.
! CHECK: %[[A_ADDR:.*]] = fir.address_of(@_QFEa)
|
|
! CHECK: %[[A_SHAPE:.*]] = fir.shape %[[A_EXTENT:.*]] : (index) -> !fir.shape<1>
|
|
! CHECK: %[[A_ORIG_DECL:.*]]:2 = hlfir.declare %[[A_ADDR]](%[[A_SHAPE]])
|
|
|
|
! No `fir.do_loop` may appear between the declarations and the bounds below.
! CHECK-NOT: fir.do_loop
|
|
|
|
! Loop bounds 1 and 10 are expected as i32 constants converted to `index`,
! followed by a step of 1 that is already an `index` constant.
! CHECK: %[[C1:.*]] = arith.constant 1 : i32
|
|
! CHECK: %[[HOST_LB:.*]] = fir.convert %[[C1]] : (i32) -> index
|
|
! CHECK: %[[C10:.*]] = arith.constant 10 : i32
|
|
! CHECK: %[[HOST_UB:.*]] = fir.convert %[[C10]] : (i32) -> index
|
|
! CHECK: %[[HOST_STEP:.*]] = arith.constant 1 : index
|
|
|
|
! Map info for `i`, then the pieces of the bounds for `a`: lower bound 0 and
! upper bound computed as the extent minus a value whose name starts with `c1`.
! CHECK: %[[I_MAP_INFO:.*]] = omp.map.info var_ptr(%[[I_ORIG_DECL]]#1
|
|
! CHECK: %[[C0:.*]] = arith.constant 0 : index
|
|
! CHECK: %[[UPPER_BOUND:.*]] = arith.subi %[[A_EXTENT]], %{{c1.*}} : index
|
|
|
|
! CHECK: %[[A_BOUNDS:.*]] = omp.map.bounds lower_bound(%[[C0]] : index)
|
|
! CHECK-SAME: upper_bound(%[[UPPER_BOUND]] : index)
|
|
! CHECK-SAME: extent(%[[A_EXTENT]] : index)
|
|
|
|
! `a` is expected to be mapped implicitly as tofrom, by reference, using the
! bounds matched above.
! CHECK: %[[A_MAP_INFO:.*]] = omp.map.info var_ptr(%[[A_ORIG_DECL]]#1 : {{[^(]+}})
|
|
! CHECK-SAME: map_clauses(implicit, tofrom) capture(ByRef) bounds(%[[A_BOUNDS]])
|
|
|
|
! The target op: the host bounds and step are passed through `host_eval` and
! captured as LB, UB and STEP for use by the loop nest further down.
! CHECK: omp.target
|
|
! CHECK-SAME: host_eval(%[[HOST_LB]] -> %[[LB:[[:alnum:]]+]], %[[HOST_UB]] -> %[[UB:[[:alnum:]]+]], %[[HOST_STEP]] -> %[[STEP:[[:alnum:]]+]] : index, index, index)
|
|
! CHECK-SAME: map_entries(
|
|
! The first three map entries are matched with wildcards only; presumably they
! correspond to the loop bounds and step - TODO confirm against the pass.
! CHECK-SAME: %{{[[:alnum:]]+}} -> %{{[^,]+}},
|
|
! CHECK-SAME: %{{[[:alnum:]]+}} -> %{{[^,]+}},
|
|
! CHECK-SAME: %{{[[:alnum:]]+}} -> %{{[^,]+}},
|
|
! CHECK-SAME: %[[I_MAP_INFO]] -> %[[I_ARG:[[:alnum:]]+]],
|
|
! NOTE(review): the A_ARG capture below begins with a `.` whereas the I_ARG
! capture above does not; this looks unintentional and is presumably harmless
! for block-argument names - confirm before changing.
! CHECK-SAME: %[[A_MAP_INFO]] -> %[[A_ARG:.[[:alnum:]]+]]
|
|
|
|
! Inside the target region `a` is re-declared from its mapped block argument;
! the loop body below indexes through this device-side declaration.
! CHECK: %[[A_DEV_DECL:.*]]:2 = hlfir.declare %[[A_ARG]]
|
|
! CHECK: omp.teams {
|
|
! CHECK-NEXT: omp.parallel {
|
|
|
|
! A fresh alloca and declare for `i` are expected directly inside the parallel
! region; the loop body stores to and loads from this binding.
! CHECK-NEXT: %[[ITER_VAR:.*]] = fir.alloca i32 {bindc_name = "i"}
|
|
! CHECK-NEXT: %[[BINDING:.*]]:2 = hlfir.declare %[[ITER_VAR]] {uniq_name = "_QFEi"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
|
|
|
|
! CHECK-NEXT: omp.distribute {
|
|
! CHECK-NEXT: omp.wsloop {
|
|
|
|
! The loop nest iterates inclusively from LB to UB with STEP. Its body converts
! the induction value to i32, stores it into `i`, loads `i` twice (once as the
! value to assign, once as the subscript) and assigns into the designated
! element of the device-side `a`.
! CHECK-NEXT: omp.loop_nest (%[[ARG0:.*]]) : index = (%[[LB]]) to (%[[UB]]) inclusive step (%[[STEP]]) {
|
|
! CHECK-NEXT: %[[IV_IDX:.*]] = fir.convert %[[ARG0]] : (index) -> i32
|
|
! CHECK-NEXT: fir.store %[[IV_IDX]] to %[[BINDING]]#0 : !fir.ref<i32>
|
|
! CHECK-NEXT: %[[IV_VAL1:.*]] = fir.load %[[BINDING]]#0 : !fir.ref<i32>
|
|
! CHECK-NEXT: %[[IV_VAL2:.*]] = fir.load %[[BINDING]]#0 : !fir.ref<i32>
|
|
! CHECK-NEXT: %[[IV_VAL_I64:.*]] = fir.convert %[[IV_VAL2]] : (i32) -> i64
|
|
! CHECK-NEXT: %[[ARR_ACCESS:.*]] = hlfir.designate %[[A_DEV_DECL]]#0 (%[[IV_VAL_I64]]) : (!fir.ref<!fir.array<10xi32>>, i64) -> !fir.ref<i32>
|
|
! CHECK-NEXT: hlfir.assign %[[IV_VAL1]] to %[[ARR_ACCESS]] : i32, !fir.ref<i32>
|
|
! CHECK-NEXT: omp.yield
|
|
! CHECK-NEXT: }
|
|
|
|
! Closing of the nested regions, innermost first; three of the closing lines
! are expected to carry the `omp.composite` attribute.
! CHECK-NEXT: } {omp.composite}
|
|
! CHECK-NEXT: } {omp.composite}
|
|
! CHECK-NEXT: omp.terminator
|
|
! CHECK-NEXT: } {omp.composite}
|
|
! CHECK-NEXT: omp.terminator
|
|
! CHECK-NEXT: }
|
|
! CHECK-NEXT: omp.terminator
|
|
! CHECK-NEXT: }
|
|
! The loop under test: each iteration writes its own index into `a(i)`.
do concurrent (i=1:10)
|
|
a(i) = i
|
|
end do
|
|
|
|
! No `fir.do_loop` may appear after the converted loop either.
! CHECK-NOT: fir.do_loop
|
|
end program do_concurrent_basic
|