Index: flang/lib/Lower/OpenMP.cpp
===================================================================
--- flang/lib/Lower/OpenMP.cpp
+++ flang/lib/Lower/OpenMP.cpp
@@ -120,6 +120,30 @@
   }
 }
 
+/// Compute the integer type used for OpenMP loop iteration variables.
+///
+/// \param [in] converter - provides the warning location and the FIR builder.
+/// \param [in] loopVarTypeSize - size of the loop variable in bytes.
+/// \return a 32-bit or 64-bit integer type: sizes below 32 bits are widened to
+///         32 bits and sizes above 64 bits are narrowed to 64 bits.
+static mlir::Type getLoopVarType(Fortran::lower::AbstractConverter &converter,
+                                 std::size_t loopVarTypeSize) {
+  // OpenMP runtime requires 32-bit or 64-bit loop variables.
+  loopVarTypeSize = loopVarTypeSize * 8;
+  if (loopVarTypeSize < 32) {
+    loopVarTypeSize = 32;
+  } else if (loopVarTypeSize > 64) {
+    loopVarTypeSize = 64;
+    mlir::emitWarning(converter.getCurrentLocation(),
+                      "OpenMP loop iteration variable cannot have more than 64 "
+                      "bits size and will be narrowed into 64 bits.");
+  }
+  assert((loopVarTypeSize == 32 || loopVarTypeSize == 64) &&
+         "OpenMP loop iteration variable size must be transformed into 32-bit "
+         "or 64-bit");
+  return converter.getFirOpBuilder().getIntegerType(loopVarTypeSize);
+}
+
 /// Create the body (block) for an OpenMP Operation.
 ///
 /// \param [in] op - the operation the body belongs to.
@@ -143,15 +167,19 @@
   // e.g. For loops the arguments are the induction variable. And all further
   // uses of the induction variable should use this mlir value.
   if (args.size()) {
+    std::size_t loopVarTypeSize = 0;
+    for (const Fortran::semantics::Symbol *arg : args)
+      loopVarTypeSize = std::max(loopVarTypeSize, arg->GetUltimate().size());
+    mlir::Type loopVarType = getLoopVarType(converter, loopVarTypeSize);
     SmallVector<Type> tiv;
     SmallVector<Location> locs;
-    int argIndex = 0;
-    for (auto &arg : args) {
-      tiv.push_back(converter.genType(*arg));
+    for (std::size_t i = 0; i < args.size(); ++i) {
+      tiv.push_back(loopVarType);
       locs.push_back(loc);
     }
     firOpBuilder.createBlock(&op.getRegion(), {}, tiv, locs);
-    for (auto &arg : args) {
+    int argIndex = 0;
+    for (const Fortran::semantics::Symbol *arg : args) {
       fir::ExtendedValue exval = op.getRegion().front().getArgument(argIndex);
       converter.bindSymbol(*arg, exval);
       argIndex++;
@@ -426,11 +454,12 @@
     TODO(converter.getCurrentLocation(), "Combined worksharing loop construct");
   }
 
-  int64_t collapseValue = Fortran::lower::getCollapseValue(wsLoopOpClauseList);
-
   // Collect the loops to collapse.
   auto *doConstructEval = &eval.getFirstNestedEvaluation();
 
+  std::int64_t collapseValue =
+      Fortran::lower::getCollapseValue(wsLoopOpClauseList);
+  std::size_t loopVarTypeSize = 0;
   SmallVector<const Fortran::semantics::Symbol *> iv;
   do {
     auto *doLoop = &doConstructEval->getFirstNestedEvaluation();
@@ -454,6 +483,8 @@
             currentLocation, firOpBuilder.getIntegerType(32), 1));
       }
       iv.push_back(bounds->name.thing.symbol);
+      loopVarTypeSize = std::max(
+          loopVarTypeSize, bounds->name.thing.symbol->GetUltimate().size());
     }
 
     collapseValue--;
@@ -461,6 +492,18 @@
         &*std::next(doConstructEval->getNestedEvaluations().begin());
   } while (collapseValue > 0);
 
+  // The types of lower bound, upper bound, and step are converted into the
+  // type of the loop variable if necessary.
+  mlir::Type loopVarType = getLoopVarType(converter, loopVarTypeSize);
+  for (std::size_t it = 0; it < lowerBound.size(); ++it) {
+    lowerBound[it] = firOpBuilder.createConvert(currentLocation, loopVarType,
+                                                lowerBound[it]);
+    upperBound[it] = firOpBuilder.createConvert(currentLocation, loopVarType,
+                                                upperBound[it]);
+    step[it] =
+        firOpBuilder.createConvert(currentLocation, loopVarType, step[it]);
+  }
+
   // FIXME: Add support for following clauses:
   // 1. linear
   // 2. order
Index: flang/test/Lower/OpenMP/omp-wsloop-variable.f90
===================================================================
--- /dev/null
+++ flang/test/Lower/OpenMP/omp-wsloop-variable.f90
@@ -0,0 +1,67 @@
+! This test checks lowering of OpenMP DO Directive(Worksharing) for different
+! types of loop iteration variable, lower bound, upper bound, and step.
+
+!REQUIRES: shell
+!RUN: bbc -fopenmp -emit-fir %s -o - 2>&1 | FileCheck %s
+
+program wsloop_variable
+  integer(kind=1) :: i1_lb, i1_ub
+  integer(kind=2) :: i2, i2_ub, i2_s
+  integer(kind=4) :: i4_s
+  integer(kind=8) :: i8, i8_s
+  integer(kind=16) :: i16, i16_lb
+  real :: x
+
+!CHECK: OpenMP loop iteration variable cannot have more than 64 bits size and will be narrowed into 64 bits.
+
+!CHECK: [[TMP0:%.*]] = arith.constant 1 : i32
+!CHECK: [[TMP1:%.*]] = arith.constant 100 : i32
+!CHECK: [[TMP2:%.*]] = fir.convert [[TMP0]] : (i32) -> i64
+!CHECK: [[TMP3:%.*]] = fir.convert %{{.*}} : (i8) -> i64
+!CHECK: [[TMP4:%.*]] = fir.convert %{{.*}} : (i16) -> i64
+!CHECK: [[TMP5:%.*]] = fir.convert %{{.*}} : (i128) -> i64
+!CHECK: [[TMP6:%.*]] = fir.convert [[TMP1]] : (i32) -> i64
+!CHECK: [[TMP7:%.*]] = fir.convert %{{.*}} : (i32) -> i64
+!CHECK: omp.wsloop collapse(2) for ([[TMP8:%.*]], [[TMP9:%.*]]) : i64 = ([[TMP2]], [[TMP5]]) to ([[TMP3]], [[TMP6]]) inclusive step ([[TMP4]], [[TMP7]]) {
+!CHECK: [[TMP10:%.*]] = arith.addi [[TMP8]], [[TMP9]] : i64
+!CHECK: [[TMP11:%.*]] = fir.convert [[TMP10]] : (i64) -> f32
+!CHECK: fir.store [[TMP11]] to %{{.*}} : !fir.ref<f32>
+!CHECK: omp.yield
+!CHECK: }
+  !$omp do collapse(2)
+  do i2 = 1, i1_ub, i2_s
+    do i8 = i16_lb, 100, i4_s
+      x = i2 + i8
+    end do
+  end do
+  !$omp end do
+
+!CHECK: [[TMP12:%.*]] = arith.constant 1 : i32
+!CHECK: [[TMP13:%.*]] = fir.convert %{{.*}} : (i8) -> i32
+!CHECK: [[TMP14:%.*]] = fir.convert %{{.*}} : (i64) -> i32
+!CHECK: omp.wsloop for ([[TMP15:%.*]]) : i32 = ([[TMP12]]) to ([[TMP13]]) inclusive step ([[TMP14]]) {
+!CHECK: [[TMP16:%.*]] = fir.convert [[TMP15]] : (i32) -> f32
+!CHECK: fir.store [[TMP16]] to %{{.*}} : !fir.ref<f32>
+!CHECK: omp.yield
+!CHECK: }
+  !$omp do
+  do i2 = 1, i1_ub, i8_s
+    x = i2
+  end do
+  !$omp end do
+
+!CHECK: [[TMP17:%.*]] = fir.convert %{{.*}} : (i8) -> i64
+!CHECK: [[TMP18:%.*]] = fir.convert %{{.*}} : (i16) -> i64
+!CHECK: [[TMP19:%.*]] = fir.convert %{{.*}} : (i32) -> i64
+!CHECK: omp.wsloop for ([[TMP20:%.*]]) : i64 = ([[TMP17]]) to ([[TMP18]]) inclusive step ([[TMP19]]) {
+!CHECK: [[TMP21:%.*]] = fir.convert [[TMP20]] : (i64) -> f32
+!CHECK: fir.store [[TMP21]] to %{{.*}} : !fir.ref<f32>
+!CHECK: omp.yield
+!CHECK: }
+  !$omp do
+  do i16 = i1_lb, i2_ub, i4_s
+    x = i16
+  end do
+  !$omp end do
+
+end program wsloop_variable