Index: flang/include/flang/Optimizer/Builder/Runtime/Reduction.h =================================================================== --- flang/include/flang/Optimizer/Builder/Runtime/Reduction.h +++ flang/include/flang/Optimizer/Builder/Runtime/Reduction.h @@ -148,6 +148,16 @@ mlir::Value resultBox, mlir::Value arrayBox, mlir::Value dim, mlir::Value maskBox); +/// Generate call to `Norm2` intrinsic runtime routine. This is the version +/// that does not take a dim argument. +mlir::Value genNorm2(fir::FirOpBuilder &builder, mlir::Location loc, + mlir::Value arrayBox); + +/// Generate call to `Norm2Dim` intrinsic runtime routine. This is the version +/// that takes a dim argument. +void genNorm2Dim(fir::FirOpBuilder &builder, mlir::Location loc, + mlir::Value resultBox, mlir::Value arrayBox, mlir::Value dim); + /// Generate call to `Parity` runtime routine. This version of `parity` is /// specialized for rank 1 mask arguments. /// This calls the version that returns a scalar logical value. Index: flang/lib/Lower/IntrinsicCall.cpp =================================================================== --- flang/lib/Lower/IntrinsicCall.cpp +++ flang/lib/Lower/IntrinsicCall.cpp @@ -546,6 +546,7 @@ void genMvbits(llvm::ArrayRef); mlir::Value genNearest(mlir::Type, llvm::ArrayRef); mlir::Value genNint(mlir::Type, llvm::ArrayRef); + fir::ExtendedValue genNorm2(mlir::Type, llvm::ArrayRef); mlir::Value genNot(mlir::Type, llvm::ArrayRef); fir::ExtendedValue genNull(mlir::Type, llvm::ArrayRef); fir::ExtendedValue genPack(mlir::Type, llvm::ArrayRef); @@ -940,6 +941,10 @@ {"topos", asValue}}}}, {"nearest", &I::genNearest}, {"nint", &I::genNint}, + {"norm2", + &I::genNorm2, + {{{"array", asBox}, {"dim", asValue}}}, + /*isElemental=*/false}, {"not", &I::genNot}, {"null", &I::genNull, {{{"mold", asInquired}}}, /*isElemental=*/false}, {"pack", @@ -4100,6 +4105,50 @@ return genRuntimeCall("nint", resultType, {args[0]}); } +// NORM2 +fir::ExtendedValue +IntrinsicLibrary::genNorm2(mlir::Type resultType, + llvm::ArrayRef args) { + assert(args.size() == 2); + + // Handle required array argument + mlir::Value array = builder.createBox(loc, args[0]); + unsigned rank = fir::BoxValue(array).rank(); + assert(rank >= 1); + + // Check if the dim argument is present + bool absentDim = isStaticallyAbsent(args[1]); + + // If dim argument is absent or the array is rank 1, then the result is + // a scalar (since the the result is rank-1 or 0). Otherwise, the result is + // an array. + if (absentDim || rank == 1) { + return fir::runtime::genNorm2(builder, loc, array); + } else { + // Create mutable fir.box to be passed to the runtime for the result. + mlir::Type resultArrayType = builder.getVarLenSeqTy(resultType, rank - 1); + fir::MutableBoxValue resultMutableBox = + fir::factory::createTempMutableBox(builder, loc, resultArrayType); + mlir::Value resultIrBox = + fir::factory::getMutableIRBox(builder, loc, resultMutableBox); + + mlir::Value dim = fir::getBase(args[1]); + fir::runtime::genNorm2Dim(builder, loc, resultIrBox, array, dim); + + // Handle cleanup of allocatable result descriptor and return + fir::ExtendedValue res = + fir::factory::genMutableBoxRead(builder, loc, resultMutableBox); + return res.match( + [&](const fir::ArrayBoxValue &box) -> fir::ExtendedValue { + addCleanUpForTemp(loc, box.getAddr()); + return box; + }, + [&](const auto &) -> fir::ExtendedValue { + fir::emitFatalError(loc, "unexpected result for Norm2"); + }); + } +} + // NOT mlir::Value IntrinsicLibrary::genNot(mlir::Type resultType, llvm::ArrayRef args) { Index: flang/lib/Optimizer/Builder/Runtime/Reduction.cpp =================================================================== --- flang/lib/Optimizer/Builder/Runtime/Reduction.cpp +++ flang/lib/Optimizer/Builder/Runtime/Reduction.cpp @@ -119,6 +119,38 @@ } }; +/// Placeholder for real*10 version of Norm2 Intrinsic +struct ForcedNorm2Real10 { + static constexpr const char *name = ExpandAndQuoteKey(RTNAME(Norm2_10)); + static constexpr fir::runtime::FuncTypeBuilderFunc getTypeModel() { + return [](mlir::MLIRContext *ctx) { + auto ty = mlir::FloatType::getF80(ctx); + auto boxTy = + fir::runtime::getModel()(ctx); + auto strTy = fir::ReferenceType::get(mlir::IntegerType::get(ctx, 8)); + auto intTy = mlir::IntegerType::get(ctx, 8 * sizeof(int)); + return mlir::FunctionType::get(ctx, {boxTy, strTy, intTy, intTy, boxTy}, + {ty}); + }; + } +}; + +/// Placeholder for real*16 version of Norm2 Intrinsic +struct ForcedNorm2Real16 { + static constexpr const char *name = ExpandAndQuoteKey(RTNAME(Norm2_16)); + static constexpr fir::runtime::FuncTypeBuilderFunc getTypeModel() { + return [](mlir::MLIRContext *ctx) { + auto ty = mlir::FloatType::getF128(ctx); + auto boxTy = + fir::runtime::getModel()(ctx); + auto strTy = fir::ReferenceType::get(mlir::IntegerType::get(ctx, 8)); + auto intTy = mlir::IntegerType::get(ctx, 8 * sizeof(int)); + return mlir::FunctionType::get(ctx, {boxTy, strTy, intTy, intTy, boxTy}, + {ty}); + }; + } +}; + /// Placeholder for real*10 version of Product Intrinsic struct ForcedProductReal10 { static constexpr const char *name = ExpandAndQuoteKey(RTNAME(ProductReal10)); @@ -849,6 +881,52 @@ return builder.create(loc, func, args).getResult(0); } +/// Generate call to `Norm2Dim` intrinsic runtime routine. This is the version +/// that takes a dim argument. +void fir::runtime::genNorm2Dim(fir::FirOpBuilder &builder, mlir::Location loc, + mlir::Value resultBox, mlir::Value arrayBox, + mlir::Value dim) { + auto maskBox = + builder.createNullConstant(loc, fir::BoxType::get(builder.getI1Type())); + auto func = fir::runtime::getRuntimeFunc(loc, builder); + genReduction3Args(func, builder, loc, resultBox, arrayBox, dim, maskBox); +} + +/// Generate call to `Norm2` intrinsic runtime routine. This is the version +/// that does not take a dim argument. +mlir::Value fir::runtime::genNorm2(fir::FirOpBuilder &builder, + mlir::Location loc, mlir::Value arrayBox) { + mlir::func::FuncOp func; + auto ty = arrayBox.getType(); + auto arrTy = fir::dyn_cast_ptrOrBoxEleTy(ty); + auto eleTy = arrTy.cast().getEleTy(); + auto dim = builder.createIntegerConstant(loc, builder.getIndexType(), 0); + auto maskBox = + builder.createNullConstant(loc, fir::BoxType::get(builder.getI1Type())); + + if (eleTy.isF16() || eleTy.isBF16()) + TODO(loc, "half-precision NORM2"); + else if (eleTy.isF32()) + func = fir::runtime::getRuntimeFunc(loc, builder); + else if (eleTy.isF64()) + func = fir::runtime::getRuntimeFunc(loc, builder); + else if (eleTy.isF80()) + func = fir::runtime::getRuntimeFunc(loc, builder); + else if (eleTy.isF128()) + func = fir::runtime::getRuntimeFunc(loc, builder); + else + fir::emitFatalError(loc, "invalid type in NORM2"); + + auto fTy = func.getFunctionType(); + auto sourceFile = fir::factory::locationToFilename(builder, loc); + auto sourceLine = + fir::factory::locationToLineNo(builder, loc, fTy.getInput(2)); + auto args = fir::runtime::createArguments( + builder, loc, fTy, arrayBox, sourceFile, sourceLine, dim, maskBox); + + return builder.create(loc, func, args).getResult(0); +} + /// Generate call to `Parity` intrinsic runtime routine. This routine is /// specialized for mask arguments with rank == 1. mlir::Value fir::runtime::genParity(fir::FirOpBuilder &builder, Index: flang/test/Lower/Intrinsics/norm2.f90 =================================================================== --- /dev/null +++ flang/test/Lower/Intrinsics/norm2.f90 @@ -0,0 +1,90 @@ +! RUN: bbc -emit-fir %s -o - | FileCheck %s +! RUN: %flang_fc1 -emit-fir %s -o - | FileCheck %s + +! CHECK-LABEL: func @_QPnorm2_test_4( +! CHECK-SAME: %[[arg0:.*]]: !fir.box>{{.*}}) -> f32 +real(4) function norm2_test_4(a) + real(4) :: a(:) + ! CHECK-DAG: %[[c0:.*]] = arith.constant 0 : index + ! CHECK-DAG: %[[m:.*]] = fir.zero_bits !fir.box + ! CHECK-DAG: %[[arr:.*]] = fir.convert %[[arg0]] : (!fir.box>) -> !fir.box + ! CHECK: %[[dim:.*]] = fir.convert %[[c0]] : (index) -> i32 + ! CHECK: %[[mask:.*]] = fir.convert %[[m]] : (!fir.box) -> !fir.box + norm2_test_4 = norm2(a) + ! CHECK: %{{.*}} = fir.call @_FortranANorm2_4(%[[arr]], %{{.*}}, %{{.*}}, %[[dim]], %[[mask]]) fastmath : (!fir.box, !fir.ref, i32, i32, !fir.box) -> f32 +end function norm2_test_4 + +! CHECK-LABEL: func @_QPnorm2_test_8( +! CHECK-SAME: %[[arg0:.*]]: !fir.box>{{.*}}) -> f64 +real(8) function norm2_test_8(a) + real(8) :: a(:,:) + ! CHECK-DAG: %[[c0:.*]] = arith.constant 0 : index + ! CHECK-DAG: %[[m:.*]] = fir.zero_bits !fir.box + ! CHECK-DAG: %[[arr:.*]] = fir.convert %[[arg0]] : (!fir.box>) -> !fir.box + ! CHECK: %[[dim:.*]] = fir.convert %[[c0]] : (index) -> i32 + ! CHECK: %[[mask:.*]] = fir.convert %[[m]] : (!fir.box) -> !fir.box + norm2_test_8 = norm2(a) + ! CHECK: %{{.*}} = fir.call @_FortranANorm2_8(%[[arr]], %{{.*}}, %{{.*}}, %[[dim]], %[[mask]]) fastmath : (!fir.box, !fir.ref, i32, i32, !fir.box) -> f64 +end function norm2_test_8 + +! CHECK-LABEL: func @_QPnorm2_test_10( +! CHECK-SAME: %[[arg0:.*]]: !fir.box>{{.*}}) -> f80 +real(10) function norm2_test_10(a) + real(10) :: a(:,:,:) + ! CHECK-DAG: %[[c0:.*]] = arith.constant 0 : index + ! CHECK-DAG: %[[m:.*]] = fir.zero_bits !fir.box + ! CHECK-DAG: %[[arr:.*]] = fir.convert %[[arg0]] : (!fir.box>) -> !fir.box + ! CHECK: %[[dim:.*]] = fir.convert %[[c0]] : (index) -> i32 + ! CHECK: %[[mask:.*]] = fir.convert %[[m]] : (!fir.box) -> !fir.box + norm2_test_10 = norm2(a) + ! CHECK: %{{.*}} = fir.call @_FortranANorm2_10(%[[arr]], %{{.*}}, %{{.*}}, %[[dim]], %[[mask]]) fastmath : (!fir.box, !fir.ref, i32, i32, !fir.box) -> f80 +end function norm2_test_10 + +! CHECK-LABEL: func @_QPnorm2_test_16( +! CHECK-SAME: %[[arg0:.*]]: !fir.box>{{.*}}) -> f128 +real(16) function norm2_test_16(a) + real(16) :: a(:,:,:) + ! CHECK-DAG: %[[c0:.*]] = arith.constant 0 : index + ! CHECK-DAG: %[[m:.*]] = fir.zero_bits !fir.box + ! CHECK-DAG: %[[arr:.*]] = fir.convert %[[arg0]] : (!fir.box>) -> !fir.box + ! CHECK: %[[dim:.*]] = fir.convert %[[c0]] : (index) -> i32 + ! CHECK: %[[mask:.*]] = fir.convert %[[m]] : (!fir.box) -> !fir.box + norm2_test_16 = norm2(a) + ! CHECK: %{{.*}} = fir.call @_FortranANorm2_16(%[[arr]], %{{.*}}, %{{.*}}, %[[dim]], %[[mask]]) fastmath : (!fir.box, !fir.ref, i32, i32, !fir.box) -> f128 +end function norm2_test_16 + +! CHECK-LABEL: func @_QPnorm2_test_dim_2( +! CHECK-SAME: %[[arg0:.*]]: !fir.box>{{.*}}, %[[arg1:.*]]: !fir.box>{{.*}}) +subroutine norm2_test_dim_2(a,r) + real :: a(:,:) + real :: r(:) + ! CHECK-DAG: %[[dim:.*]] = arith.constant 1 : i32 + ! CHECK-DAG: %[[r:.*]] = fir.alloca !fir.box>> + ! CHECK-DAG: %[[m:.*]] = fir.zero_bits !fir.box + ! CHECK-DAG: %[[res:.*]] = fir.convert %[[r]] : (!fir.ref>>>) -> !fir.ref> + ! CHECK: %[[arr:.*]] = fir.convert %[[arg0]] : (!fir.box>) -> !fir.box + ! CHECK-DAG: %[[mask:.*]] = fir.convert %[[m]] : (!fir.box) -> !fir.box + r = norm2(a,dim=1) + ! CHECK: %{{.*}} = fir.call @_FortranANorm2Dim(%[[res]], %[[arr]], %[[dim]], %{{.*}}, %{{.*}}, %[[mask]]) fastmath : (!fir.ref>, !fir.box, i32, !fir.ref, i32, !fir.box) -> none + ! CHECK: %[[box:.*]] = fir.load %[[r]] : !fir.ref>>> + ! CHECK-DAG: %[[addr:.*]] = fir.box_addr %[[box]] : (!fir.box>>) -> !fir.heap> + ! CHECK-DAG: fir.freemem %[[addr]] +end subroutine norm2_test_dim_2 + +! CHECK-LABEL: func @_QPnorm2_test_dim_3( +! CHECK-SAME: %[[arg0:.*]]: !fir.box>{{.*}}, %[[arg1:.*]]: !fir.box>{{.*}}) +subroutine norm2_test_dim_3(a,r) + real :: a(:,:,:) + real :: r(:,:) + ! CHECK-DAG: %[[dim:.*]] = arith.constant 3 : i32 + ! CHECK-DAG: %[[r:.*]] = fir.alloca !fir.box>> + ! CHECK-DAG: %[[m:.*]] = fir.zero_bits !fir.box + ! CHECK-DAG: %[[res:.*]] = fir.convert %[[r]] : (!fir.ref>>>) -> !fir.ref> + ! CHECK: %[[arr:.*]] = fir.convert %[[arg0]] : (!fir.box>) -> !fir.box + ! CHECK-DAG: %[[mask:.*]] = fir.convert %[[m]] : (!fir.box) -> !fir.box + r = norm2(a,dim=3) + ! CHECK: %{{.*}} = fir.call @_FortranANorm2Dim(%[[res]], %[[arr]], %[[dim]], %{{.*}}, %{{.*}}, %[[mask]]) fastmath : (!fir.ref>, !fir.box, i32, !fir.ref, i32, !fir.box) -> none + ! CHECK: %[[box:.*]] = fir.load %[[r]] : !fir.ref>>> + ! CHECK-DAG: %[[addr:.*]] = fir.box_addr %[[box]] : (!fir.box>>) -> !fir.heap> + ! CHECK-DAG: fir.freemem %[[addr]] +end subroutine norm2_test_dim_3