diff --git a/llvm/docs/LangRef.rst b/llvm/docs/LangRef.rst --- a/llvm/docs/LangRef.rst +++ b/llvm/docs/LangRef.rst @@ -19164,6 +19164,105 @@ Other values may be used to represent additional rounding modes, supported by a target. These values are target-specific. +'``llvm.get.fpmode``' Intrinsic +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Syntax: +""""""" + +This is an overloaded intrinsic. The overloaded type is an integer type used by +a particular target to represent floating-point control modes. + +:: + + declare i8 @llvm.get.fpmode.i8() + declare i16 @llvm.get.fpmode.i16() + declare i32 @llvm.get.fpmode.i32() + declare i64 @llvm.get.fpmode.i64() + +Overview: +""""""""" + +The '``llvm.get.fpmode``' intrinsic reads floating-point control modes. + +Arguments: +"""""""""" + +None. + +Semantics: +"""""""""" + +The '``llvm.get.fpmode``' intrinsic reads the current floating-point control +modes, such as rounding direction, precision, treatment of denormals and so on. +It is similar to the C library function 'fegetmode'; however, this function +does not store the set of control modes into memory but returns it as an +integer value. Interpretation of the bits in this value is target-dependent. + +'``llvm.set.fpmode``' Intrinsic +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Syntax: +""""""" + +This is an overloaded intrinsic. The overloaded type is an integer type used by +a particular target to represent floating-point control modes. + +:: + + declare void @llvm.set.fpmode.i8(i8 <val>) + declare void @llvm.set.fpmode.i16(i16 <val>) + declare void @llvm.set.fpmode.i32(i32 <val>) + declare void @llvm.set.fpmode.i64(i64 <val>) + +Overview: +""""""""" + +The '``llvm.set.fpmode``' intrinsic sets floating-point control modes. + +Arguments: +"""""""""" + +The argument is a set of floating-point control modes. 
+ +Semantics: +"""""""""" + +The '``llvm.set.fpmode``' intrinsic sets the current dynamic floating-point +control modes to the state specified by the argument, which must be obtained by +a call to '``llvm.get.fpmode``' or constructed in a target-specific way. It is +similar to the C library function 'fesetmode'; however, this function does not +read the set of control modes from memory but receives it as an integer value. + +'``llvm.reset.fpmode``' Intrinsic +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Syntax: +""""""" + +:: + + declare void @llvm.reset.fpmode() + +Overview: +""""""""" + +The '``llvm.reset.fpmode``' intrinsic sets the default dynamic floating-point +control modes. + +Arguments: +"""""""""" + +None. + +Semantics: +"""""""""" + +The '``llvm.reset.fpmode``' intrinsic sets the current dynamic floating-point +control modes to the default state. It is similar to the call +'fesetmode(FE_DFL_MODE)'; however, this function does not return any value. + + General Intrinsics ------------------ diff --git a/llvm/include/llvm/CodeGen/ISDOpcodes.h b/llvm/include/llvm/CodeGen/ISDOpcodes.h --- a/llvm/include/llvm/CodeGen/ISDOpcodes.h +++ b/llvm/include/llvm/CodeGen/ISDOpcodes.h @@ -821,6 +821,18 @@ /// FSINCOS - Compute both fsin and fcos as a single operation. FSINCOS, + /// Reads the current dynamic floating-point control modes. The argument is + /// the token chain. + GET_FPMODE, + + /// Sets the current dynamic floating-point control modes. The first argument + /// is the token chain, the second is the control modes as an integer value. + SET_FPMODE, + + /// Sets the default dynamic floating-point control modes. The argument is + /// the token chain. 
+ RESET_FPMODE, + /// LOAD and STORE have token chains as their first operand, then the same /// operands as an LLVM load/store instruction, then an offset node that /// is added / subtracted from the base pointer to form the address (for diff --git a/llvm/include/llvm/IR/IRBuilder.h b/llvm/include/llvm/IR/IRBuilder.h --- a/llvm/include/llvm/IR/IRBuilder.h +++ b/llvm/include/llvm/IR/IRBuilder.h @@ -897,6 +897,24 @@ return CreateBinaryIntrinsic(Intrinsic::maximum, LHS, RHS, nullptr, Name); } + /// Create a call to the get_fpmode intrinsic. + /// \param ModeTy Integer type used by the target to represent floating-point + /// control modes. + CallInst *CreateGetFPMode(Type *ModeTy, const Twine &Name = "") { + return CreateIntrinsic(Intrinsic::get_fpmode, {ModeTy}, {}, nullptr, Name); + } + + /// Create a call to the set_fpmode intrinsic; \p Modes is an integer value. + CallInst *CreateSetFPMode(Value *Modes, const Twine &Name = "") { + return CreateIntrinsic(Intrinsic::set_fpmode, {Modes->getType()}, {Modes}, + nullptr, Name); + } + + /// Create a call to the reset_fpmode intrinsic, which takes no arguments. + CallInst *CreateResetFPMode(const Twine &Name = "") { + return CreateIntrinsic(Intrinsic::reset_fpmode, {}, {}, nullptr, Name); + } + private: /// Create a call to a masked intrinsic with given Id. 
CallInst *CreateMaskedIntrinsic(Intrinsic::ID Id, ArrayRef<Value *> Ops,
diff --git a/llvm/include/llvm/IR/Intrinsics.td b/llvm/include/llvm/IR/Intrinsics.td
--- a/llvm/include/llvm/IR/Intrinsics.td
+++ b/llvm/include/llvm/IR/Intrinsics.td
@@ -654,6 +654,17 @@
   def int_flt_rounds : Intrinsic<[llvm_i32_ty], []>;
 }
 
+def int_get_fpmode      : Intrinsic<[llvm_anyint_ty], [],
+                                    [IntrWillReturn, IntrReadMem, IntrNoSync,
+                                     IntrInaccessibleMemOnly]>;
+def int_set_fpmode      : Intrinsic<[], [llvm_anyint_ty],
+                                    [IntrWillReturn, IntrWriteMem, IntrNoSync,
+                                     IntrInaccessibleMemOnly]>;
+def int_reset_fpmode    : Intrinsic<[], [],
+                                    [IntrWillReturn, IntrWriteMem, IntrNoSync,
+                                     IntrInaccessibleMemOnly]>;
+
+
 //===--------------- Constrained Floating Point Intrinsics ----------------===//
 //
 
diff --git a/llvm/include/llvm/IR/RuntimeLibcalls.def b/llvm/include/llvm/IR/RuntimeLibcalls.def
--- a/llvm/include/llvm/IR/RuntimeLibcalls.def
+++ b/llvm/include/llvm/IR/RuntimeLibcalls.def
@@ -280,6 +280,10 @@
 HANDLE_LIBCALL(LLRINT_F128, "llrintl")
 HANDLE_LIBCALL(LLRINT_PPCF128, "llrintl")
 
+// Floating point environment
+HANDLE_LIBCALL(FEGETMODE, "fegetmode")
+HANDLE_LIBCALL(FESETMODE, "fesetmode")
+
 // Conversion
 HANDLE_LIBCALL(FPEXT_F32_PPCF128, "__gcc_stoq")
 HANDLE_LIBCALL(FPEXT_F64_PPCF128, "__gcc_dtoq")
diff --git a/llvm/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp b/llvm/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp
--- a/llvm/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp
@@ -186,6 +186,9 @@
   SDValue ExpandInsertToVectorThroughStack(SDValue Op);
   SDValue ExpandVectorBuildThroughStack(SDNode* Node);
 
+  SDValue makeStateFunctionCall(SDNode *Node, RTLIB::Libcall LC, SDValue MemOp,
+                                SDValue InChain);
+
   SDValue ExpandConstantFP(ConstantFPSDNode *CFP, bool UseCP);
   SDValue ExpandConstant(ConstantSDNode *CP);
 
@@ -1161,6 +1164,10 @@
     Action = TLI.getOperationAction(
         Node->getOpcode(), Node->getOperand(0).getValueType());
     break;
+  case ISD::SET_FPMODE:
+    Action = TLI.getOperationAction(Node->getOpcode(),
+                                    Node->getOperand(1).getValueType());
+    break;
   default:
     if (Node->getOpcode() >= ISD::BUILTIN_OP_END) {
       Action = TargetLowering::Legal;
@@ -1447,6 +1454,33 @@
   return DAG.getLoad(VT, dl, StoreChain, FIPtr, PtrInfo);
 }
 
+// Helper used to make a call to a library function that has one argument of
+// pointer type. The return value is void or ignored. Such functions include
+// 'fegetmode', 'fesetmode' and others, which are used to get or set state.
+// The call is chained after InChain, so any store that initializes the memory
+// referenced by MemOp must be reachable through InChain.
+// Returns the outgoing token chain.
+SDValue SelectionDAGLegalize::makeStateFunctionCall(SDNode *Node,
+                                                    RTLIB::Libcall LC,
+                                                    SDValue MemOp,
+                                                    SDValue InChain) {
+  SDLoc DLoc(Node);
+  TargetLowering::ArgListTy Args;
+  TargetLowering::ArgListEntry Entry;
+  Entry.Node = MemOp;
+  Entry.Ty = MemOp.getValueType().getTypeForEVT(*DAG.getContext());
+  Args.push_back(Entry);
+  SDValue Callee = DAG.getExternalSymbol(TLI.getLibcallName(LC),
+                                         TLI.getPointerTy(DAG.getDataLayout()));
+  TargetLowering::CallLoweringInfo CLI(DAG);
+  CLI.setDebugLoc(DLoc)
+      .setChain(InChain)
+      .setLibCallee(TLI.getLibcallCallingConv(LC),
+                    Type::getVoidTy(*DAG.getContext()), Callee,
+                    std::move(Args));
+  return TLI.LowerCallTo(CLI).second;
+}
+
 /// Bitcast a floating-point value to an integer value. Only bitcast the part
 /// containing the sign bit if the target has no integer value capable of
 /// holding all bits of the floating-point value.
@@ -4317,6 +4351,50 @@
       break;
     }
     break;
+  case ISD::GET_FPMODE: {
+    // Call fegetmode, which saves control modes into a stack slot. Then load
+    // the value to return from the stack.
+    EVT ModeVT = Node->getValueType(0);
+    SDValue StackPtr = DAG.CreateStackTemporary(ModeVT);
+    int SPFI = cast<FrameIndexSDNode>(StackPtr.getNode())->getIndex();
+    SDValue Chain = makeStateFunctionCall(Node, RTLIB::FEGETMODE, StackPtr,
+                                          Node->getOperand(0));
+    // Load with the mode type, not with the type of the stack slot address.
+    SDValue LdInst = DAG.getLoad(
+        ModeVT, dl, Chain, StackPtr,
+        MachinePointerInfo::getFixedStack(DAG.getMachineFunction(), SPFI));
+    Results.push_back(LdInst);
+    Results.push_back(LdInst.getValue(1));
+    break;
+  }
+  case ISD::SET_FPMODE: {
+    // Move control modes to a stack slot and then call fesetmode with the
+    // pointer to the slot as argument. The call is chained after the store;
+    // otherwise the store is unreachable from the DAG root and is dropped,
+    // leaving fesetmode to read an uninitialized slot.
+    SDValue Mode = Node->getOperand(1);
+    EVT ModeVT = Mode.getValueType();
+    SDValue StackPtr = DAG.CreateStackTemporary(ModeVT);
+    int SPFI = cast<FrameIndexSDNode>(StackPtr.getNode())->getIndex();
+    SDValue StInst = DAG.getStore(
+        Node->getOperand(0), dl, Mode, StackPtr,
+        MachinePointerInfo::getFixedStack(DAG.getMachineFunction(), SPFI));
+    Results.push_back(
+        makeStateFunctionCall(Node, RTLIB::FESETMODE, StackPtr, StInst));
+    break;
+  }
+  case ISD::RESET_FPMODE: {
+    // It is legalized to call 'fesetmode(FE_DFL_MODE)'. On most targets
+    // FE_DFL_MODE is defined as '((const femode_t *) -1)' in glibc.
+    const DataLayout &DL = DAG.getDataLayout();
+    Type *ByteTy = EVT(MVT::i8).getTypeForEVT(*DAG.getContext());
+    auto *PtrTy = PointerType::get(ByteTy, DL.getAllocaAddrSpace());
+    Type *IntTy = DL.getIntPtrType(PtrTy);
+    SDValue Mode = DAG.getConstant(-1LL, dl, MVT::getVT(IntTy));
+    Results.push_back(makeStateFunctionCall(Node, RTLIB::FESETMODE, Mode,
+                                            Node->getOperand(0)));
+    break;
+  }
   }
 
   // Replace the original node with the legalized result.
diff --git a/llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp b/llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
--- a/llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp
@@ -6200,6 +6200,25 @@
                              DAG.getNode(ISD::BITCAST, sdl, MVT::f16,
                                          getValue(I.getArgOperand(0)))));
     return;
+  case Intrinsic::get_fpmode:
+    Res = DAG.getNode(
+        ISD::GET_FPMODE, sdl,
+        DAG.getVTList(TLI.getValueType(DAG.getDataLayout(), I.getType()),
+                      MVT::Other),
+        DAG.getRoot());
+    setValue(&I, Res);
+    DAG.setRoot(Res.getValue(1));
+    return;
+  case Intrinsic::set_fpmode:
+    Res = DAG.getNode(ISD::SET_FPMODE, sdl, MVT::Other, {DAG.getRoot()},
+                      getValue(I.getArgOperand(0)));
+    DAG.setRoot(Res);
+    return;
+  case Intrinsic::reset_fpmode: {
+    Res = DAG.getNode(ISD::RESET_FPMODE, sdl, MVT::Other, getRoot());
+    DAG.setRoot(Res);
+    return;
+  }
   case Intrinsic::pcmarker: {
     SDValue Tmp = getValue(I.getArgOperand(0));
     DAG.setRoot(DAG.getNode(ISD::PCMARKER, sdl, MVT::Other, getRoot(), Tmp));
diff --git a/llvm/lib/CodeGen/SelectionDAG/SelectionDAGDumper.cpp b/llvm/lib/CodeGen/SelectionDAG/SelectionDAGDumper.cpp
--- a/llvm/lib/CodeGen/SelectionDAG/SelectionDAGDumper.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/SelectionDAGDumper.cpp
@@ -403,6 +403,11 @@
   case ISD::PREALLOCATED_ARG:
     return "call_alloc";
 
+  // Environment manipulation
+  case ISD::GET_FPMODE:                 return "get_fpmode";
+  case ISD::SET_FPMODE:                 return "set_fpmode";
+  case ISD::RESET_FPMODE:               return "reset_fpmode";
+
   // Bit manipulation
   case ISD::ABS:                        return "abs";
   case ISD::BITREVERSE:                 return "bitreverse";
diff --git a/llvm/lib/CodeGen/TargetLoweringBase.cpp b/llvm/lib/CodeGen/TargetLoweringBase.cpp
--- a/llvm/lib/CodeGen/TargetLoweringBase.cpp
+++ b/llvm/lib/CodeGen/TargetLoweringBase.cpp
@@ -774,6 +774,13 @@
   // On most systems, DEBUGTRAP and TRAP have no difference. The "Expand"
   // here is to inform DAG Legalizer to replace DEBUGTRAP with TRAP.
   setOperationAction(ISD::DEBUGTRAP, MVT::Other, Expand);
+
+  // Environment operations default to expand to library calls.
+  for (MVT VT : {MVT::i8, MVT::i16, MVT::i32, MVT::i64}) {
+    setOperationAction(ISD::GET_FPMODE, VT, Expand);
+    setOperationAction(ISD::SET_FPMODE, VT, Expand);
+  }
+  setOperationAction(ISD::RESET_FPMODE, MVT::Other, Expand);
 }
 
 MVT TargetLoweringBase::getScalarShiftAmountTy(const DataLayout &DL,
diff --git a/llvm/test/CodeGen/Generic/fpenv.ll b/llvm/test/CodeGen/Generic/fpenv.ll
new file mode 100644
--- /dev/null
+++ b/llvm/test/CodeGen/Generic/fpenv.ll
@@ -0,0 +1,54 @@
+; RUN: llc -mtriple=msp430 -o - < %s | FileCheck %s
+
+; This test checks default lowering of the intrinsics operating on the
+; floating-point environment. MSP430 is used as a target in this test because
+; it does not have native FP support, so it hopefully won't get custom lowering
+; for these intrinsics.
+;
+; REQUIRES: msp430-registered-target
+
+target datalayout = "e-p:16:16:16-i8:8:8-i16:16:16-i32:16:32-n8:16"
+target triple = "msp430---elf"
+
+
+define i16 @func_01() {
+entry:
+  %fpenv = call i16 @llvm.get.fpmode.i16()
+  ret i16 %fpenv
+}
+; CHECK-LABEL: func_01:
+; CHECK: sub #2, r1
+; CHECK-NEXT: mov r1, r12
+; CHECK-NEXT: call #fegetmode
+; CHECK-NEXT: mov 0(r1), r12
+; CHECK-NEXT: add #2, r1
+; CHECK-NEXT: ret
+
+
+define void @func_02(i16 %fpenv) {
+entry:
+  call void @llvm.set.fpmode.i16(i16 %fpenv)
+  ret void
+}
+; CHECK-LABEL: func_02:
+; CHECK: sub #2, r1
+; CHECK-NEXT: mov r12, 0(r1)
+; CHECK-NEXT: mov r1, r12
+; CHECK-NEXT: call #fesetmode
+; CHECK-NEXT: add #2, r1
+; CHECK-NEXT: ret
+
+
+define void @func_03() {
+entry:
+  call void @llvm.reset.fpmode()
+  ret void
+}
+; CHECK-LABEL: func_03:
+; CHECK: mov #-1, r12
+; CHECK-NEXT: call #fesetmode
+; CHECK-NEXT: ret
+
+declare i16 @llvm.get.fpmode.i16()
+declare void @llvm.set.fpmode.i16(i16 %fpenv)
+declare void @llvm.reset.fpmode()
diff --git a/llvm/unittests/IR/IRBuilderTest.cpp
b/llvm/unittests/IR/IRBuilderTest.cpp
--- a/llvm/unittests/IR/IRBuilderTest.cpp
+++ b/llvm/unittests/IR/IRBuilderTest.cpp
@@ -988,4 +988,27 @@
       Builder.CreateAdd(Builder.getInt32(1), Builder.getInt32(2), "add");
   EXPECT_EQ(Add->getName(), "add");
 }
+
+// Checks that the IRBuilder helpers for the floating-point control mode
+// intrinsics emit calls to the expected intrinsics.
+TEST_F(IRBuilderTest, FPEnvironment) {
+  IRBuilder<> Builder(BB);
+
+  CallInst *Call = Builder.CreateResetFPMode();
+  IntrinsicInst *II = cast<IntrinsicInst>(Call);
+  EXPECT_EQ(Intrinsic::reset_fpmode, II->getIntrinsicID());
+
+  Call = Builder.CreateGetFPMode(Builder.getInt32Ty());
+  II = cast<IntrinsicInst>(Call);
+  EXPECT_EQ(Intrinsic::get_fpmode, II->getIntrinsicID());
+  EXPECT_EQ(Call->getType(), Builder.getInt32Ty());
+
+  // set_fpmode is overloaded on an integer type, so feed it the integer value
+  // produced by get_fpmode rather than a pointer such as an alloca.
+  Value *Modes = Call;
+  Call = Builder.CreateSetFPMode(Modes);
+  II = cast<IntrinsicInst>(Call);
+  EXPECT_EQ(Intrinsic::set_fpmode, II->getIntrinsicID());
+  EXPECT_EQ(Modes, Call->getArgOperand(0));
+}
 }