Diff 235882

llvm/include/llvm/CodeGen/ISDOpcodes.h

Show First 20 Lines • Show All 931 Lines • ▼ Show 20 Lines	enum NodeType {
VECREDUCE_AND, VECREDUCE_OR, VECREDUCE_XOR,		VECREDUCE_AND, VECREDUCE_OR, VECREDUCE_XOR,
VECREDUCE_SMAX, VECREDUCE_SMIN, VECREDUCE_UMAX, VECREDUCE_UMIN,		VECREDUCE_SMAX, VECREDUCE_SMIN, VECREDUCE_UMAX, VECREDUCE_UMIN,

/// BUILTIN_OP_END - This must be the last enum value in this list.		/// BUILTIN_OP_END - This must be the last enum value in this list.
/// The target-specific pre-isel opcode values start here.		/// The target-specific pre-isel opcode values start here.
BUILTIN_OP_END		BUILTIN_OP_END
};		};

		/// FIRST_TARGET_STRICTFP_OPCODE - Target-specific pre-isel operations
		/// which cannot raise FP exceptions should be less than this value.
		/// Those that do must not be less than this value.
		static const int FIRST_TARGET_STRICTFP_OPCODE = BUILTIN_OP_END+400;

/// FIRST_TARGET_MEMORY_OPCODE - Target-specific pre-isel operations		/// FIRST_TARGET_MEMORY_OPCODE - Target-specific pre-isel operations
/// which do not reference a specific memory location should be less than		/// which do not reference a specific memory location should be less than
/// this value. Those that do must not be less than this value, and can		/// this value. Those that do must not be less than this value, and can
/// be used with SelectionDAG::getMemIntrinsicNode.		/// be used with SelectionDAG::getMemIntrinsicNode.
static const int FIRST_TARGET_MEMORY_OPCODE = BUILTIN_OP_END+400;		static const int FIRST_TARGET_MEMORY_OPCODE = BUILTIN_OP_END+500;

//===--------------------------------------------------------------------===//		//===--------------------------------------------------------------------===//
/// MemIndexedMode enum - This enum defines the load / store indexed		/// MemIndexedMode enum - This enum defines the load / store indexed
/// addressing modes.		/// addressing modes.
///		///
/// UNINDEXED "Normal" load / store. The effective address is already		/// UNINDEXED "Normal" load / store. The effective address is already
/// computed and is available in the base pointer. The offset		/// computed and is available in the base pointer. The offset
/// operand is always undefined. In addition to producing a		/// operand is always undefined. In addition to producing a
▲ Show 20 Lines • Show All 163 Lines • Show Last 20 Lines

llvm/include/llvm/CodeGen/SelectionDAGISel.h

Show First 20 Lines • Show All 304 Lines • ▼ Show 20 Lines	void SelectCodeCommon(SDNode NodeToMatch, const unsigned char MatcherTable,
unsigned TableSize);		unsigned TableSize);

/// Return true if complex patterns for this target can mutate the		/// Return true if complex patterns for this target can mutate the
/// DAG.		/// DAG.
virtual bool ComplexPatternFuncMutatesDAG() const {		virtual bool ComplexPatternFuncMutatesDAG() const {
return false;		return false;
}		}

		/// Return whether the node may raise an FP exception.
		bool mayRaiseFPException(SDNode *Node) const;

bool isOrEquivalentToAdd(const SDNode *N) const;		bool isOrEquivalentToAdd(const SDNode *N) const;

private:		private:

// Calls to these functions are generated by tblgen.		// Calls to these functions are generated by tblgen.
void Select_INLINEASM(SDNode *N, bool Branch);		void Select_INLINEASM(SDNode *N, bool Branch);
void Select_READ_REGISTER(SDNode *Op);		void Select_READ_REGISTER(SDNode *Op);
void Select_WRITE_REGISTER(SDNode *Op);		void Select_WRITE_REGISTER(SDNode *Op);
▲ Show 20 Lines • Show All 52 Lines • Show Last 20 Lines

llvm/include/llvm/CodeGen/SelectionDAGNodes.h

Show First 20 Lines • Show All 381 Lines • ▼ Show 20 Lines

public:		public:
/// Default constructor turns off all optimization flags.		/// Default constructor turns off all optimization flags.
SDNodeFlags()		SDNodeFlags()
: AnyDefined(false), NoUnsignedWrap(false), NoSignedWrap(false),		: AnyDefined(false), NoUnsignedWrap(false), NoSignedWrap(false),
Exact(false), NoNaNs(false), NoInfs(false),		Exact(false), NoNaNs(false), NoInfs(false),
NoSignedZeros(false), AllowReciprocal(false), VectorReduction(false),		NoSignedZeros(false), AllowReciprocal(false), VectorReduction(false),
AllowContract(false), ApproximateFuncs(false),		AllowContract(false), ApproximateFuncs(false),
AllowReassociation(false), NoFPExcept(true) {}		AllowReassociation(false), NoFPExcept(false) {}

/// Propagate the fast-math-flags from an IR FPMathOperator.		/// Propagate the fast-math-flags from an IR FPMathOperator.
void copyFMF(const FPMathOperator &FPMO) {		void copyFMF(const FPMathOperator &FPMO) {
setNoNaNs(FPMO.hasNoNaNs());		setNoNaNs(FPMO.hasNoNaNs());
setNoInfs(FPMO.hasNoInfs());		setNoInfs(FPMO.hasNoInfs());
setNoSignedZeros(FPMO.hasNoSignedZeros());		setNoSignedZeros(FPMO.hasNoSignedZeros());
setAllowReciprocal(FPMO.hasAllowReciprocal());		setAllowReciprocal(FPMO.hasAllowReciprocal());
setAllowContract(FPMO.hasAllowContract());		setAllowContract(FPMO.hasAllowContract());
▲ Show 20 Lines • Show All 46 Lines • ▼ Show 20 Lines	public:
void setApproximateFuncs(bool b) {		void setApproximateFuncs(bool b) {
setDefined();		setDefined();
ApproximateFuncs = b;		ApproximateFuncs = b;
}		}
void setAllowReassociation(bool b) {		void setAllowReassociation(bool b) {
setDefined();		setDefined();
AllowReassociation = b;		AllowReassociation = b;
}		}
void setFPExcept(bool b) {		void setNoFPExcept(bool b) {
setDefined();		setDefined();
NoFPExcept = !b;		NoFPExcept = b;
}		}

// These are accessors for each flag.		// These are accessors for each flag.
bool hasNoUnsignedWrap() const { return NoUnsignedWrap; }		bool hasNoUnsignedWrap() const { return NoUnsignedWrap; }
bool hasNoSignedWrap() const { return NoSignedWrap; }		bool hasNoSignedWrap() const { return NoSignedWrap; }
bool hasExact() const { return Exact; }		bool hasExact() const { return Exact; }
bool hasNoNaNs() const { return NoNaNs; }		bool hasNoNaNs() const { return NoNaNs; }
bool hasNoInfs() const { return NoInfs; }		bool hasNoInfs() const { return NoInfs; }
bool hasNoSignedZeros() const { return NoSignedZeros; }		bool hasNoSignedZeros() const { return NoSignedZeros; }
bool hasAllowReciprocal() const { return AllowReciprocal; }		bool hasAllowReciprocal() const { return AllowReciprocal; }
bool hasVectorReduction() const { return VectorReduction; }		bool hasVectorReduction() const { return VectorReduction; }
bool hasAllowContract() const { return AllowContract; }		bool hasAllowContract() const { return AllowContract; }
bool hasApproximateFuncs() const { return ApproximateFuncs; }		bool hasApproximateFuncs() const { return ApproximateFuncs; }
bool hasAllowReassociation() const { return AllowReassociation; }		bool hasAllowReassociation() const { return AllowReassociation; }
bool hasFPExcept() const { return !NoFPExcept; }		bool hasNoFPExcept() const { return NoFPExcept; }

bool isFast() const {		bool isFast() const {
return NoSignedZeros && AllowReciprocal && NoNaNs && NoInfs && NoFPExcept &&		return NoSignedZeros && AllowReciprocal && NoNaNs && NoInfs && NoFPExcept &&
AllowContract && ApproximateFuncs && AllowReassociation;		AllowContract && ApproximateFuncs && AllowReassociation;
}		}

/// Clear any flags in this flag set that aren't also set in Flags.		/// Clear any flags in this flag set that aren't also set in Flags.
/// If the given Flags are undefined then don't do anything.		/// If the given Flags are undefined then don't do anything.
▲ Show 20 Lines • Show All 182 Lines • ▼ Show 20 Lines	public:
/// are the opcode values in the ISD and <target>ISD namespaces. For		/// are the opcode values in the ISD and <target>ISD namespaces. For
/// post-isel opcodes, see getMachineOpcode.		/// post-isel opcodes, see getMachineOpcode.
unsigned getOpcode() const { return (unsigned short)NodeType; }		unsigned getOpcode() const { return (unsigned short)NodeType; }

/// Test if this node has a target-specific opcode (in the		/// Test if this node has a target-specific opcode (in the
/// \<target\>ISD namespace).		/// \<target\>ISD namespace).
bool isTargetOpcode() const { return NodeType >= ISD::BUILTIN_OP_END; }		bool isTargetOpcode() const { return NodeType >= ISD::BUILTIN_OP_END; }

		/// Test if this node has a target-specific opcode that may raise
		/// FP exceptions (in the \<target\>ISD namespace and greater than or
		/// equal to FIRST_TARGET_STRICTFP_OPCODE). Note that all target memory
		/// opcodes are currently automatically considered to possibly raise
		/// FP exceptions as well.
		bool isTargetStrictFPOpcode() const {
		return NodeType >= ISD::FIRST_TARGET_STRICTFP_OPCODE;
		andrew.w.kaylorUnsubmitted Not Done Reply Inline Actions Shouldn't this also check for < FIRST_TARGET_MEMORY_OPCODE? andrew.w.kaylor: Shouldn't this also check for < FIRST_TARGET_MEMORY_OPCODE?
		uweigandAuthorUnsubmitted Done Reply Inline Actions As I said above: (Note that there is a bit of a quirk in identifying target nodes that are both memory nodes and strict FP nodes. To simplify the logic, right now all target memory nodes are automatically also considered strict FP nodes -- this could be fixed by adding one more range.) Not sure what the best way to handle this is. uweigand: As I said above: > (Note that there is a bit of a quirk in identifying target nodes that are…
		andrew.w.kaylorUnsubmitted Not Done Reply Inline Actions Yeah, sorry, I commented before reading the whole description (or apparently the comment here). I'm not sure how much practical impact this will have, but it just feels wrong. andrew.w.kaylor: Yeah, sorry, I commented before reading the whole description (or apparently the comment here).
		}

/// Test if this node has a target-specific		/// Test if this node has a target-specific
/// memory-referencing opcode (in the \<target\>ISD namespace and		/// memory-referencing opcode (in the \<target\>ISD namespace and
/// greater than FIRST_TARGET_MEMORY_OPCODE).		/// greater than FIRST_TARGET_MEMORY_OPCODE).
bool isTargetMemoryOpcode() const {		bool isTargetMemoryOpcode() const {
return NodeType >= ISD::FIRST_TARGET_MEMORY_OPCODE;		return NodeType >= ISD::FIRST_TARGET_MEMORY_OPCODE;
}		}

/// Return true if the type of the node type undefined.		/// Return true if the type of the node type undefined.
▲ Show 20 Lines • Show All 1,997 Lines • Show Last 20 Lines

llvm/lib/CodeGen/SelectionDAG/InstrEmitter.cpp

Show First 20 Lines • Show All 876 Lines • ▼ Show 20 Lines	if (Flags.hasNoUnsignedWrap())
MI->setFlag(MachineInstr::MIFlag::NoUWrap);		MI->setFlag(MachineInstr::MIFlag::NoUWrap);

if (Flags.hasNoSignedWrap())		if (Flags.hasNoSignedWrap())
MI->setFlag(MachineInstr::MIFlag::NoSWrap);		MI->setFlag(MachineInstr::MIFlag::NoSWrap);

if (Flags.hasExact())		if (Flags.hasExact())
MI->setFlag(MachineInstr::MIFlag::IsExact);		MI->setFlag(MachineInstr::MIFlag::IsExact);

if (Flags.hasFPExcept())		if (MI->getDesc().mayRaiseFPException() && !Flags.hasNoFPExcept())
MI->setFlag(MachineInstr::MIFlag::FPExcept);		MI->setFlag(MachineInstr::MIFlag::FPExcept);
}		}

// Emit all of the actual operands of this instruction, adding them to the		// Emit all of the actual operands of this instruction, adding them to the
// instruction as appropriate.		// instruction as appropriate.
bool HasOptPRefs = NumDefs > NumResults;		bool HasOptPRefs = NumDefs > NumResults;
assert((!HasOptPRefs \|\| !HasPhysRegOuts) &&		assert((!HasOptPRefs \|\| !HasPhysRegOuts) &&
"Unable to cope with optional defs and phys regs defs!");		"Unable to cope with optional defs and phys regs defs!");
▲ Show 20 Lines • Show All 272 Lines • Show Last 20 Lines

llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 1,102 Lines • ▼ Show 20 Lines	if (SDNode *Node = getNodeForIRValue(&I)) {
SDNodeFlags IncomingFlags;		SDNodeFlags IncomingFlags;
IncomingFlags.copyFMF(*FPMO);		IncomingFlags.copyFMF(*FPMO);
if (!Node->getFlags().isDefined())		if (!Node->getFlags().isDefined())
Node->setFlags(IncomingFlags);		Node->setFlags(IncomingFlags);
else		else
Node->intersectFlagsWith(IncomingFlags);		Node->intersectFlagsWith(IncomingFlags);
}		}
}		}
		// Constrained FP intrinsics with fpexcept.ignore should also get
		// the NoFPExcept flag.
		if (auto *FPI = dyn_cast<ConstrainedFPIntrinsic>(&I))
		if (FPI->getExceptionBehavior() == fp::ExceptionBehavior::ebIgnore)
		if (SDNode *Node = getNodeForIRValue(&I)) {
		SDNodeFlags Flags = Node->getFlags();
		Flags.setNoFPExcept(true);
		Node->setFlags(Flags);
		}

if (!I.isTerminator() && !HasTailCall &&		if (!I.isTerminator() && !HasTailCall &&
!isStatepoint(&I)) // statepoints handle their exports internally		!isStatepoint(&I)) // statepoints handle their exports internally
CopyToExportRegsIfNeeded(&I);		CopyToExportRegsIfNeeded(&I);

CurInst = nullptr;		CurInst = nullptr;
}		}

▲ Show 20 Lines • Show All 5,848 Lines • ▼ Show 20 Lines	case ISD::STRICT_FSETCCS: {
Opers.push_back(DAG.getCondCode(getFCmpCondCode(FPCmp->getPredicate())));		Opers.push_back(DAG.getCondCode(getFCmpCondCode(FPCmp->getPredicate())));
break;		break;
}		}
}		}

SDVTList VTs = DAG.getVTList(ValueVTs);		SDVTList VTs = DAG.getVTList(ValueVTs);
SDValue Result = DAG.getNode(Opcode, sdl, VTs, Opers);		SDValue Result = DAG.getNode(Opcode, sdl, VTs, Opers);

if (FPI.getExceptionBehavior() != fp::ExceptionBehavior::ebIgnore) {
SDNodeFlags Flags;
Flags.setFPExcept(true);
Result->setFlags(Flags);
}

assert(Result.getNode()->getNumValues() == 2);		assert(Result.getNode()->getNumValues() == 2);
// See above -- chain is handled like for loads here.		// See above -- chain is handled like for loads here.
SDValue OutChain = Result.getValue(1);		SDValue OutChain = Result.getValue(1);
PendingLoads.push_back(OutChain);		PendingLoads.push_back(OutChain);
SDValue FPResult = Result.getValue(0);		SDValue FPResult = Result.getValue(0);
setValue(&FPI, FPResult);		setValue(&FPI, FPResult);
}		}

▲ Show 20 Lines • Show All 3,561 Lines • Show Last 20 Lines

llvm/lib/CodeGen/SelectionDAG/SelectionDAGDumper.cpp

Show First 20 Lines • Show All 541 Lines • ▼ Show 20 Lines	if (getFlags().hasApproximateFuncs())
OS << " afn";		OS << " afn";

if (getFlags().hasAllowReassociation())		if (getFlags().hasAllowReassociation())
OS << " reassoc";		OS << " reassoc";

if (getFlags().hasVectorReduction())		if (getFlags().hasVectorReduction())
OS << " vector-reduction";		OS << " vector-reduction";

if (getFlags().hasFPExcept())		if (getFlags().hasNoFPExcept())
OS << " fpexcept";		OS << " nofpexcept";

if (const MachineSDNode *MN = dyn_cast<MachineSDNode>(this)) {		if (const MachineSDNode *MN = dyn_cast<MachineSDNode>(this)) {
if (!MN->memoperands_empty()) {		if (!MN->memoperands_empty()) {
OS << "<";		OS << "<";
OS << "Mem:";		OS << "Mem:";
for (MachineSDNode::mmo_iterator i = MN->memoperands_begin(),		for (MachineSDNode::mmo_iterator i = MN->memoperands_begin(),
e = MN->memoperands_end(); i != e; ++i) {		e = MN->memoperands_end(); i != e; ++i) {
printMemOperand(OS, **i, G);		printMemOperand(OS, **i, G);
▲ Show 20 Lines • Show All 421 Lines • Show Last 20 Lines

llvm/lib/CodeGen/SelectionDAG/SelectionDAGISel.cpp

Show First 20 Lines • Show All 3,452 Lines • ▼ Show 20 Lines	case OPC_MorphNodeTo0: case OPC_MorphNodeTo1: case OPC_MorphNodeTo2: {
}		}

// If this has chain/glue inputs, add them.		// If this has chain/glue inputs, add them.
if (EmitNodeInfo & OPFL_Chain)		if (EmitNodeInfo & OPFL_Chain)
Ops.push_back(InputChain);		Ops.push_back(InputChain);
if ((EmitNodeInfo & OPFL_GlueInput) && InputGlue.getNode() != nullptr)		if ((EmitNodeInfo & OPFL_GlueInput) && InputGlue.getNode() != nullptr)
Ops.push_back(InputGlue);		Ops.push_back(InputGlue);

		// Check whether any matched node could raise an FP exception. Since all
		// such nodes must have a chain, it suffices to check ChainNodesMatched.
		craig.topperUnsubmitted Done Reply Inline Actions Why is only NodeToMatch important? Couldn't we be pattern matching multiple strict nodes? craig.topper: Why is only NodeToMatch important? Couldn't we be pattern matching multiple strict nodes?
		uweigandAuthorUnsubmitted Done Reply Inline Actions Good point. I've changed the code to check whether any of the matched nodes may raise an exception. uweigand: Good point. I've changed the code to check whether any of the matched nodes may raise an…
		// We need to perform this check before potentially modifying one of the
		// nodes via MorphNode.
		bool MayRaiseFPException = false;
		for (auto *N : ChainNodesMatched)
		if (mayRaiseFPException(N) && !N->getFlags().hasNoFPExcept()) {
		MayRaiseFPException = true;
		break;
		}

// Create the node.		// Create the node.
MachineSDNode *Res = nullptr;		MachineSDNode *Res = nullptr;
bool IsMorphNodeTo = Opcode == OPC_MorphNodeTo \|\|		bool IsMorphNodeTo = Opcode == OPC_MorphNodeTo \|\|
(Opcode >= OPC_MorphNodeTo0 && Opcode <= OPC_MorphNodeTo2);		(Opcode >= OPC_MorphNodeTo0 && Opcode <= OPC_MorphNodeTo2);
if (!IsMorphNodeTo) {		if (!IsMorphNodeTo) {
// If this is a normal EmitNode command, just create the new node and		// If this is a normal EmitNode command, just create the new node and
// add the results to the RecordedNodes list.		// add the results to the RecordedNodes list.
Res = CurDAG->getMachineNode(TargetOpc, SDLoc(NodeToMatch),		Res = CurDAG->getMachineNode(TargetOpc, SDLoc(NodeToMatch),
Show All 15 Lines	case OPC_MorphNodeTo0: case OPC_MorphNodeTo1: case OPC_MorphNodeTo2: {
assert((!E \|\| !is_contained(Chain, N)) &&		assert((!E \|\| !is_contained(Chain, N)) &&
"Chain node replaced during MorphNode");		"Chain node replaced during MorphNode");
Chain.erase(std::remove(Chain.begin(), Chain.end(), N), Chain.end());		Chain.erase(std::remove(Chain.begin(), Chain.end(), N), Chain.end());
});		});
Res = cast<MachineSDNode>(MorphNode(NodeToMatch, TargetOpc, VTList,		Res = cast<MachineSDNode>(MorphNode(NodeToMatch, TargetOpc, VTList,
Ops, EmitNodeInfo));		Ops, EmitNodeInfo));
}		}

		// Set the NoFPExcept flag when no original matched node could
		// raise an FP exception, but the new node potentially might.
		if (!MayRaiseFPException && mayRaiseFPException(Res)) {
		SDNodeFlags Flags = Res->getFlags();
		Flags.setNoFPExcept(true);
		Res->setFlags(Flags);
		}

// If the node had chain/glue results, update our notion of the current		// If the node had chain/glue results, update our notion of the current
// chain and glue.		// chain and glue.
if (EmitNodeInfo & OPFL_GlueOutput) {		if (EmitNodeInfo & OPFL_GlueOutput) {
InputGlue = SDValue(Res, VTs.size()-1);		InputGlue = SDValue(Res, VTs.size()-1);
if (EmitNodeInfo & OPFL_Chain)		if (EmitNodeInfo & OPFL_Chain)
InputChain = SDValue(Res, VTs.size()-2);		InputChain = SDValue(Res, VTs.size()-2);
} else if (EmitNodeInfo & OPFL_Chain)		} else if (EmitNodeInfo & OPFL_Chain)
InputChain = SDValue(Res, VTs.size()-1);		InputChain = SDValue(Res, VTs.size()-1);
▲ Show 20 Lines • Show All 139 Lines • ▼ Show 20 Lines	while (true) {

// End of this scope, pop it and try the next child in the containing		// End of this scope, pop it and try the next child in the containing
// scope.		// scope.
MatchScopes.pop_back();		MatchScopes.pop_back();
}		}
}		}
}		}

		/// Return whether the node may raise an FP exception.
		bool SelectionDAGISel::mayRaiseFPException(SDNode *N) const {
		// For machine opcodes, consult the MCID flag.
		if (N->isMachineOpcode()) {
		const MCInstrDesc &MCID = TII->get(N->getMachineOpcode());
		return MCID.mayRaiseFPException();
		}

		// For ISD opcodes, only StrictFP opcodes may raise an FP
		// exception.
		if (N->isTargetOpcode())
		return N->isTargetStrictFPOpcode();
		return N->isStrictFPOpcode();
		}

bool SelectionDAGISel::isOrEquivalentToAdd(const SDNode *N) const {		bool SelectionDAGISel::isOrEquivalentToAdd(const SDNode *N) const {
assert(N->getOpcode() == ISD::OR && "Unexpected opcode");		assert(N->getOpcode() == ISD::OR && "Unexpected opcode");
auto *C = dyn_cast<ConstantSDNode>(N->getOperand(1));		auto *C = dyn_cast<ConstantSDNode>(N->getOperand(1));
if (!C)		if (!C)
return false;		return false;

// Detect when "or" is used to add an offset to a stack object.		// Detect when "or" is used to add an offset to a stack object.
if (auto *FN = dyn_cast<FrameIndexSDNode>(N->getOperand(0))) {		if (auto *FN = dyn_cast<FrameIndexSDNode>(N->getOperand(0))) {
Show All 36 Lines

llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 6,184 Lines • ▼ Show 20 Lines	if (Node->isStrictFPOpcode()) {
{ Node->getOperand(0), InCvt });		{ Node->getOperand(0), InCvt });
Slow = DAG.getNode(ISD::STRICT_FADD, dl, { DstVT, MVT::Other },		Slow = DAG.getNode(ISD::STRICT_FADD, dl, { DstVT, MVT::Other },
{ Fast.getValue(1), Fast, Fast });		{ Fast.getValue(1), Fast, Fast });
Chain = Slow.getValue(1);		Chain = Slow.getValue(1);
// The STRICT_SINT_TO_FP inherits the exception mode from the		// The STRICT_SINT_TO_FP inherits the exception mode from the
// incoming STRICT_UINT_TO_FP node; the STRICT_FADD node can		// incoming STRICT_UINT_TO_FP node; the STRICT_FADD node can
// never raise any exception.		// never raise any exception.
SDNodeFlags Flags;		SDNodeFlags Flags;
Flags.setFPExcept(Node->getFlags().hasFPExcept());		Flags.setNoFPExcept(Node->getFlags().hasNoFPExcept());
Fast->setFlags(Flags);		Fast->setFlags(Flags);
		Flags.setNoFPExcept(true);
		Slow->setFlags(Flags);
} else {		} else {
SDValue SignCvt = DAG.getNode(ISD::SINT_TO_FP, dl, DstVT, Or);		SDValue SignCvt = DAG.getNode(ISD::SINT_TO_FP, dl, DstVT, Or);
Slow = DAG.getNode(ISD::FADD, dl, DstVT, SignCvt, SignCvt);		Slow = DAG.getNode(ISD::FADD, dl, DstVT, SignCvt, SignCvt);
Fast = DAG.getNode(ISD::SINT_TO_FP, dl, DstVT, Src);		Fast = DAG.getNode(ISD::SINT_TO_FP, dl, DstVT, Src);
}		}

Result = DAG.getSelect(dl, DstVT, SignBitTest, Slow, Fast);		Result = DAG.getSelect(dl, DstVT, SignBitTest, Slow, Fast);
return true;		return true;
▲ Show 20 Lines • Show All 1,319 Lines • Show Last 20 Lines

llvm/lib/Target/SystemZ/SystemZISelLowering.h

Show First 20 Lines • Show All 52 Lines • ▼ Show 20 Lines	enum NodeType : unsigned {
// Integer absolute.		// Integer absolute.
IABS,		IABS,

// Integer comparisons. There are three operands: the two values		// Integer comparisons. There are three operands: the two values
// to compare, and an integer of type SystemZICMP.		// to compare, and an integer of type SystemZICMP.
ICMP,		ICMP,

// Floating-point comparisons. The two operands are the values to compare.		// Floating-point comparisons. The two operands are the values to compare.
// Regular and strict (quiet and signaling) versions.		FCMP,
FCMP, STRICT_FCMP, STRICT_FCMPS,

// Test under mask. The first operand is ANDed with the second operand		// Test under mask. The first operand is ANDed with the second operand
// and the condition codes are set on the result. The third operand is		// and the condition codes are set on the result. The third operand is
// a boolean that is true if the condition codes need to distinguish		// a boolean that is true if the condition codes need to distinguish
// between CCMASK_TM_MIXED_MSB_0 and CCMASK_TM_MIXED_MSB_1 (which the		// between CCMASK_TM_MIXED_MSB_0 and CCMASK_TM_MIXED_MSB_1 (which the
// register forms do but the memory forms don't).		// register forms do but the memory forms don't).
TM,		TM,

▲ Show 20 Lines • Show All 173 Lines • ▼ Show 20 Lines	enum NodeType : unsigned {
// Likewise, but also set the condition codes on the result.		// Likewise, but also set the condition codes on the result.
VICMPES,		VICMPES,
VICMPHS,		VICMPHS,
VICMPHLS,		VICMPHLS,

// Compare floating-point vector operands 0 and 1 to produce the usual 0/-1		// Compare floating-point vector operands 0 and 1 to produce the usual 0/-1
// vector result. VFCMPE is for "ordered and equal", VFCMPH for "ordered and		// vector result. VFCMPE is for "ordered and equal", VFCMPH for "ordered and
// greater than" and VFCMPHE for "ordered and greater than or equal to".		// greater than" and VFCMPHE for "ordered and greater than or equal to".
// Regular and strict (quiet and signaling) versions.		VFCMPE,
VFCMPE, STRICT_VFCMPE, STRICT_VFCMPES,		VFCMPH,
VFCMPH, STRICT_VFCMPH, STRICT_VFCMPHS,		VFCMPHE,
VFCMPHE, STRICT_VFCMPHE, STRICT_VFCMPHES,

// Likewise, but also set the condition codes on the result.		// Likewise, but also set the condition codes on the result.
VFCMPES,		VFCMPES,
VFCMPHS,		VFCMPHS,
VFCMPHES,		VFCMPHES,

// Test floating-point data class for vectors.		// Test floating-point data class for vectors.
VFTCI,		VFTCI,

// Extend the even f32 elements of vector operand 0 to produce a vector		// Extend the even f32 elements of vector operand 0 to produce a vector
// of f64 elements. Regular and strict versions.		// of f64 elements.
VEXTEND, STRICT_VEXTEND,		VEXTEND,

// Round the f64 elements of vector operand 0 to f32s and store them in the		// Round the f64 elements of vector operand 0 to f32s and store them in the
// even elements of the result. Regular and strict versions.		// even elements of the result.
VROUND, STRICT_VROUND,		VROUND,

// AND the two vector operands together and set CC based on the result.		// AND the two vector operands together and set CC based on the result.
VTM,		VTM,

// String operations that set CC as a side-effect.		// String operations that set CC as a side-effect.
VFAE_CC,		VFAE_CC,
VFAEZ_CC,		VFAEZ_CC,
VFEE_CC,		VFEE_CC,
VFEEZ_CC,		VFEEZ_CC,
VFENE_CC,		VFENE_CC,
VFENEZ_CC,		VFENEZ_CC,
VISTR_CC,		VISTR_CC,
VSTRC_CC,		VSTRC_CC,
VSTRCZ_CC,		VSTRCZ_CC,
VSTRS_CC,		VSTRS_CC,
VSTRSZ_CC,		VSTRSZ_CC,

// Test Data Class.		// Test Data Class.
//		//
// Operand 0: the value to test		// Operand 0: the value to test
// Operand 1: the bit mask		// Operand 1: the bit mask
TDC,		TDC,

		// Strict variants of scalar floating-point comparisons.
		// Quiet and signaling versions.
		STRICT_FCMP = ISD::FIRST_TARGET_STRICTFP_OPCODE,
		STRICT_FCMPS,

		// Strict variants of vector floating-point comparisons.
		// Quiet and signaling versions.
		STRICT_VFCMPE,
		STRICT_VFCMPH,
		STRICT_VFCMPHE,
		STRICT_VFCMPES,
		STRICT_VFCMPHS,
		STRICT_VFCMPHES,

		// Strict variants of VEXTEND and VROUND.
		STRICT_VEXTEND,
		STRICT_VROUND,

// Wrappers around the inner loop of an 8- or 16-bit ATOMIC_SWAP or		// Wrappers around the inner loop of an 8- or 16-bit ATOMIC_SWAP or
// ATOMIC_LOAD_<op>.		// ATOMIC_LOAD_<op>.
//		//
// Operand 0: the address of the containing 32-bit-aligned field		// Operand 0: the address of the containing 32-bit-aligned field
// Operand 1: the second operand of <op>, in the high bits of an i32		// Operand 1: the second operand of <op>, in the high bits of an i32
// for everything except ATOMIC_SWAPW		// for everything except ATOMIC_SWAPW
// Operand 2: how many bits to rotate the i32 left to bring the first		// Operand 2: how many bits to rotate the i32 left to bring the first
// operand into the high bits		// operand into the high bits
▲ Show 20 Lines • Show All 385 Lines • Show Last 20 Lines

llvm/lib/Target/X86/X86ISelLowering.h

Show First 20 Lines • Show All 73 Lines • ▼ Show 20 Lines	enum NodeType : unsigned {
CALL,		CALL,

/// Same as call except it adds the NoTrack prefix.		/// Same as call except it adds the NoTrack prefix.
NT_CALL,		NT_CALL,

/// X86 compare and logical compare instructions.		/// X86 compare and logical compare instructions.
CMP, COMI, UCOMI,		CMP, COMI, UCOMI,

/// X86 strict FP compare instructions.
STRICT_FCMP, STRICT_FCMPS,

/// X86 bit-test instructions.		/// X86 bit-test instructions.
BT,		BT,

/// X86 SetCC. Operand 0 is condition code, and operand 1 is the EFLAGS		/// X86 SetCC. Operand 0 is condition code, and operand 1 is the EFLAGS
/// operand, usually produced by a CMP instruction.		/// operand, usually produced by a CMP instruction.
SETCC,		SETCC,

/// X86 Select		/// X86 Select
▲ Show 20 Lines • Show All 227 Lines • ▼ Show 20 Lines	enum NodeType : unsigned {
// Shifts of mask registers.		// Shifts of mask registers.
KSHIFTL, KSHIFTR,		KSHIFTL, KSHIFTR,

// Bit rotate by immediate		// Bit rotate by immediate
VROTLI, VROTRI,		VROTLI, VROTRI,

// Vector packed double/float comparison.		// Vector packed double/float comparison.
CMPP,		CMPP,
STRICT_CMPP,

// Vector integer comparisons.		// Vector integer comparisons.
PCMPEQ, PCMPGT,		PCMPEQ, PCMPGT,

// v8i16 Horizontal minimum and position.		// v8i16 Horizontal minimum and position.
PHMINPOS,		PHMINPOS,

MULTISHIFT,		MULTISHIFT,

/// Vector comparison generating mask bits for fp and		/// Vector comparison generating mask bits for fp and
/// integer signed and unsigned data types.		/// integer signed and unsigned data types.
CMPM,		CMPM,
STRICT_CMPM,
// Vector comparison with SAE for FP values		// Vector comparison with SAE for FP values
CMPM_SAE,		CMPM_SAE,

// Arithmetic operations with FLAGS results.		// Arithmetic operations with FLAGS results.
ADD, SUB, ADC, SBB, SMUL, UMUL,		ADD, SUB, ADC, SBB, SMUL, UMUL,
OR, XOR, AND,		OR, XOR, AND,

// Bit field extract.		// Bit field extract.
▲ Show 20 Lines • Show All 151 Lines • ▼ Show 20 Lines	enum NodeType : unsigned {

// Vector float/double to signed/unsigned integer.		// Vector float/double to signed/unsigned integer.
CVTP2SI, CVTP2UI, CVTP2SI_RND, CVTP2UI_RND,		CVTP2SI, CVTP2UI, CVTP2SI_RND, CVTP2UI_RND,
// Scalar float/double to signed/unsigned integer.		// Scalar float/double to signed/unsigned integer.
CVTS2SI, CVTS2UI, CVTS2SI_RND, CVTS2UI_RND,		CVTS2SI, CVTS2UI, CVTS2SI_RND, CVTS2UI_RND,

// Vector float/double to signed/unsigned integer with truncation.		// Vector float/double to signed/unsigned integer with truncation.
CVTTP2SI, CVTTP2UI, CVTTP2SI_SAE, CVTTP2UI_SAE,		CVTTP2SI, CVTTP2UI, CVTTP2SI_SAE, CVTTP2UI_SAE,
STRICT_CVTTP2SI, STRICT_CVTTP2UI,
// Scalar float/double to signed/unsigned integer with truncation.		// Scalar float/double to signed/unsigned integer with truncation.
CVTTS2SI, CVTTS2UI, CVTTS2SI_SAE, CVTTS2UI_SAE,		CVTTS2SI, CVTTS2UI, CVTTS2SI_SAE, CVTTS2UI_SAE,

// Vector signed/unsigned integer to float/double.		// Vector signed/unsigned integer to float/double.
CVTSI2P, CVTUI2P,		CVTSI2P, CVTUI2P,
STRICT_CVTSI2P, STRICT_CVTUI2P,		STRICT_CVTSI2P, STRICT_CVTUI2P,

// Masked versions of above. Used for v2f64->v4f32.		// Masked versions of above. Used for v2f64->v4f32.
▲ Show 20 Lines • Show All 82 Lines • ▼ Show 20 Lines	enum NodeType : unsigned {
UMWAIT, TPAUSE,		UMWAIT, TPAUSE,

// Enqueue Stores Instructions		// Enqueue Stores Instructions
ENQCMD, ENQCMDS,		ENQCMD, ENQCMDS,

// For avx512-vp2intersect		// For avx512-vp2intersect
VP2INTERSECT,		VP2INTERSECT,

		/// X86 strict FP compare instructions.
		STRICT_FCMP = ISD::FIRST_TARGET_STRICTFP_OPCODE,
		STRICT_FCMPS,

		// Vector packed double/float comparison.
		STRICT_CMPP,

		/// Vector comparison generating mask bits for fp and
		/// integer signed and unsigned data types.
		STRICT_CMPM,

		// Vector float/double to signed/unsigned integer with truncation.
		STRICT_CVTTP2SI, STRICT_CVTTP2UI,

// Compare and swap.		// Compare and swap.
LCMPXCHG_DAG = ISD::FIRST_TARGET_MEMORY_OPCODE,		LCMPXCHG_DAG = ISD::FIRST_TARGET_MEMORY_OPCODE,
LCMPXCHG8_DAG,		LCMPXCHG8_DAG,
LCMPXCHG16_DAG,		LCMPXCHG16_DAG,
LCMPXCHG8_SAVE_EBX_DAG,		LCMPXCHG8_SAVE_EBX_DAG,
LCMPXCHG16_SAVE_RBX_DAG,		LCMPXCHG16_SAVE_RBX_DAG,

/// LOCK-prefixed arithmetic read-modify-write instructions.		/// LOCK-prefixed arithmetic read-modify-write instructions.
▲ Show 20 Lines • Show All 1,084 Lines • Show Last 20 Lines

llvm/test/CodeGen/X86/fp-intrinsics-flags-x86_64.ll

	; RUN: llc -O3 -mtriple=x86_64-pc-linux < %s -stop-after=finalize-isel \| FileCheck %s			; RUN: llc -O3 -mtriple=x86_64-pc-linux < %s -stop-after=finalize-isel \| FileCheck %s

	define i32 @f20u(double %x) #0 {			define i32 @f20u(double %x) #0 {
	; CHECK-LABEL: name: f20u			; CHECK-LABEL: name: f20u
	; CHECK: liveins: $xmm0			; CHECK: liveins: $xmm0
	; CHECK: [[COPY:%[0-9]+]]:fr64 = COPY $xmm0			; CHECK: [[COPY:%[0-9]+]]:fr64 = COPY $xmm0
	; CHECK: [[CVTTSD2SI64rr:%[0-9]+]]:gr64 = CVTTSD2SI64rr [[COPY]], implicit $mxcsr			; CHECK: [[CVTTSD2SI64rr:%[0-9]+]]:gr64 = fpexcept CVTTSD2SI64rr [[COPY]], implicit $mxcsr
	; CHECK: [[COPY1:%[0-9]+]]:gr32 = COPY [[CVTTSD2SI64rr]].sub_32bit			; CHECK: [[COPY1:%[0-9]+]]:gr32 = COPY [[CVTTSD2SI64rr]].sub_32bit
	; CHECK: $eax = COPY [[COPY1]]			; CHECK: $eax = COPY [[COPY1]]
	; CHECK: RET 0, $eax			; CHECK: RET 0, $eax
	entry:			entry:
	%result = call i32 @llvm.experimental.constrained.fptoui.i32.f64(double %x, metadata !"fpexcept.strict") #0			%result = call i32 @llvm.experimental.constrained.fptoui.i32.f64(double %x, metadata !"fpexcept.strict") #0
	ret i32 %result			ret i32 %result
	}			}

	attributes #0 = { strictfp }			attributes #0 = { strictfp }

	declare i32 @llvm.experimental.constrained.fptoui.i32.f64(double, metadata)			declare i32 @llvm.experimental.constrained.fptoui.i32.f64(double, metadata)

llvm/test/CodeGen/X86/fp-intrinsics-flags.ll

Show All 23 Lines	; CHECK: RET 0, killed [[LD_Fp64m80_]]
ret double %result		ret double %result
}		}

define i64 @f20u64(double %x) #0 {		define i64 @f20u64(double %x) #0 {
entry:		entry:
; CHECK-LABEL: name: f20u64		; CHECK-LABEL: name: f20u64
; CHECK: [[MOVSDrm_alt:%[0-9]+]]:fr64 = MOVSDrm_alt %fixed-stack.0, 1, $noreg, 0, $noreg :: (load 8 from %fixed-stack.0, align 16)		; CHECK: [[MOVSDrm_alt:%[0-9]+]]:fr64 = MOVSDrm_alt %fixed-stack.0, 1, $noreg, 0, $noreg :: (load 8 from %fixed-stack.0, align 16)
; CHECK: [[MOVSDrm_alt1:%[0-9]+]]:fr64 = MOVSDrm_alt $noreg, 1, $noreg, %const.0, $noreg :: (load 8 from constant-pool)		; CHECK: [[MOVSDrm_alt1:%[0-9]+]]:fr64 = MOVSDrm_alt $noreg, 1, $noreg, %const.0, $noreg :: (load 8 from constant-pool)
; CHECK: COMISDrr [[MOVSDrm_alt1]], [[MOVSDrm_alt]], implicit-def $eflags, implicit $mxcsr		; CHECK: fpexcept COMISDrr [[MOVSDrm_alt1]], [[MOVSDrm_alt]], implicit-def $eflags, implicit $mxcsr
		craig.topper (inline comment, not done): Does this compare have fpexcept on it too?
		uweigand (author, inline reply, done): Yes, it does ... updated the patch to check for it.
; CHECK: [[FsFLD0SD:%[0-9]+]]:fr64 = FsFLD0SD		; CHECK: [[FsFLD0SD:%[0-9]+]]:fr64 = FsFLD0SD
; CHECK: JCC_1		; CHECK: JCC_1
; CHECK: [[PHI:%[0-9]+]]:fr64 = PHI [[MOVSDrm_alt1]], {{.}}, [[FsFLD0SD]], {{.}}		; CHECK: [[PHI:%[0-9]+]]:fr64 = PHI [[MOVSDrm_alt1]], {{.}}, [[FsFLD0SD]], {{.}}
; CHECK: [[SUBSDrr:%[0-9]+]]:fr64 = SUBSDrr [[MOVSDrm_alt]], killed [[PHI]], implicit $mxcsr		; CHECK: [[SUBSDrr:%[0-9]+]]:fr64 = fpexcept SUBSDrr [[MOVSDrm_alt]], killed [[PHI]], implicit $mxcsr
; CHECK: MOVSDmr %stack.0, 1, $noreg, 0, $noreg, killed [[SUBSDrr]] :: (store 8 into %stack.0)		; CHECK: MOVSDmr %stack.0, 1, $noreg, 0, $noreg, killed [[SUBSDrr]] :: (store 8 into %stack.0)
; CHECK: [[SETCCr:%[0-9]+]]:gr8 = SETCCr 6, implicit $eflags		; CHECK: [[SETCCr:%[0-9]+]]:gr8 = SETCCr 6, implicit $eflags
; CHECK: [[LD_Fp64m:%[0-9]+]]:rfp64 = LD_Fp64m %stack.0, 1, $noreg, 0, $noreg, implicit-def dead $fpsw, implicit $fpcw :: (load 8 from %stack.0)		; CHECK: [[LD_Fp64m:%[0-9]+]]:rfp64 = fpexcept LD_Fp64m %stack.0, 1, $noreg, 0, $noreg, implicit-def dead $fpsw, implicit $fpcw :: (load 8 from %stack.0)
; CHECK: FNSTCW16m %stack.1, 1, $noreg, 0, $noreg, implicit-def $fpsw, implicit $fpcw :: (store 2 into %stack.1)		; CHECK: FNSTCW16m %stack.1, 1, $noreg, 0, $noreg, implicit-def $fpsw, implicit $fpcw :: (store 2 into %stack.1)
; CHECK: [[MOVZX32rm16_:%[0-9]+]]:gr32 = MOVZX32rm16 %stack.1, 1, $noreg, 0, $noreg :: (load 2 from %stack.1)		; CHECK: [[MOVZX32rm16_:%[0-9]+]]:gr32 = MOVZX32rm16 %stack.1, 1, $noreg, 0, $noreg :: (load 2 from %stack.1)
; CHECK: [[OR32ri:%[0-9]+]]:gr32 = OR32ri killed [[MOVZX32rm16_]], 3072, implicit-def $eflags		; CHECK: [[OR32ri:%[0-9]+]]:gr32 = OR32ri killed [[MOVZX32rm16_]], 3072, implicit-def $eflags
; CHECK: [[COPY3:%[0-9]+]]:gr16 = COPY killed [[OR32ri]].sub_16bit		; CHECK: [[COPY3:%[0-9]+]]:gr16 = COPY killed [[OR32ri]].sub_16bit
; CHECK: MOV16mr %stack.2, 1, $noreg, 0, $noreg, killed [[COPY3]] :: (store 2 into %stack.2)		; CHECK: MOV16mr %stack.2, 1, $noreg, 0, $noreg, killed [[COPY3]] :: (store 2 into %stack.2)
; CHECK: FLDCW16m %stack.2, 1, $noreg, 0, $noreg, implicit-def $fpsw, implicit-def $fpcw :: (load 2 from %stack.2)		; CHECK: FLDCW16m %stack.2, 1, $noreg, 0, $noreg, implicit-def $fpsw, implicit-def $fpcw :: (load 2 from %stack.2)
; CHECK: IST_Fp64m64 %stack.0, 1, $noreg, 0, $noreg, [[LD_Fp64m]], implicit-def $fpsw, implicit $fpcw		; CHECK: IST_Fp64m64 %stack.0, 1, $noreg, 0, $noreg, [[LD_Fp64m]], implicit-def $fpsw, implicit $fpcw
; CHECK: FLDCW16m %stack.1, 1, $noreg, 0, $noreg, implicit-def $fpsw, implicit-def $fpcw :: (load 2 from %stack.1)		; CHECK: FLDCW16m %stack.1, 1, $noreg, 0, $noreg, implicit-def $fpsw, implicit-def $fpcw :: (load 2 from %stack.1)
; CHECK: [[MOVZX32rr8_:%[0-9]+]]:gr32 = MOVZX32rr8 killed [[SETCCr]]		; CHECK: [[MOVZX32rr8_:%[0-9]+]]:gr32 = MOVZX32rr8 killed [[SETCCr]]
; CHECK: [[SHL32ri:%[0-9]+]]:gr32 = SHL32ri [[MOVZX32rr8_]], 31, implicit-def dead $eflags		; CHECK: [[SHL32ri:%[0-9]+]]:gr32 = SHL32ri [[MOVZX32rr8_]], 31, implicit-def dead $eflags
; CHECK: [[XOR32rm:%[0-9]+]]:gr32 = XOR32rm [[SHL32ri]], %stack.0, 1, $noreg, 4, $noreg, implicit-def dead $eflags :: (load 4 from %stack.0 + 4)		; CHECK: [[XOR32rm:%[0-9]+]]:gr32 = XOR32rm [[SHL32ri]], %stack.0, 1, $noreg, 4, $noreg, implicit-def dead $eflags :: (load 4 from %stack.0 + 4)
; CHECK: [[MOV32rm:%[0-9]+]]:gr32 = MOV32rm %stack.0, 1, $noreg, 0, $noreg :: (load 4 from %stack.0, align 8)		; CHECK: [[MOV32rm:%[0-9]+]]:gr32 = MOV32rm %stack.0, 1, $noreg, 0, $noreg :: (load 4 from %stack.0, align 8)
; CHECK: $eax = COPY [[MOV32rm]]		; CHECK: $eax = COPY [[MOV32rm]]
; CHECK: $edx = COPY [[XOR32rm]]		; CHECK: $edx = COPY [[XOR32rm]]
; CHECK: RET 0, $eax, $edx		; CHECK: RET 0, $eax, $edx
%result = call i64 @llvm.experimental.constrained.fptoui.i64.f64(double %x, metadata !"fpexcept.strict") #0		%result = call i64 @llvm.experimental.constrained.fptoui.i64.f64(double %x, metadata !"fpexcept.strict") #0
ret i64 %result		ret i64 %result
}		}

define i8 @f20s8(double %x) #0 {		define i8 @f20s8(double %x) #0 {
entry:		entry:
; CHECK-LABEL: name: f20s8		; CHECK-LABEL: name: f20s8
; CHECK: [[CVTTSD2SIrm:%[0-9]+]]:gr32 = CVTTSD2SIrm %fixed-stack.0, 1, $noreg, 0, $noreg, implicit $mxcsr :: (load 8 from %fixed-stack.0, align 16)		; CHECK: [[CVTTSD2SIrm:%[0-9]+]]:gr32 = fpexcept CVTTSD2SIrm %fixed-stack.0, 1, $noreg, 0, $noreg, implicit $mxcsr :: (load 8 from %fixed-stack.0, align 16)
; CHECK: [[COPY:%[0-9]+]]:gr32_abcd = COPY [[CVTTSD2SIrm]]		; CHECK: [[COPY:%[0-9]+]]:gr32_abcd = COPY [[CVTTSD2SIrm]]
; CHECK: [[COPY1:%[0-9]+]]:gr8 = COPY [[COPY]].sub_8bit		; CHECK: [[COPY1:%[0-9]+]]:gr8 = COPY [[COPY]].sub_8bit
; CHECK: $al = COPY [[COPY1]]		; CHECK: $al = COPY [[COPY1]]
; CHECK: RET 0, $al		; CHECK: RET 0, $al
%result = call i8 @llvm.experimental.constrained.fptosi.i8.f64(double %x, metadata !"fpexcept.strict") #0		%result = call i8 @llvm.experimental.constrained.fptosi.i8.f64(double %x, metadata !"fpexcept.strict") #0
ret i8 %result		ret i8 %result
}		}

define i16 @f20s16(double %x) #0 {		define i16 @f20s16(double %x) #0 {
entry:		entry:
; CHECK-LABEL: name: f20s16		; CHECK-LABEL: name: f20s16
; CHECK: [[CVTTSD2SIrm:%[0-9]+]]:gr32 = CVTTSD2SIrm %fixed-stack.0, 1, $noreg, 0, $noreg, implicit $mxcsr :: (load 8 from %fixed-stack.0, align 16)		; CHECK: [[CVTTSD2SIrm:%[0-9]+]]:gr32 = fpexcept CVTTSD2SIrm %fixed-stack.0, 1, $noreg, 0, $noreg, implicit $mxcsr :: (load 8 from %fixed-stack.0, align 16)
; CHECK: [[COPY:%[0-9]+]]:gr16 = COPY [[CVTTSD2SIrm]].sub_16bit		; CHECK: [[COPY:%[0-9]+]]:gr16 = COPY [[CVTTSD2SIrm]].sub_16bit
; CHECK: $ax = COPY [[COPY]]		; CHECK: $ax = COPY [[COPY]]
; CHECK: RET 0, $ax		; CHECK: RET 0, $ax
%result = call i16 @llvm.experimental.constrained.fptosi.i16.f64(double %x, metadata !"fpexcept.strict") #0		%result = call i16 @llvm.experimental.constrained.fptosi.i16.f64(double %x, metadata !"fpexcept.strict") #0
ret i16 %result		ret i16 %result
}		}

define i32 @f20u(double %x) #0 {		define i32 @f20u(double %x) #0 {
entry:		entry:
; CHECK-LABEL: name: f20u		; CHECK-LABEL: name: f20u
; CHECK: [[MOVSDrm_alt:%[0-9]+]]:fr64 = MOVSDrm_alt %fixed-stack.0, 1, $noreg, 0, $noreg :: (load 8 from %fixed-stack.0, align 16)		; CHECK: [[MOVSDrm_alt:%[0-9]+]]:fr64 = MOVSDrm_alt %fixed-stack.0, 1, $noreg, 0, $noreg :: (load 8 from %fixed-stack.0, align 16)
; CHECK: [[MOVSDrm_alt1:%[0-9]+]]:fr64 = MOVSDrm_alt $noreg, 1, $noreg, %const.0, $noreg :: (load 8 from constant-pool)		; CHECK: [[MOVSDrm_alt1:%[0-9]+]]:fr64 = MOVSDrm_alt $noreg, 1, $noreg, %const.0, $noreg :: (load 8 from constant-pool)
; CHECK: COMISDrr [[MOVSDrm_alt1]], [[MOVSDrm_alt]], implicit-def $eflags, implicit $mxcsr		; CHECK: fpexcept COMISDrr [[MOVSDrm_alt1]], [[MOVSDrm_alt]], implicit-def $eflags, implicit $mxcsr
; CHECK: [[FsFLD0SD:%[0-9]+]]:fr64 = FsFLD0SD		; CHECK: [[FsFLD0SD:%[0-9]+]]:fr64 = FsFLD0SD
; CHECK: JCC_1		; CHECK: JCC_1
; CHECK: [[PHI:%[0-9]+]]:fr64 = PHI [[MOVSDrm_alt1]], {{.}}, [[FsFLD0SD]], {{.}}		; CHECK: [[PHI:%[0-9]+]]:fr64 = PHI [[MOVSDrm_alt1]], {{.}}, [[FsFLD0SD]], {{.}}
; CHECK: [[SETCCr:%[0-9]+]]:gr8 = SETCCr 6, implicit $eflags		; CHECK: [[SETCCr:%[0-9]+]]:gr8 = SETCCr 6, implicit $eflags
; CHECK: [[MOVZX32rr8_:%[0-9]+]]:gr32 = MOVZX32rr8 killed [[SETCCr]]		; CHECK: [[MOVZX32rr8_:%[0-9]+]]:gr32 = MOVZX32rr8 killed [[SETCCr]]
; CHECK: [[SHL32ri:%[0-9]+]]:gr32 = SHL32ri [[MOVZX32rr8_]], 31, implicit-def dead $eflags		; CHECK: [[SHL32ri:%[0-9]+]]:gr32 = SHL32ri [[MOVZX32rr8_]], 31, implicit-def dead $eflags
; CHECK: [[SUBSDrr:%[0-9]+]]:fr64 = SUBSDrr [[MOVSDrm_alt]], killed [[PHI]], implicit $mxcsr		; CHECK: [[SUBSDrr:%[0-9]+]]:fr64 = fpexcept SUBSDrr [[MOVSDrm_alt]], killed [[PHI]], implicit $mxcsr
; CHECK: [[CVTTSD2SIrr:%[0-9]+]]:gr32 = CVTTSD2SIrr killed [[SUBSDrr]], implicit $mxcsr		; CHECK: [[CVTTSD2SIrr:%[0-9]+]]:gr32 = fpexcept CVTTSD2SIrr killed [[SUBSDrr]], implicit $mxcsr
; CHECK: [[XOR32rr:%[0-9]+]]:gr32 = XOR32rr [[CVTTSD2SIrr]], killed [[SHL32ri]], implicit-def dead $eflags		; CHECK: [[XOR32rr:%[0-9]+]]:gr32 = XOR32rr [[CVTTSD2SIrr]], killed [[SHL32ri]], implicit-def dead $eflags
; CHECK: $eax = COPY [[XOR32rr]]		; CHECK: $eax = COPY [[XOR32rr]]
; CHECK: RET 0, $eax		; CHECK: RET 0, $eax
%result = call i32 @llvm.experimental.constrained.fptoui.i32.f64(double %x, metadata !"fpexcept.strict") #0		%result = call i32 @llvm.experimental.constrained.fptoui.i32.f64(double %x, metadata !"fpexcept.strict") #0
ret i32 %result		ret i32 %result
}		}

attributes #0 = { strictfp }		attributes #0 = { strictfp }

declare double @llvm.experimental.constrained.sitofp.f64.i8(i8, metadata, metadata)		declare double @llvm.experimental.constrained.sitofp.f64.i8(i8, metadata, metadata)
declare double @llvm.experimental.constrained.sitofp.f64.i16(i16, metadata, metadata)		declare double @llvm.experimental.constrained.sitofp.f64.i16(i16, metadata, metadata)
declare i32 @llvm.experimental.constrained.fptoui.i32.f64(double, metadata)		declare i32 @llvm.experimental.constrained.fptoui.i32.f64(double, metadata)
declare i64 @llvm.experimental.constrained.fptoui.i64.f64(double, metadata)		declare i64 @llvm.experimental.constrained.fptoui.i64.f64(double, metadata)
declare i8 @llvm.experimental.constrained.fptosi.i8.f64(double, metadata)		declare i8 @llvm.experimental.constrained.fptosi.i8.f64(double, metadata)
declare i16 @llvm.experimental.constrained.fptosi.i16.f64(double, metadata)		declare i16 @llvm.experimental.constrained.fptosi.i16.f64(double, metadata)

llvm/test/CodeGen/X86/vector-constrained-fp-intrinsics-flags.ll

	; RUN: llc -O3 -mtriple=x86_64-pc-linux -stop-after=finalize-isel < %s \| FileCheck %s			; RUN: llc -O3 -mtriple=x86_64-pc-linux -stop-after=finalize-isel < %s \| FileCheck %s

	define <1 x float> @constrained_vector_fadd_v1f32() #0 {			define <1 x float> @constrained_vector_fadd_v1f32() #0 {
	; CHECK-LABEL: name: constrained_vector_fadd_v1f32			; CHECK-LABEL: name: constrained_vector_fadd_v1f32
	; CHECK: [[MOVSSrm_alt:%[0-9]+]]:fr32 = MOVSSrm_alt $rip, 1, $noreg, %const.0, $noreg :: (load 4 from constant-pool)			; CHECK: [[MOVSSrm_alt:%[0-9]+]]:fr32 = MOVSSrm_alt $rip, 1, $noreg, %const.0, $noreg :: (load 4 from constant-pool)
	; CHECK: [[ADDSSrm:%[0-9]+]]:fr32 = ADDSSrm [[MOVSSrm_alt]], $rip, 1, $noreg, %const.1, $noreg, implicit $mxcsr :: (load 4 from constant-pool)			; CHECK: [[ADDSSrm:%[0-9]+]]:fr32 = fpexcept ADDSSrm [[MOVSSrm_alt]], $rip, 1, $noreg, %const.1, $noreg, implicit $mxcsr :: (load 4 from constant-pool)
	; CHECK: $xmm0 = COPY [[ADDSSrm]]			; CHECK: $xmm0 = COPY [[ADDSSrm]]
	; CHECK: RET 0, $xmm0			; CHECK: RET 0, $xmm0
	entry:			entry:
	%add = call <1 x float> @llvm.experimental.constrained.fadd.v1f32(<1 x float> <float 0x7FF0000000000000>, <1 x float> <float 1.0>, metadata !"round.dynamic", metadata !"fpexcept.strict") #0			%add = call <1 x float> @llvm.experimental.constrained.fadd.v1f32(<1 x float> <float 0x7FF0000000000000>, <1 x float> <float 1.0>, metadata !"round.dynamic", metadata !"fpexcept.strict") #0
	ret <1 x float> %add			ret <1 x float> %add
	}			}

	define <3 x float> @constrained_vector_fadd_v3f32() #0 {			define <3 x float> @constrained_vector_fadd_v3f32() #0 {
	; CHECK-LABEL: name: constrained_vector_fadd_v3f32			; CHECK-LABEL: name: constrained_vector_fadd_v3f32
	; CHECK: [[FsFLD0SS:%[0-9]+]]:fr32 = FsFLD0SS			; CHECK: [[FsFLD0SS:%[0-9]+]]:fr32 = FsFLD0SS
	; CHECK: [[MOVSSrm_alt:%[0-9]+]]:fr32 = MOVSSrm_alt $rip, 1, $noreg, %const.0, $noreg :: (load 4 from constant-pool)			; CHECK: [[MOVSSrm_alt:%[0-9]+]]:fr32 = MOVSSrm_alt $rip, 1, $noreg, %const.0, $noreg :: (load 4 from constant-pool)
	; CHECK: [[ADDSSrr:%[0-9]+]]:fr32 = ADDSSrr [[MOVSSrm_alt]], killed [[FsFLD0SS]], implicit $mxcsr			; CHECK: [[ADDSSrr:%[0-9]+]]:fr32 = fpexcept ADDSSrr [[MOVSSrm_alt]], killed [[FsFLD0SS]], implicit $mxcsr
	; CHECK: [[ADDSSrm:%[0-9]+]]:fr32 = ADDSSrm [[MOVSSrm_alt]], $rip, 1, $noreg, %const.1, $noreg, implicit $mxcsr :: (load 4 from constant-pool)			; CHECK: [[ADDSSrm:%[0-9]+]]:fr32 = fpexcept ADDSSrm [[MOVSSrm_alt]], $rip, 1, $noreg, %const.1, $noreg, implicit $mxcsr :: (load 4 from constant-pool)
	; CHECK: [[ADDSSrm1:%[0-9]+]]:fr32 = ADDSSrm [[MOVSSrm_alt]], $rip, 1, $noreg, %const.2, $noreg, implicit $mxcsr :: (load 4 from constant-pool)			; CHECK: [[ADDSSrm1:%[0-9]+]]:fr32 = fpexcept ADDSSrm [[MOVSSrm_alt]], $rip, 1, $noreg, %const.2, $noreg, implicit $mxcsr :: (load 4 from constant-pool)
	; CHECK: [[COPY:%[0-9]+]]:vr128 = COPY [[ADDSSrm1]]			; CHECK: [[COPY:%[0-9]+]]:vr128 = COPY [[ADDSSrm1]]
	; CHECK: [[COPY1:%[0-9]+]]:vr128 = COPY [[ADDSSrm]]			; CHECK: [[COPY1:%[0-9]+]]:vr128 = COPY [[ADDSSrm]]
	; CHECK: [[UNPCKLPSrr:%[0-9]+]]:vr128 = UNPCKLPSrr [[COPY1]], killed [[COPY]]			; CHECK: [[UNPCKLPSrr:%[0-9]+]]:vr128 = UNPCKLPSrr [[COPY1]], killed [[COPY]]
	; CHECK: [[COPY2:%[0-9]+]]:vr128 = COPY [[ADDSSrr]]			; CHECK: [[COPY2:%[0-9]+]]:vr128 = COPY [[ADDSSrr]]
	; CHECK: [[UNPCKLPDrr:%[0-9]+]]:vr128 = UNPCKLPDrr [[UNPCKLPSrr]], killed [[COPY2]]			; CHECK: [[UNPCKLPDrr:%[0-9]+]]:vr128 = UNPCKLPDrr [[UNPCKLPSrr]], killed [[COPY2]]
	; CHECK: $xmm0 = COPY [[UNPCKLPDrr]]			; CHECK: $xmm0 = COPY [[UNPCKLPDrr]]
	; CHECK: RET 0, $xmm0			; CHECK: RET 0, $xmm0
	entry:			entry:
	%add = call <3 x float> @llvm.experimental.constrained.fadd.v3f32(			%add = call <3 x float> @llvm.experimental.constrained.fadd.v3f32(
	<3 x float> <float 0xFFFFFFFFE0000000, float 0xFFFFFFFFE0000000,			<3 x float> <float 0xFFFFFFFFE0000000, float 0xFFFFFFFFE0000000,
	float 0xFFFFFFFFE0000000>,			float 0xFFFFFFFFE0000000>,
	<3 x float> <float 2.0, float 1.0, float 0.0>,			<3 x float> <float 2.0, float 1.0, float 0.0>,
	metadata !"round.dynamic",			metadata !"round.dynamic",
	metadata !"fpexcept.strict") #0			metadata !"fpexcept.strict") #0
	ret <3 x float> %add			ret <3 x float> %add
	}			}

	define <4 x double> @constrained_vector_fadd_v4f64() #0 {			define <4 x double> @constrained_vector_fadd_v4f64() #0 {
	; CHECK-LABEL: name: constrained_vector_fadd_v4f64			; CHECK-LABEL: name: constrained_vector_fadd_v4f64
	; CHECK: [[MOVAPDrm:%[0-9]+]]:vr128 = MOVAPDrm $rip, 1, $noreg, %const.0, $noreg :: (load 16 from constant-pool)			; CHECK: [[MOVAPDrm:%[0-9]+]]:vr128 = MOVAPDrm $rip, 1, $noreg, %const.0, $noreg :: (load 16 from constant-pool)
	; CHECK: [[ADDPDrm:%[0-9]+]]:vr128 = ADDPDrm [[MOVAPDrm]], $rip, 1, $noreg, %const.1, $noreg, implicit $mxcsr :: (load 16 from constant-pool)			; CHECK: [[ADDPDrm:%[0-9]+]]:vr128 = fpexcept ADDPDrm [[MOVAPDrm]], $rip, 1, $noreg, %const.1, $noreg, implicit $mxcsr :: (load 16 from constant-pool)
	; CHECK: [[ADDPDrm1:%[0-9]+]]:vr128 = ADDPDrm [[MOVAPDrm]], $rip, 1, $noreg, %const.2, $noreg, implicit $mxcsr :: (load 16 from constant-pool)			; CHECK: [[ADDPDrm1:%[0-9]+]]:vr128 = fpexcept ADDPDrm [[MOVAPDrm]], $rip, 1, $noreg, %const.2, $noreg, implicit $mxcsr :: (load 16 from constant-pool)
	; CHECK: $xmm0 = COPY [[ADDPDrm]]			; CHECK: $xmm0 = COPY [[ADDPDrm]]
	; CHECK: $xmm1 = COPY [[ADDPDrm1]]			; CHECK: $xmm1 = COPY [[ADDPDrm1]]
	; CHECK: RET 0, $xmm0, $xmm1			; CHECK: RET 0, $xmm0, $xmm1
	entry:			entry:
	%add = call <4 x double> @llvm.experimental.constrained.fadd.v4f64(			%add = call <4 x double> @llvm.experimental.constrained.fadd.v4f64(
	<4 x double> <double 0x7FEFFFFFFFFFFFFF, double 0x7FEFFFFFFFFFFFFF,			<4 x double> <double 0x7FEFFFFFFFFFFFFF, double 0x7FEFFFFFFFFFFFFF,
	double 0x7FEFFFFFFFFFFFFF, double 0x7FEFFFFFFFFFFFFF>,			double 0x7FEFFFFFFFFFFFFF, double 0x7FEFFFFFFFFFFFFF>,
	<4 x double> <double 1.000000e+00, double 1.000000e-01,			<4 x double> <double 1.000000e+00, double 1.000000e-01,
	Show All 9 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[FPEnv] Default NoFPExcept SDNodeFlag to false
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 235882

llvm/include/llvm/CodeGen/ISDOpcodes.h

llvm/include/llvm/CodeGen/SelectionDAGISel.h

llvm/include/llvm/CodeGen/SelectionDAGNodes.h

llvm/lib/CodeGen/SelectionDAG/InstrEmitter.cpp

llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp

llvm/lib/CodeGen/SelectionDAG/SelectionDAGDumper.cpp

llvm/lib/CodeGen/SelectionDAG/SelectionDAGISel.cpp

llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp

llvm/lib/Target/SystemZ/SystemZISelLowering.h

llvm/lib/Target/X86/X86ISelLowering.h

llvm/test/CodeGen/X86/fp-intrinsics-flags-x86_64.ll

llvm/test/CodeGen/X86/fp-intrinsics-flags.ll

llvm/test/CodeGen/X86/vector-constrained-fp-intrinsics-flags.ll

This is an archive of the discontinued LLVM Phabricator instance.

[FPEnv] Default NoFPExcept SDNodeFlag to false
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 235882

llvm/include/llvm/CodeGen/ISDOpcodes.h

llvm/include/llvm/CodeGen/SelectionDAGISel.h

llvm/include/llvm/CodeGen/SelectionDAGNodes.h

llvm/lib/CodeGen/SelectionDAG/InstrEmitter.cpp

llvm/lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp

llvm/lib/CodeGen/SelectionDAG/SelectionDAGDumper.cpp

llvm/lib/CodeGen/SelectionDAG/SelectionDAGISel.cpp

llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp

llvm/lib/Target/SystemZ/SystemZISelLowering.h

llvm/lib/Target/X86/X86ISelLowering.h

llvm/test/CodeGen/X86/fp-intrinsics-flags-x86_64.ll

llvm/test/CodeGen/X86/fp-intrinsics-flags.ll

llvm/test/CodeGen/X86/vector-constrained-fp-intrinsics-flags.ll

[FPEnv] Default NoFPExcept SDNodeFlag to false
ClosedPublic