Diff 201555

llvm/trunk/lib/CodeGen/SelectionDAG/InstrEmitter.h

Show All 36 Lines	class LLVM_LIBRARY_VISIBILITY InstrEmitter {

/// EmitCopyFromReg - Generate machine code for a CopyFromReg node or an		/// EmitCopyFromReg - Generate machine code for a CopyFromReg node or an
/// implicit physical register output.		/// implicit physical register output.
void EmitCopyFromReg(SDNode *Node, unsigned ResNo,		void EmitCopyFromReg(SDNode *Node, unsigned ResNo,
bool IsClone, bool IsCloned,		bool IsClone, bool IsCloned,
unsigned SrcReg,		unsigned SrcReg,
DenseMap<SDValue, unsigned> &VRBaseMap);		DenseMap<SDValue, unsigned> &VRBaseMap);

/// getDstOfOnlyCopyToRegUse - If the only use of the specified result number
/// of node is a CopyToReg, return its destination register. Return 0
/// otherwise.
unsigned getDstOfOnlyCopyToRegUse(SDNode *Node,
unsigned ResNo) const;

void CreateVirtualRegisters(SDNode *Node,		void CreateVirtualRegisters(SDNode *Node,
MachineInstrBuilder &MIB,		MachineInstrBuilder &MIB,
const MCInstrDesc &II,		const MCInstrDesc &II,
bool IsClone, bool IsCloned,		bool IsClone, bool IsCloned,
DenseMap<SDValue, unsigned> &VRBaseMap);		DenseMap<SDValue, unsigned> &VRBaseMap);

/// getVR - Return the virtual register corresponding to the specified result		/// getVR - Return the virtual register corresponding to the specified result
/// of the specified node.		/// of the specified node.
▲ Show 20 Lines • Show All 90 Lines • Show Last 20 Lines

llvm/trunk/lib/CodeGen/SelectionDAG/InstrEmitter.cpp

Show First 20 Lines • Show All 180 Lines • ▼ Show 20 Lines	EmitCopyFromReg(SDNode *Node, unsigned ResNo, bool IsClone, bool IsCloned,
SDValue Op(Node, ResNo);		SDValue Op(Node, ResNo);
if (IsClone)		if (IsClone)
VRBaseMap.erase(Op);		VRBaseMap.erase(Op);
bool isNew = VRBaseMap.insert(std::make_pair(Op, VRBase)).second;		bool isNew = VRBaseMap.insert(std::make_pair(Op, VRBase)).second;
(void)isNew; // Silence compiler warning.		(void)isNew; // Silence compiler warning.
assert(isNew && "Node emitted out of order - early");		assert(isNew && "Node emitted out of order - early");
}		}

/// getDstOfOnlyCopyToRegUse - If the only use of the specified result number
/// of node is a CopyToReg, return its destination register. Return 0
/// otherwise.
///
/// \param Node  the node whose single user is inspected.
/// \param ResNo the result number of \p Node that must be the value operand
///              (operand 2) of the CopyToReg.
/// \returns the CopyToReg destination register when it is a virtual register;
///          0 in every other case.
unsigned InstrEmitter::getDstOfOnlyCopyToRegUse(SDNode *Node,
                                                unsigned ResNo) const {
  if (!Node->hasOneUse())
    return 0;

  // use_begin() yields an iterator over the users; dereference it to obtain
  // the user node itself.
  SDNode *User = *Node->use_begin();
  if (User->getOpcode() == ISD::CopyToReg &&
      User->getOperand(2).getNode() == Node &&
      User->getOperand(2).getResNo() == ResNo) {
    unsigned Reg = cast<RegisterSDNode>(User->getOperand(1))->getReg();
    // Only a virtual destination register is reported to the caller.
    if (TargetRegisterInfo::isVirtualRegister(Reg))
      return Reg;
  }
  return 0;
}

void InstrEmitter::CreateVirtualRegisters(SDNode *Node,		void InstrEmitter::CreateVirtualRegisters(SDNode *Node,
MachineInstrBuilder &MIB,		MachineInstrBuilder &MIB,
const MCInstrDesc &II,		const MCInstrDesc &II,
bool IsClone, bool IsCloned,		bool IsClone, bool IsCloned,
DenseMap<SDValue, unsigned> &VRBaseMap) {		DenseMap<SDValue, unsigned> &VRBaseMap) {
assert(Node->getMachineOpcode() != TargetOpcode::IMPLICIT_DEF &&		assert(Node->getMachineOpcode() != TargetOpcode::IMPLICIT_DEF &&
"IMPLICIT_DEF should have been handled as a special case elsewhere!");		"IMPLICIT_DEF should have been handled as a special case elsewhere!");

▲ Show 20 Lines • Show All 66 Lines • ▼ Show 20 Lines

/// getVR - Return the virtual register corresponding to the specified result		/// getVR - Return the virtual register corresponding to the specified result
/// of the specified node.		/// of the specified node.
unsigned InstrEmitter::getVR(SDValue Op,		unsigned InstrEmitter::getVR(SDValue Op,
DenseMap<SDValue, unsigned> &VRBaseMap) {		DenseMap<SDValue, unsigned> &VRBaseMap) {
if (Op.isMachineOpcode() &&		if (Op.isMachineOpcode() &&
Op.getMachineOpcode() == TargetOpcode::IMPLICIT_DEF) {		Op.getMachineOpcode() == TargetOpcode::IMPLICIT_DEF) {
// Add an IMPLICIT_DEF instruction before every use.		// Add an IMPLICIT_DEF instruction before every use.
unsigned VReg = getDstOfOnlyCopyToRegUse(Op.getNode(), Op.getResNo());
// IMPLICIT_DEF can produce any type of result so its MCInstrDesc		// IMPLICIT_DEF can produce any type of result so its MCInstrDesc
// does not include operand register class info.		// does not include operand register class info.
if (!VReg) {
const TargetRegisterClass *RC = TLI->getRegClassFor(		const TargetRegisterClass *RC = TLI->getRegClassFor(
Op.getSimpleValueType(), Op.getNode()->isDivergent());		Op.getSimpleValueType(), Op.getNode()->isDivergent());
VReg = MRI->createVirtualRegister(RC);		unsigned VReg = MRI->createVirtualRegister(RC);
}
BuildMI(*MBB, InsertPos, Op.getDebugLoc(),		BuildMI(*MBB, InsertPos, Op.getDebugLoc(),
TII->get(TargetOpcode::IMPLICIT_DEF), VReg);		TII->get(TargetOpcode::IMPLICIT_DEF), VReg);
return VReg;		return VReg;
}		}

DenseMap<SDValue, unsigned>::iterator I = VRBaseMap.find(Op);		DenseMap<SDValue, unsigned>::iterator I = VRBaseMap.find(Op);
assert(I != VRBaseMap.end() && "Node emitted out of order - late");		assert(I != VRBaseMap.end() && "Node emitted out of order - late");
return I->second;		return I->second;
▲ Show 20 Lines • Show All 701 Lines • ▼ Show 20 Lines
#endif		#endif
llvm_unreachable("This target-independent node should have been selected!");		llvm_unreachable("This target-independent node should have been selected!");
case ISD::EntryToken:		case ISD::EntryToken:
llvm_unreachable("EntryToken should have been excluded from the schedule!");		llvm_unreachable("EntryToken should have been excluded from the schedule!");
case ISD::MERGE_VALUES:		case ISD::MERGE_VALUES:
case ISD::TokenFactor: // fall thru		case ISD::TokenFactor: // fall thru
break;		break;
case ISD::CopyToReg: {		case ISD::CopyToReg: {
unsigned SrcReg;		unsigned DestReg = cast<RegisterSDNode>(Node->getOperand(1))->getReg();
SDValue SrcVal = Node->getOperand(2);		SDValue SrcVal = Node->getOperand(2);
		if (TargetRegisterInfo::isVirtualRegister(DestReg) &&
		SrcVal.isMachineOpcode() &&
		SrcVal.getMachineOpcode() == TargetOpcode::IMPLICIT_DEF) {
		// Instead of building a COPY to that vreg destination, build an
		// IMPLICIT_DEF instruction.
		BuildMI(*MBB, InsertPos, Node->getDebugLoc(),
		TII->get(TargetOpcode::IMPLICIT_DEF), DestReg);
		break;
		}
		unsigned SrcReg;
if (RegisterSDNode *R = dyn_cast<RegisterSDNode>(SrcVal))		if (RegisterSDNode *R = dyn_cast<RegisterSDNode>(SrcVal))
SrcReg = R->getReg();		SrcReg = R->getReg();
else		else
SrcReg = getVR(SrcVal, VRBaseMap);		SrcReg = getVR(SrcVal, VRBaseMap);

unsigned DestReg = cast<RegisterSDNode>(Node->getOperand(1))->getReg();
if (SrcReg == DestReg) // Coalesced away the copy? Ignore.		if (SrcReg == DestReg) // Coalesced away the copy? Ignore.
break;		break;

BuildMI(*MBB, InsertPos, Node->getDebugLoc(), TII->get(TargetOpcode::COPY),		BuildMI(*MBB, InsertPos, Node->getDebugLoc(), TII->get(TargetOpcode::COPY),
DestReg).addReg(SrcReg);		DestReg).addReg(SrcReg);
break;		break;
}		}
case ISD::CopyFromReg: {		case ISD::CopyFromReg: {
▲ Show 20 Lines • Show All 146 Lines • Show Last 20 Lines

llvm/trunk/test/CodeGen/AMDGPU/i1-copy-phi.ll

	Show All 31 Lines

	bb6: ; preds = %bb4, %bb3			bb6: ; preds = %bb4, %bb3
	ret void			ret void
	}			}

	declare i32 @llvm.amdgcn.workitem.id.x() #0			declare i32 @llvm.amdgcn.workitem.id.x() #0

	attributes #0 = { nounwind readnone }			attributes #0 = { nounwind readnone }

				; Make sure this won't crash.
				; SI-LABEL: {{^}}vcopy_i1_undef
				; SI: v_cndmask_b32_e64
				; SI: v_cndmask_b32_e64
				define <2 x float> @vcopy_i1_undef(<2 x float> addrspace(1)* %p) {
				entry:
				br i1 undef, label %exit, label %false

				false:
				%x = load <2 x float>, <2 x float> addrspace(1)* %p
				%cmp = fcmp one <2 x float> %x, zeroinitializer
				br label %exit

				exit:
				%c = phi <2 x i1> [ undef, %entry ], [ %cmp, %false ]
				%ret = select <2 x i1> %c, <2 x float> <float 2.0, float 2.0>, <2 x float> <float 4.0, float 4.0>
				ret <2 x float> %ret
				}

llvm/trunk/test/CodeGen/AMDGPU/implicit-def-muse.ll

				; RUN: llc -march=amdgcn -stop-after=amdgpu-isel -verify-machineinstrs -o - %s | FileCheck %s

				; CHECK-LABEL: vcopy_i1_undef
				; CHECK: IMPLICIT_DEF
				; CHECK-NOT: COPY
				; CHECK: IMPLICIT_DEF
				; CHECK-NOT: COPY
				; CHECK: .false:
				define <2 x float> @vcopy_i1_undef(<2 x float> addrspace(1)* %p) {
				entry:
				br i1 undef, label %exit, label %false

				false:
				%x = load <2 x float>, <2 x float> addrspace(1)* %p
				%cmp = fcmp one <2 x float> %x, zeroinitializer
				br label %exit

				exit:
				%c = phi <2 x i1> [ undef, %entry ], [ %cmp, %false ]
				%ret = select <2 x i1> %c, <2 x float> <float 2.0, float 2.0>, <2 x float> <float 4.0, float 4.0>
				ret <2 x float> %ret
				}

This is an archive of the discontinued LLVM Phabricator instance.

[SelectionDAG] Enhance the simplification of `copyto` from `implicit-def`.
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 201555

llvm/trunk/lib/CodeGen/SelectionDAG/InstrEmitter.h

llvm/trunk/lib/CodeGen/SelectionDAG/InstrEmitter.cpp

llvm/trunk/test/CodeGen/AMDGPU/i1-copy-phi.ll

llvm/trunk/test/CodeGen/AMDGPU/implicit-def-muse.ll

This is an archive of the discontinued LLVM Phabricator instance.

[SelectionDAG] Enhance the simplification of `copyto` from `implicit-def`.
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 201555

llvm/trunk/lib/CodeGen/SelectionDAG/InstrEmitter.h

llvm/trunk/lib/CodeGen/SelectionDAG/InstrEmitter.cpp

llvm/trunk/test/CodeGen/AMDGPU/i1-copy-phi.ll

llvm/trunk/test/CodeGen/AMDGPU/implicit-def-muse.ll

[SelectionDAG] Enhance the simplification of `copyto` from `implicit-def`.
ClosedPublic