Diff 327818

llvm/lib/CodeGen/LiveIntervals.cpp

	Show First 20 Lines • Show All 696 Lines • ▼ Show 20 Lines

	//===----------------------------------------------------------------------===//			//===----------------------------------------------------------------------===//
	// Register allocator hooks.			// Register allocator hooks.
	//			//

	void LiveIntervals::addKillFlags(const VirtRegMap *VRM) {			void LiveIntervals::addKillFlags(const VirtRegMap *VRM) {
	// Keep track of regunit ranges.			// Keep track of regunit ranges.
	SmallVector<std::pair<const LiveRange*, LiveRange::const_iterator>, 8> RU;			SmallVector<std::pair<const LiveRange*, LiveRange::const_iterator>, 8> RU;
	// Keep track of subregister ranges.
	SmallVector<std::pair<const LiveInterval::SubRange*,
	LiveRange::const_iterator>, 4> SRs;
	arsenmUnsubmitted Not Done Reply Inline Actions What was the point of copying out the subranges here before? arsenm: What was the point of copying out the subranges here before?
	bsaleilUnsubmitted Done Reply Inline Actions To be honest, I don't understand why we copied the subranges here. @MatzeB, do you have any idea? bsaleil: To be honest, I don't understand why we copied the subranges here. @MatzeB, do you have any…

	for (unsigned i = 0, e = MRI->getNumVirtRegs(); i != e; ++i) {			for (unsigned i = 0, e = MRI->getNumVirtRegs(); i != e; ++i) {
	Register Reg = Register::index2VirtReg(i);			Register Reg = Register::index2VirtReg(i);
	if (MRI->reg_nodbg_empty(Reg))			if (MRI->reg_nodbg_empty(Reg))
	continue;			continue;
	const LiveInterval &LI = getInterval(Reg);			const LiveInterval &LI = getInterval(Reg);
	if (LI.empty())			if (LI.empty())
	continue;			continue;

	// Find the regunit intervals for the assigned register. They may overlap			// Find the regunit intervals for the assigned register. They may overlap
	// the virtual register live range, cancelling any kills.			// the virtual register live range, cancelling any kills.
	RU.clear();			RU.clear();
	for (MCRegUnitIterator Unit(VRM->getPhys(Reg), TRI); Unit.isValid();			for (MCRegUnitIterator Unit(VRM->getPhys(Reg), TRI); Unit.isValid();
	++Unit) {			++Unit) {
	const LiveRange &RURange = getRegUnit(*Unit);			const LiveRange &RURange = getRegUnit(*Unit);
	if (RURange.empty())			if (RURange.empty())
	continue;			continue;
	RU.push_back(std::make_pair(&RURange, RURange.find(LI.begin()->end)));			RU.push_back(std::make_pair(&RURange, RURange.find(LI.begin()->end)));
	}			}

	if (MRI->subRegLivenessEnabled()) {
	SRs.clear();
	for (const LiveInterval::SubRange &SR : LI.subranges()) {
	SRs.push_back(std::make_pair(&SR, SR.find(LI.begin()->end)));
	}
	}

	// Every instruction that kills Reg corresponds to a segment range end			// Every instruction that kills Reg corresponds to a segment range end
	// point.			// point.
	for (LiveInterval::const_iterator RI = LI.begin(), RE = LI.end(); RI != RE;			for (LiveInterval::const_iterator RI = LI.begin(), RE = LI.end(); RI != RE;
	++RI) {			++RI) {
	// A block index indicates an MBB edge.			// A block index indicates an MBB edge.
	if (RI->end.isBlock())			if (RI->end.isBlock())
	continue;			continue;
	MachineInstr *MI = getInstructionFromIndex(RI->end);			MachineInstr *MI = getInstructionFromIndex(RI->end);
	if (!MI)			if (!MI)
	continue;			continue;

	// Check if any of the regunits are live beyond the end of RI. That could			// Check if any of the regunits are live beyond the end of RI. That could
	// happen when a physreg is defined as a copy of a virtreg:			// happen when a physreg is defined as a copy of a virtreg:
	//			//
	// %eax = COPY %5			// %eax = COPY %5
	// FOO %5 <--- MI, cancel kill because %eax is live.			// FOO %5 <--- MI, cancel kill because %eax is live.
	// BAR killed %eax			// BAR killed %eax
	//			//
	// There should be no kill flag on FOO when %5 is rewritten as %eax.			// There should be no kill flag on FOO when %5 is rewritten as %eax.
	for (auto &RUP : RU) {			for (auto &RUP : RU) {
	const LiveRange &RURange = *RUP.first;			const LiveRange &RURange = *RUP.first;
	LiveRange::const_iterator &I = RUP.second;			LiveRange::const_iterator &I = RUP.second;
	if (I == RURange.end())			if (I == RURange.end())
	continue;			continue;
	I = RURange.advanceTo(I, RI->end);			I = RURange.advanceTo(I, RI->end);
	if (I == RURange.end() \|\| I->start >= RI->end)			if (I == RURange.end() \|\| I->start >= RI->end)
	continue;			continue;
				arsenmUnsubmitted Done Reply Inline Actions This looks like a separate NFC change arsenm: This looks like a separate NFC change
				bsaleilUnsubmitted Done Reply Inline Actions you're right, I removed that. bsaleil: you're right, I removed that.
	// I is overlapping RI.			// I is overlapping RI.
	goto CancelKill;			goto CancelKill;
	}			}

	if (MRI->subRegLivenessEnabled()) {			if (MRI->subRegLivenessEnabled()) {
	// When reading a partial undefined value we must not add a kill flag.			// When reading a partial undefined value we must not add a kill flag.
	// The regalloc might have used the undef lane for something else.			// The regalloc might have used the undef lane for something else.
	// Example:			// Example:
	// %1 = ... ; R32: %1			// %1 = ... ; R32: %1
	// %2:high16 = ... ; R64: %2			// %2:high16 = ... ; R64: %2
	// = read killed %2 ; R64: %2			// = read killed %2 ; R64: %2
	// = read %1 ; R32: %1			// = read %1 ; R32: %1
	// The <kill> flag is correct for %2, but the register allocator may			// The <kill> flag is correct for %2, but the register allocator may
	// assign R0L to %1, and R0 to %2 because the low 32bits of R0			// assign R0L to %1, and R0 to %2 because the low 32bits of R0
	// are actually never written by %2. After assignment the <kill>			// are actually never written by %2. After assignment the <kill>
	// flag at the read instruction is invalid.			// flag at the read instruction is invalid.
	LaneBitmask DefinedLanesMask;			LaneBitmask DefinedLanesMask;
	if (!SRs.empty()) {			if (LI.hasSubRanges()) {
	// Compute a mask of lanes that are defined.			// Compute a mask of lanes that are defined.
	DefinedLanesMask = LaneBitmask::getNone();			DefinedLanesMask = LaneBitmask::getNone();
	for (auto &SRP : SRs) {			for (const LiveInterval::SubRange &SR : LI.subranges())
	const LiveInterval::SubRange &SR = *SRP.first;			for (const LiveRange::Segment &Segment : SR.segments) {
	LiveRange::const_iterator &I = SRP.second;			if (Segment.start >= RI->end)
	if (I == SR.end())			break;
	continue;			if (Segment.end == RI->end) {
	I = SR.advanceTo(I, RI->end);
	if (I == SR.end() \|\| I->start >= RI->end)
	continue;
	// I is overlapping RI
	DefinedLanesMask \|= SR.LaneMask;			DefinedLanesMask \|= SR.LaneMask;
				break;
				}
	}			}
	} else			} else
	DefinedLanesMask = LaneBitmask::getAll();			DefinedLanesMask = LaneBitmask::getAll();

	bool IsFullWrite = false;			bool IsFullWrite = false;
	for (const MachineOperand &MO : MI->operands()) {			for (const MachineOperand &MO : MI->operands()) {
	if (!MO.isReg() \|\| MO.getReg() != Reg)			if (!MO.isReg() \|\| MO.getReg() != Reg)
	continue;			continue;
	if (MO.isUse()) {			if (MO.isUse()) {
	// Reading any undefined lanes?			// Reading any undefined lanes?
	LaneBitmask UseMask = TRI->getSubRegIndexLaneMask(MO.getSubReg());			unsigned SubReg = MO.getSubReg();
				LaneBitmask UseMask = SubReg ? TRI->getSubRegIndexLaneMask(SubReg)
				: MRI->getMaxLaneMaskForVReg(Reg);
	if ((UseMask & ~DefinedLanesMask).any())			if ((UseMask & ~DefinedLanesMask).any())
	goto CancelKill;			goto CancelKill;
	} else if (MO.getSubReg() == 0) {			} else if (MO.getSubReg() == 0) {
				arsenmUnsubmitted Done Reply Inline Actions getRegClass should be sufficient. There can't be a vreg without a class at this point arsenm: getRegClass should be sufficient. There can't be a vreg without a class at this point
				lkailUnsubmitted Done Reply Inline Actions I think it can be simplified as unsigned SubReg = MO.getSubReg(); LaneBitmask UseMask = SubReg ? TRI->getSubRegIndexLaneMask(SubReg) : MRI->getMaxLaneMaskForVReg(Reg); lkail: I think it can be simplified as ``` unsigned SubReg = MO.getSubReg()…
				bsaleilUnsubmitted Done Reply Inline Actions Thanks, good catch @lkail. I simplified that. bsaleil: Thanks, good catch @lkail. I simplified that.
	// Writing to the full register?			// Writing to the full register?
	assert(MO.isDef());			assert(MO.isDef());
	IsFullWrite = true;			IsFullWrite = true;
	}			}
	}			}

	// If an instruction writes to a subregister, a new segment starts in			// If an instruction writes to a subregister, a new segment starts in
	// the LiveInterval. But as this is only overriding part of the register			// the LiveInterval. But as this is only overriding part of the register
	▲ Show 20 Lines • Show All 922 Lines • Show Last 20 Lines

llvm/test/CodeGen/AMDGPU/load-global-i16.ll

This file is larger than 256 KB, so syntax highlighting is disabled by default.

	Show First 20 Lines • Show All 7,297 Lines • ▼ Show 20 Lines
	; GCN-NOHSA-SI-NEXT: s_waitcnt expcnt(2)			; GCN-NOHSA-SI-NEXT: s_waitcnt expcnt(2)
	; GCN-NOHSA-SI-NEXT: v_and_b32_e32 v19, s0, v4			; GCN-NOHSA-SI-NEXT: v_and_b32_e32 v19, s0, v4
	; GCN-NOHSA-SI-NEXT: s_waitcnt expcnt(0)			; GCN-NOHSA-SI-NEXT: s_waitcnt expcnt(0)
	; GCN-NOHSA-SI-NEXT: buffer_store_dword v19, off, s[12:15], 0 offset:20 ; 4-byte Folded Spill			; GCN-NOHSA-SI-NEXT: buffer_store_dword v19, off, s[12:15], 0 offset:20 ; 4-byte Folded Spill
	; GCN-NOHSA-SI-NEXT: s_waitcnt vmcnt(0)			; GCN-NOHSA-SI-NEXT: s_waitcnt vmcnt(0)
	; GCN-NOHSA-SI-NEXT: buffer_store_dword v20, off, s[12:15], 0 offset:24 ; 4-byte Folded Spill			; GCN-NOHSA-SI-NEXT: buffer_store_dword v20, off, s[12:15], 0 offset:24 ; 4-byte Folded Spill
	; GCN-NOHSA-SI-NEXT: buffer_store_dword v21, off, s[12:15], 0 offset:28 ; 4-byte Folded Spill			; GCN-NOHSA-SI-NEXT: buffer_store_dword v21, off, s[12:15], 0 offset:28 ; 4-byte Folded Spill
	; GCN-NOHSA-SI-NEXT: buffer_store_dword v22, off, s[12:15], 0 offset:32 ; 4-byte Folded Spill			; GCN-NOHSA-SI-NEXT: buffer_store_dword v22, off, s[12:15], 0 offset:32 ; 4-byte Folded Spill
	; GCN-NOHSA-SI-NEXT: s_waitcnt expcnt(1)			; GCN-NOHSA-SI-NEXT: v_and_b32_e32 v4, s0, v3
	; GCN-NOHSA-SI-NEXT: v_and_b32_e32 v21, s0, v3
	; GCN-NOHSA-SI-NEXT: v_lshrrev_b32_e32 v32, 16, v5			; GCN-NOHSA-SI-NEXT: v_lshrrev_b32_e32 v32, 16, v5
	; GCN-NOHSA-SI-NEXT: v_and_b32_e32 v30, s0, v5			; GCN-NOHSA-SI-NEXT: v_and_b32_e32 v30, s0, v5
	; GCN-NOHSA-SI-NEXT: v_lshrrev_b32_e32 v36, 16, v6			; GCN-NOHSA-SI-NEXT: v_lshrrev_b32_e32 v36, 16, v6
	; GCN-NOHSA-SI-NEXT: v_and_b32_e32 v34, s0, v6			; GCN-NOHSA-SI-NEXT: v_and_b32_e32 v34, s0, v6
	; GCN-NOHSA-SI-NEXT: v_lshrrev_b32_e32 v28, 16, v8			; GCN-NOHSA-SI-NEXT: v_lshrrev_b32_e32 v28, 16, v8
	; GCN-NOHSA-SI-NEXT: v_and_b32_e32 v26, s0, v8			; GCN-NOHSA-SI-NEXT: v_and_b32_e32 v26, s0, v8
	; GCN-NOHSA-SI-NEXT: v_lshrrev_b32_e32 v40, 16, v7			; GCN-NOHSA-SI-NEXT: v_lshrrev_b32_e32 v40, 16, v7
	; GCN-NOHSA-SI-NEXT: v_and_b32_e32 v38, s0, v7			; GCN-NOHSA-SI-NEXT: v_and_b32_e32 v38, s0, v7
	Show All 24 Lines
	; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v51, v1			; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v51, v1
	; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v53, v1			; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v53, v1
	; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v43, v1			; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v43, v1
	; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v45, v1			; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v45, v1
	; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v39, v1			; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v39, v1
	; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v41, v1			; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v41, v1
	; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v31, v1			; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v31, v1
	; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v33, v1			; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v33, v1
	; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v4, v21
	; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v6, v23			; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v6, v23
	; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v5, v1			; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v5, v1
	; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v7, v1			; GCN-NOHSA-SI-NEXT: v_mov_b32_e32 v7, v1
	; GCN-NOHSA-SI-NEXT: buffer_store_dword v4, off, s[12:15], 0 offset:36 ; 4-byte Folded Spill			; GCN-NOHSA-SI-NEXT: buffer_store_dword v4, off, s[12:15], 0 offset:36 ; 4-byte Folded Spill
	; GCN-NOHSA-SI-NEXT: s_waitcnt vmcnt(0)			; GCN-NOHSA-SI-NEXT: s_waitcnt vmcnt(0)
	; GCN-NOHSA-SI-NEXT: buffer_store_dword v5, off, s[12:15], 0 offset:40 ; 4-byte Folded Spill			; GCN-NOHSA-SI-NEXT: buffer_store_dword v5, off, s[12:15], 0 offset:40 ; 4-byte Folded Spill
	; GCN-NOHSA-SI-NEXT: buffer_store_dword v6, off, s[12:15], 0 offset:44 ; 4-byte Folded Spill			; GCN-NOHSA-SI-NEXT: buffer_store_dword v6, off, s[12:15], 0 offset:44 ; 4-byte Folded Spill
	; GCN-NOHSA-SI-NEXT: buffer_store_dword v7, off, s[12:15], 0 offset:48 ; 4-byte Folded Spill			; GCN-NOHSA-SI-NEXT: buffer_store_dword v7, off, s[12:15], 0 offset:48 ; 4-byte Folded Spill
	▲ Show 20 Lines • Show All 1,399 Lines • Show Last 20 Lines

llvm/test/CodeGen/AMDGPU/regbank-reassign-wave64.mir

	Show All 16 Lines
	# GCN: $vgpr24_vgpr25_vgpr26_vgpr27 = IMPLICIT_DEF			# GCN: $vgpr24_vgpr25_vgpr26_vgpr27 = IMPLICIT_DEF
	# GCN: $vgpr28_vgpr29_vgpr30_vgpr31 = IMPLICIT_DEF			# GCN: $vgpr28_vgpr29_vgpr30_vgpr31 = IMPLICIT_DEF
	# GCN: $vgpr32_vgpr33_vgpr34_vgpr35 = IMPLICIT_DEF			# GCN: $vgpr32_vgpr33_vgpr34_vgpr35 = IMPLICIT_DEF
	# GCN: $vgpr36_vgpr37_vgpr38_vgpr39 = IMPLICIT_DEF			# GCN: $vgpr36_vgpr37_vgpr38_vgpr39 = IMPLICIT_DEF
	# GCN: $vgpr40_vgpr41_vgpr42_vgpr43 = IMPLICIT_DEF			# GCN: $vgpr40_vgpr41_vgpr42_vgpr43 = IMPLICIT_DEF
	# GCN: $vgpr44_vgpr45_vgpr46_vgpr47 = IMPLICIT_DEF			# GCN: $vgpr44_vgpr45_vgpr46_vgpr47 = IMPLICIT_DEF
	# GCN: $vgpr2 = V_CNDMASK_B32_e64 0, $vgpr1, 0, $vgpr5, $vcc, implicit $exec			# GCN: $vgpr2 = V_CNDMASK_B32_e64 0, $vgpr1, 0, $vgpr5, $vcc, implicit $exec
	# GCN: $vgpr2 = V_CNDMASK_B32_e64 0, $vgpr0, 0, $vgpr4, killed $vcc, implicit $exec			# GCN: $vgpr2 = V_CNDMASK_B32_e64 0, $vgpr0, 0, $vgpr4, killed $vcc, implicit $exec
	# GCN: $sgpr0_sgpr1 = V_CMP_LT_U64_e64 $vgpr4_vgpr5, $vgpr0_vgpr1, implicit $exec			# GCN: $sgpr0_sgpr1 = V_CMP_LT_U64_e64 killed $vgpr4_vgpr5, killed $vgpr0_vgpr1, implicit $exec
	---			---
	name: vgpr64_mixed_use			name: vgpr64_mixed_use
	tracksRegLiveness: true			tracksRegLiveness: true
	registers:			registers:
	- { id: 0, class: vreg_64, preferred-register: '$vgpr0_vgpr1' }			- { id: 0, class: vreg_64, preferred-register: '$vgpr0_vgpr1' }
	- { id: 1, class: vreg_64, preferred-register: '$vgpr4_vgpr5' }			- { id: 1, class: vreg_64, preferred-register: '$vgpr4_vgpr5' }
	- { id: 2, class: sreg_64_xexec, preferred-register: '$vcc' }			- { id: 2, class: sreg_64_xexec, preferred-register: '$vcc' }
	- { id: 3, class: vgpr_32 }			- { id: 3, class: vgpr_32 }
	Show All 36 Lines

llvm/test/CodeGen/AMDGPU/regbank-reassign.mir

Show First 20 Lines • Show All 361 Lines • ▼ Show 20 Lines	bb.0:
DS_WRITE2_B32_gfx9 %2, %1.sub10, %1.sub11, 10, 11, 0, implicit $exec		DS_WRITE2_B32_gfx9 %2, %1.sub10, %1.sub11, 10, 11, 0, implicit $exec
DS_WRITE2_B32_gfx9 %2, %1.sub12, %1.sub13, 12, 13, 0, implicit $exec		DS_WRITE2_B32_gfx9 %2, %1.sub12, %1.sub13, 12, 13, 0, implicit $exec
DS_WRITE2_B32_gfx9 %2, %1.sub14, %1.sub15, 14, 15, 0, implicit $exec		DS_WRITE2_B32_gfx9 %2, %1.sub14, %1.sub15, 14, 15, 0, implicit $exec
S_ENDPGM 0		S_ENDPGM 0
...		...

# GCN-LABEL: vgpr_lo16_sub{{$}}		# GCN-LABEL: vgpr_lo16_sub{{$}}
# GCN: renamable $vgpr0 = V_AND_B32_e32 killed $vgpr3, killed $vgpr1, implicit $exec		# GCN: renamable $vgpr0 = V_AND_B32_e32 killed $vgpr3, killed $vgpr1, implicit $exec
# GCN: renamable $vgpr1_lo16 = COPY renamable $vgpr0_lo16		# GCN: renamable $vgpr1_lo16 = COPY killed renamable $vgpr0_lo16
---		---
name: vgpr_lo16_sub		name: vgpr_lo16_sub
tracksRegLiveness: true		tracksRegLiveness: true
registers:		registers:
- { id: 0, class: vgpr_32, preferred-register: '$vgpr1' }		- { id: 0, class: vgpr_32, preferred-register: '$vgpr1' }
- { id: 1, class: vgpr_32, preferred-register: '$vgpr5' }		- { id: 1, class: vgpr_32, preferred-register: '$vgpr5' }
- { id: 2, class: vgpr_32 }		- { id: 2, class: vgpr_32 }
- { id: 3, class: vgpr_lo16 }		- { id: 3, class: vgpr_lo16 }
Show All 20 Lines	bb.0:

%0 = COPY $vgpr0_lo16		%0 = COPY $vgpr0_lo16
$vgpr1_lo16 = COPY %0		$vgpr1_lo16 = COPY %0
SI_RETURN_TO_EPILOG $vgpr1_lo16		SI_RETURN_TO_EPILOG $vgpr1_lo16
...		...

# GCN-LABEL: vgpr_hi16_sub{{$}}		# GCN-LABEL: vgpr_hi16_sub{{$}}
# GCN: renamable $vgpr0 = V_AND_B32_e32 killed $vgpr3, killed $vgpr1, implicit $exec		# GCN: renamable $vgpr0 = V_AND_B32_e32 killed $vgpr3, killed $vgpr1, implicit $exec
# GCN: renamable $vgpr1_hi16 = COPY renamable $vgpr0_hi16		# GCN: renamable $vgpr1_hi16 = COPY killed renamable $vgpr0_hi16
---		---
name: vgpr_hi16_sub		name: vgpr_hi16_sub
tracksRegLiveness: true		tracksRegLiveness: true
registers:		registers:
- { id: 0, class: vgpr_32, preferred-register: '$vgpr1' }		- { id: 0, class: vgpr_32, preferred-register: '$vgpr1' }
- { id: 1, class: vgpr_32, preferred-register: '$vgpr5' }		- { id: 1, class: vgpr_32, preferred-register: '$vgpr5' }
- { id: 2, class: vgpr_32 }		- { id: 2, class: vgpr_32 }
- { id: 3, class: vgpr_hi16 }		- { id: 3, class: vgpr_hi16 }
Show All 20 Lines	bb.0:

%0 = COPY $vgpr0_hi16		%0 = COPY $vgpr0_hi16
$vgpr1_hi16 = COPY %0		$vgpr1_hi16 = COPY %0
SI_RETURN_TO_EPILOG $vgpr1_hi16		SI_RETURN_TO_EPILOG $vgpr1_hi16
...		...

# GCN-LABEL: sgpr_lo16_sub{{$}}		# GCN-LABEL: sgpr_lo16_sub{{$}}
# GCN: renamable $sgpr0 = S_AND_B32 killed renamable $sgpr14, $sgpr0, implicit-def $scc		# GCN: renamable $sgpr0 = S_AND_B32 killed renamable $sgpr14, $sgpr0, implicit-def $scc
# GCN: renamable $sgpr1_lo16 = COPY renamable $sgpr0_lo16		# GCN: renamable $sgpr1_lo16 = COPY killed renamable $sgpr0_lo16
---		---
name: sgpr_lo16_sub		name: sgpr_lo16_sub
tracksRegLiveness: true		tracksRegLiveness: true
registers:		registers:
- { id: 0, class: sgpr_32, preferred-register: '$sgpr16' }		- { id: 0, class: sgpr_32, preferred-register: '$sgpr16' }
- { id: 1, class: sgpr_32 }		- { id: 1, class: sgpr_32 }
- { id: 2, class: sgpr_lo16 }		- { id: 2, class: sgpr_lo16 }
body: \|		body: \|
Show All 40 Lines	bb.0:
$vgpr3_lo16 = IMPLICIT_DEF		$vgpr3_lo16 = IMPLICIT_DEF
%2 = V_AND_B32_e32 %1, %0, implicit $exec		%2 = V_AND_B32_e32 %1, %0, implicit $exec
S_ENDPGM 0		S_ENDPGM 0
...		...

# Test that bank of subreg is considered during scavenging.		# Test that bank of subreg is considered during scavenging.
# If handled incorrectly an infinite loop occurs.		# If handled incorrectly an infinite loop occurs.
# GCN-LABEL: s0_vs_s15_16_17_sub1{{$}}		# GCN-LABEL: s0_vs_s15_16_17_sub1{{$}}
# GCN: S_AND_B32 renamable $sgpr13, $sgpr0,		# GCN: S_AND_B32 killed renamable $sgpr13, $sgpr0,
---		---
name: s0_vs_s15_16_17_sub1		name: s0_vs_s15_16_17_sub1
tracksRegLiveness: true		tracksRegLiveness: true
registers:		registers:
- { id: 0, class: sgpr_96, preferred-register: '$sgpr15_sgpr16_sgpr17' }		- { id: 0, class: sgpr_96, preferred-register: '$sgpr15_sgpr16_sgpr17' }
- { id: 1, class: sgpr_32 }		- { id: 1, class: sgpr_32 }
body: \|		body: \|
bb.0:		bb.0:
Show All 16 Lines
# GCN: $vgpr20_vgpr21_vgpr22_vgpr23 = IMPLICIT_DEF		# GCN: $vgpr20_vgpr21_vgpr22_vgpr23 = IMPLICIT_DEF
# GCN: $vgpr24_vgpr25_vgpr26_vgpr27 = IMPLICIT_DEF		# GCN: $vgpr24_vgpr25_vgpr26_vgpr27 = IMPLICIT_DEF
# GCN: $vgpr28_vgpr29_vgpr30_vgpr31 = IMPLICIT_DEF		# GCN: $vgpr28_vgpr29_vgpr30_vgpr31 = IMPLICIT_DEF
# GCN: $vgpr32_vgpr33_vgpr34_vgpr35 = IMPLICIT_DEF		# GCN: $vgpr32_vgpr33_vgpr34_vgpr35 = IMPLICIT_DEF
# GCN: $vgpr36_vgpr37_vgpr38_vgpr39 = IMPLICIT_DEF		# GCN: $vgpr36_vgpr37_vgpr38_vgpr39 = IMPLICIT_DEF
# GCN: $vgpr40_vgpr41_vgpr42_vgpr43 = IMPLICIT_DEF		# GCN: $vgpr40_vgpr41_vgpr42_vgpr43 = IMPLICIT_DEF
# GCN: $vgpr44_vgpr45_vgpr46_vgpr47 = IMPLICIT_DEF		# GCN: $vgpr44_vgpr45_vgpr46_vgpr47 = IMPLICIT_DEF
# GCN: $vgpr0_vgpr1 = V_ADD_F64_e64 0, $vgpr11_vgpr12, 0, killed $vgpr16_vgpr17, 0, 0, implicit $mode, implicit $exec		# GCN: $vgpr0_vgpr1 = V_ADD_F64_e64 0, $vgpr11_vgpr12, 0, killed $vgpr16_vgpr17, 0, 0, implicit $mode, implicit $exec
# GCN: $vgpr0_vgpr1 = V_ADD_F64_e64 0, $vgpr9_vgpr10, 0, killed $vgpr14_vgpr15, 0, 0, implicit $mode, implicit $exec		# GCN: $vgpr0_vgpr1 = V_ADD_F64_e64 0, killed $vgpr9_vgpr10, 0, killed $vgpr14_vgpr15, 0, 0, implicit $mode, implicit $exec
---		---
name: vgpr_sub_dependence		name: vgpr_sub_dependence
tracksRegLiveness: true		tracksRegLiveness: true
registers:		registers:
- { id: 0, class: vreg_128, preferred-register: '$vgpr10_vgpr11_vgpr12_vgpr13' }		- { id: 0, class: vreg_128, preferred-register: '$vgpr10_vgpr11_vgpr12_vgpr13' }
- { id: 1, class: vreg_64, preferred-register: '$vgpr16_vgpr17' }		- { id: 1, class: vreg_64, preferred-register: '$vgpr16_vgpr17' }
- { id: 2, class: vreg_64, preferred-register: '$vgpr14_vgpr15' }		- { id: 2, class: vreg_64, preferred-register: '$vgpr14_vgpr15' }
- { id: 3, class: vreg_64 }		- { id: 3, class: vreg_64 }
Show All 32 Lines

llvm/test/CodeGen/AMDGPU/spill-scavenge-offset.ll

	Show All 10 Lines
	; is used to calculate the scratch load/store address. Make sure that this			; is used to calculate the scratch load/store address. Make sure that this
	; mechanism works even when many spills happen.			; mechanism works even when many spills happen.

	; Just test that it compiles successfully.			; Just test that it compiles successfully.
	; CHECK-LABEL: test			; CHECK-LABEL: test

	; GFX9-FLATSCR: s_mov_b32 [[SOFF1:s[0-9]+]], 4{{$}}			; GFX9-FLATSCR: s_mov_b32 [[SOFF1:s[0-9]+]], 4{{$}}
	; GFX9-FLATSCR: scratch_store_dwordx4 off, v[{{[0-9:]+}}], [[SOFF1]] ; 16-byte Folded Spill			; GFX9-FLATSCR: scratch_store_dwordx4 off, v[{{[0-9:]+}}], [[SOFF1]] ; 16-byte Folded Spill
	; GFX9-FLATSCR: s_movk_i32 [[SOFF2:s[0-9]+]], 0x{{[0-9a-f]+}}{{$}}			; GFX9-FLATSCR: s_movk_i32 [[SOFF2:s[0-9]+]], 0x1{{[0-9a-f]+}}{{$}}
				foadUnsubmitted Not Done Reply Inline Actions Why do you need this change? foad: Why do you need this change?
				bsaleilUnsubmitted Done Reply Inline Actions @foad, if I understand the test case correctly, the generated code is divided into two parts: spills and reloads. The first two check lines (`s_mov_b32` and `scratch_store_dwordx4`) are supposed to match a spill; the other two check lines (`s_movk_i32` and `scratch_load_dwordx4`) are supposed to match a reload. Currently, the first two check lines are correctly matched in the spills part, but `s_movk_i32` is actually also matched in the spills section. It turns out that there is a `scratch_load_dwordx4` for that same register in the reload part, so the test succeeds. This patch slightly changes the register allocation for this test case, and now there is no `scratch_load_dwordx4` for that register. By adding the 1 here, we force the `s_movk_i32` to be matched in the reload section, because no `s_movk_i32` uses `0x1` in the spills section. Then the `scratch_load_dwordx4` for that register is correctly matched. bsaleil: @foad, if I understand the test case correctly, the generated code is divided into two parts…
				foadUnsubmitted Not Done Reply Inline Actions Makes sense, thanks. foad: Makes sense, thanks.
	; GFX9-FLATSCR: scratch_load_dwordx4 v[{{[0-9:]+}}], off, [[SOFF2]] ; 16-byte Folded Reload			; GFX9-FLATSCR: scratch_load_dwordx4 v[{{[0-9:]+}}], off, [[SOFF2]] ; 16-byte Folded Reload

	; GFX10-FLATSCR: scratch_store_dwordx4 off, v[{{[0-9:]+}}], off offset:{{[0-9]+}} ; 16-byte Folded Spill			; GFX10-FLATSCR: scratch_store_dwordx4 off, v[{{[0-9:]+}}], off offset:{{[0-9]+}} ; 16-byte Folded Spill
	; GFX10-FLATSCR: scratch_load_dwordx4 v[{{[0-9:]+}}], off, off offset:{{[0-9]+}} ; 16-byte Folded Reload			; GFX10-FLATSCR: scratch_load_dwordx4 v[{{[0-9:]+}}], off, off offset:{{[0-9]+}} ; 16-byte Folded Reload
	define amdgpu_kernel void @test(<1280 x i32> addrspace(1)* %out, <1280 x i32> addrspace(1)* %in) {			define amdgpu_kernel void @test(<1280 x i32> addrspace(1)* %out, <1280 x i32> addrspace(1)* %in) {
	entry:			entry:
	%lo = call i32 @llvm.amdgcn.mbcnt.lo(i32 -1, i32 0)			%lo = call i32 @llvm.amdgcn.mbcnt.lo(i32 -1, i32 0)
	%tid = call i32 @llvm.amdgcn.mbcnt.hi(i32 -1, i32 %lo)			%tid = call i32 @llvm.amdgcn.mbcnt.hi(i32 -1, i32 %lo)
	▲ Show 20 Lines • Show All 87 Lines • Show Last 20 Lines

llvm/test/CodeGen/AMDGPU/splitkit-nolivesubranges.mir

	Show All 13 Lines
	tracksRegLiveness: true			tracksRegLiveness: true
	body: \|			body: \|
	bb.0:			bb.0:
	liveins: $sgpr0_sgpr1			liveins: $sgpr0_sgpr1
	; CHECK-LABEL: name: func0			; CHECK-LABEL: name: func0
	; CHECK: liveins: $sgpr0_sgpr1			; CHECK: liveins: $sgpr0_sgpr1
	; CHECK: renamable $sgpr0 = IMPLICIT_DEF			; CHECK: renamable $sgpr0 = IMPLICIT_DEF
	; CHECK: renamable $sgpr1 = IMPLICIT_DEF			; CHECK: renamable $sgpr1 = IMPLICIT_DEF
	; CHECK: $sgpr104 = S_AND_B32 renamable $sgpr0, renamable $sgpr1, implicit-def $scc			; CHECK: $sgpr104 = S_AND_B32 killed renamable $sgpr0, renamable $sgpr1, implicit-def $scc
	; CHECK: KILL implicit-def $vcc, implicit-def $sgpr0_sgpr1_sgpr2_sgpr3_sgpr4_sgpr5_sgpr6_sgpr7_sgpr8_sgpr9_sgpr10_sgpr11_sgpr12_sgpr13_sgpr14_sgpr15_sgpr16_sgpr17_sgpr18_sgpr19_sgpr20_sgpr21_sgpr22_sgpr23_sgpr24_sgpr25_sgpr26_sgpr27_sgpr28_sgpr29_sgpr30_sgpr31, implicit-def $sgpr32_sgpr33_sgpr34_sgpr35_sgpr36_sgpr37_sgpr38_sgpr39_sgpr40_sgpr41_sgpr42_sgpr43_sgpr44_sgpr45_sgpr46_sgpr47_sgpr48_sgpr49_sgpr50_sgpr51_sgpr52_sgpr53_sgpr54_sgpr55_sgpr56_sgpr57_sgpr58_sgpr59_sgpr60_sgpr61_sgpr62_sgpr63, implicit-def $sgpr64_sgpr65_sgpr66_sgpr67_sgpr68_sgpr69_sgpr70_sgpr71_sgpr72_sgpr73_sgpr74_sgpr75_sgpr76_sgpr77_sgpr78_sgpr79_sgpr80_sgpr81_sgpr82_sgpr83_sgpr84_sgpr85_sgpr86_sgpr87_sgpr88_sgpr89_sgpr90_sgpr91_sgpr92_sgpr93_sgpr94_sgpr95, implicit-def $sgpr96_sgpr97_sgpr98_sgpr99_sgpr100_sgpr101_sgpr102_sgpr103			; CHECK: KILL implicit-def $vcc, implicit-def $sgpr0_sgpr1_sgpr2_sgpr3_sgpr4_sgpr5_sgpr6_sgpr7_sgpr8_sgpr9_sgpr10_sgpr11_sgpr12_sgpr13_sgpr14_sgpr15_sgpr16_sgpr17_sgpr18_sgpr19_sgpr20_sgpr21_sgpr22_sgpr23_sgpr24_sgpr25_sgpr26_sgpr27_sgpr28_sgpr29_sgpr30_sgpr31, implicit-def $sgpr32_sgpr33_sgpr34_sgpr35_sgpr36_sgpr37_sgpr38_sgpr39_sgpr40_sgpr41_sgpr42_sgpr43_sgpr44_sgpr45_sgpr46_sgpr47_sgpr48_sgpr49_sgpr50_sgpr51_sgpr52_sgpr53_sgpr54_sgpr55_sgpr56_sgpr57_sgpr58_sgpr59_sgpr60_sgpr61_sgpr62_sgpr63, implicit-def $sgpr64_sgpr65_sgpr66_sgpr67_sgpr68_sgpr69_sgpr70_sgpr71_sgpr72_sgpr73_sgpr74_sgpr75_sgpr76_sgpr77_sgpr78_sgpr79_sgpr80_sgpr81_sgpr82_sgpr83_sgpr84_sgpr85_sgpr86_sgpr87_sgpr88_sgpr89_sgpr90_sgpr91_sgpr92_sgpr93_sgpr94_sgpr95, implicit-def $sgpr96_sgpr97_sgpr98_sgpr99_sgpr100_sgpr101_sgpr102_sgpr103
	; CHECK: renamable $sgpr0_sgpr1 = IMPLICIT_DEF			; CHECK: renamable $sgpr0_sgpr1 = IMPLICIT_DEF
	; CHECK: renamable $sgpr0 = IMPLICIT_DEF			; CHECK: renamable $sgpr0 = IMPLICIT_DEF
	; CHECK: renamable $sgpr1 = IMPLICIT_DEF			; CHECK: renamable $sgpr1 = IMPLICIT_DEF
	; CHECK: SI_SPILL_S64_SAVE renamable $sgpr0_sgpr1, %stack.0, implicit $exec, implicit $sp_reg :: (store 8 into %stack.0, align 4, addrspace 5)			; CHECK: SI_SPILL_S64_SAVE renamable $sgpr0_sgpr1, %stack.0, implicit $exec, implicit $sp_reg :: (store 8 into %stack.0, align 4, addrspace 5)
	; CHECK: KILL implicit-def $vcc, implicit-def $sgpr0_sgpr1_sgpr2_sgpr3_sgpr4_sgpr5_sgpr6_sgpr7_sgpr8_sgpr9_sgpr10_sgpr11_sgpr12_sgpr13_sgpr14_sgpr15_sgpr16_sgpr17_sgpr18_sgpr19_sgpr20_sgpr21_sgpr22_sgpr23_sgpr24_sgpr25_sgpr26_sgpr27_sgpr28_sgpr29_sgpr30_sgpr31, implicit-def $sgpr32_sgpr33_sgpr34_sgpr35_sgpr36_sgpr37_sgpr38_sgpr39_sgpr40_sgpr41_sgpr42_sgpr43_sgpr44_sgpr45_sgpr46_sgpr47_sgpr48_sgpr49_sgpr50_sgpr51_sgpr52_sgpr53_sgpr54_sgpr55_sgpr56_sgpr57_sgpr58_sgpr59_sgpr60_sgpr61_sgpr62_sgpr63, implicit-def $sgpr64_sgpr65_sgpr66_sgpr67_sgpr68_sgpr69_sgpr70_sgpr71_sgpr72_sgpr73_sgpr74_sgpr75_sgpr76_sgpr77_sgpr78_sgpr79_sgpr80_sgpr81_sgpr82_sgpr83_sgpr84_sgpr85_sgpr86_sgpr87_sgpr88_sgpr89_sgpr90_sgpr91_sgpr92_sgpr93_sgpr94_sgpr95, implicit-def $sgpr96_sgpr97_sgpr98_sgpr99_sgpr100_sgpr101_sgpr102_sgpr103			; CHECK: KILL implicit-def $vcc, implicit-def $sgpr0_sgpr1_sgpr2_sgpr3_sgpr4_sgpr5_sgpr6_sgpr7_sgpr8_sgpr9_sgpr10_sgpr11_sgpr12_sgpr13_sgpr14_sgpr15_sgpr16_sgpr17_sgpr18_sgpr19_sgpr20_sgpr21_sgpr22_sgpr23_sgpr24_sgpr25_sgpr26_sgpr27_sgpr28_sgpr29_sgpr30_sgpr31, implicit-def $sgpr32_sgpr33_sgpr34_sgpr35_sgpr36_sgpr37_sgpr38_sgpr39_sgpr40_sgpr41_sgpr42_sgpr43_sgpr44_sgpr45_sgpr46_sgpr47_sgpr48_sgpr49_sgpr50_sgpr51_sgpr52_sgpr53_sgpr54_sgpr55_sgpr56_sgpr57_sgpr58_sgpr59_sgpr60_sgpr61_sgpr62_sgpr63, implicit-def $sgpr64_sgpr65_sgpr66_sgpr67_sgpr68_sgpr69_sgpr70_sgpr71_sgpr72_sgpr73_sgpr74_sgpr75_sgpr76_sgpr77_sgpr78_sgpr79_sgpr80_sgpr81_sgpr82_sgpr83_sgpr84_sgpr85_sgpr86_sgpr87_sgpr88_sgpr89_sgpr90_sgpr91_sgpr92_sgpr93_sgpr94_sgpr95, implicit-def $sgpr96_sgpr97_sgpr98_sgpr99_sgpr100_sgpr101_sgpr102_sgpr103
	; CHECK: renamable $sgpr0_sgpr1 = SI_SPILL_S64_RESTORE %stack.0, implicit $exec, implicit $sp_reg :: (load 8 from %stack.0, align 4, addrspace 5)			; CHECK: renamable $sgpr0_sgpr1 = SI_SPILL_S64_RESTORE %stack.0, implicit $exec, implicit $sp_reg :: (load 8 from %stack.0, align 4, addrspace 5)
	; CHECK: $sgpr105 = S_AND_B32 renamable $sgpr1, renamable $sgpr1, implicit-def $scc			; CHECK: $sgpr105 = S_AND_B32 killed renamable $sgpr1, renamable $sgpr1, implicit-def $scc
	; CHECK: S_NOP 0, implicit $sgpr104, implicit $sgpr105			; CHECK: S_NOP 0, implicit $sgpr104, implicit $sgpr105
	%0:sreg_64 = COPY $sgpr0_sgpr1			%0:sreg_64 = COPY $sgpr0_sgpr1
	%0.sub0:sreg_64 = IMPLICIT_DEF			%0.sub0:sreg_64 = IMPLICIT_DEF
	%0.sub1:sreg_64 = IMPLICIT_DEF			%0.sub1:sreg_64 = IMPLICIT_DEF
	$sgpr104 = S_AND_B32 %0.sub0, %0.sub1, implicit-def $scc			$sgpr104 = S_AND_B32 %0.sub0, %0.sub1, implicit-def $scc
	KILL implicit-def $vcc, implicit-def $sgpr0_sgpr1_sgpr2_sgpr3_sgpr4_sgpr5_sgpr6_sgpr7_sgpr8_sgpr9_sgpr10_sgpr11_sgpr12_sgpr13_sgpr14_sgpr15_sgpr16_sgpr17_sgpr18_sgpr19_sgpr20_sgpr21_sgpr22_sgpr23_sgpr24_sgpr25_sgpr26_sgpr27_sgpr28_sgpr29_sgpr30_sgpr31, implicit-def $sgpr32_sgpr33_sgpr34_sgpr35_sgpr36_sgpr37_sgpr38_sgpr39_sgpr40_sgpr41_sgpr42_sgpr43_sgpr44_sgpr45_sgpr46_sgpr47_sgpr48_sgpr49_sgpr50_sgpr51_sgpr52_sgpr53_sgpr54_sgpr55_sgpr56_sgpr57_sgpr58_sgpr59_sgpr60_sgpr61_sgpr62_sgpr63, implicit-def $sgpr64_sgpr65_sgpr66_sgpr67_sgpr68_sgpr69_sgpr70_sgpr71_sgpr72_sgpr73_sgpr74_sgpr75_sgpr76_sgpr77_sgpr78_sgpr79_sgpr80_sgpr81_sgpr82_sgpr83_sgpr84_sgpr85_sgpr86_sgpr87_sgpr88_sgpr89_sgpr90_sgpr91_sgpr92_sgpr93_sgpr94_sgpr95, implicit-def $sgpr96_sgpr97_sgpr98_sgpr99_sgpr100_sgpr101_sgpr102_sgpr103			KILL implicit-def $vcc, implicit-def $sgpr0_sgpr1_sgpr2_sgpr3_sgpr4_sgpr5_sgpr6_sgpr7_sgpr8_sgpr9_sgpr10_sgpr11_sgpr12_sgpr13_sgpr14_sgpr15_sgpr16_sgpr17_sgpr18_sgpr19_sgpr20_sgpr21_sgpr22_sgpr23_sgpr24_sgpr25_sgpr26_sgpr27_sgpr28_sgpr29_sgpr30_sgpr31, implicit-def $sgpr32_sgpr33_sgpr34_sgpr35_sgpr36_sgpr37_sgpr38_sgpr39_sgpr40_sgpr41_sgpr42_sgpr43_sgpr44_sgpr45_sgpr46_sgpr47_sgpr48_sgpr49_sgpr50_sgpr51_sgpr52_sgpr53_sgpr54_sgpr55_sgpr56_sgpr57_sgpr58_sgpr59_sgpr60_sgpr61_sgpr62_sgpr63, implicit-def $sgpr64_sgpr65_sgpr66_sgpr67_sgpr68_sgpr69_sgpr70_sgpr71_sgpr72_sgpr73_sgpr74_sgpr75_sgpr76_sgpr77_sgpr78_sgpr79_sgpr80_sgpr81_sgpr82_sgpr83_sgpr84_sgpr85_sgpr86_sgpr87_sgpr88_sgpr89_sgpr90_sgpr91_sgpr92_sgpr93_sgpr94_sgpr95, implicit-def $sgpr96_sgpr97_sgpr98_sgpr99_sgpr100_sgpr101_sgpr102_sgpr103
	%0.sub0:sreg_64 = IMPLICIT_DEF			%0.sub0:sreg_64 = IMPLICIT_DEF
	%0.sub1:sreg_64 = IMPLICIT_DEF			%0.sub1:sreg_64 = IMPLICIT_DEF
	KILL implicit-def $vcc, implicit-def $sgpr0_sgpr1_sgpr2_sgpr3_sgpr4_sgpr5_sgpr6_sgpr7_sgpr8_sgpr9_sgpr10_sgpr11_sgpr12_sgpr13_sgpr14_sgpr15_sgpr16_sgpr17_sgpr18_sgpr19_sgpr20_sgpr21_sgpr22_sgpr23_sgpr24_sgpr25_sgpr26_sgpr27_sgpr28_sgpr29_sgpr30_sgpr31, implicit-def $sgpr32_sgpr33_sgpr34_sgpr35_sgpr36_sgpr37_sgpr38_sgpr39_sgpr40_sgpr41_sgpr42_sgpr43_sgpr44_sgpr45_sgpr46_sgpr47_sgpr48_sgpr49_sgpr50_sgpr51_sgpr52_sgpr53_sgpr54_sgpr55_sgpr56_sgpr57_sgpr58_sgpr59_sgpr60_sgpr61_sgpr62_sgpr63, implicit-def $sgpr64_sgpr65_sgpr66_sgpr67_sgpr68_sgpr69_sgpr70_sgpr71_sgpr72_sgpr73_sgpr74_sgpr75_sgpr76_sgpr77_sgpr78_sgpr79_sgpr80_sgpr81_sgpr82_sgpr83_sgpr84_sgpr85_sgpr86_sgpr87_sgpr88_sgpr89_sgpr90_sgpr91_sgpr92_sgpr93_sgpr94_sgpr95, implicit-def $sgpr96_sgpr97_sgpr98_sgpr99_sgpr100_sgpr101_sgpr102_sgpr103			KILL implicit-def $vcc, implicit-def $sgpr0_sgpr1_sgpr2_sgpr3_sgpr4_sgpr5_sgpr6_sgpr7_sgpr8_sgpr9_sgpr10_sgpr11_sgpr12_sgpr13_sgpr14_sgpr15_sgpr16_sgpr17_sgpr18_sgpr19_sgpr20_sgpr21_sgpr22_sgpr23_sgpr24_sgpr25_sgpr26_sgpr27_sgpr28_sgpr29_sgpr30_sgpr31, implicit-def $sgpr32_sgpr33_sgpr34_sgpr35_sgpr36_sgpr37_sgpr38_sgpr39_sgpr40_sgpr41_sgpr42_sgpr43_sgpr44_sgpr45_sgpr46_sgpr47_sgpr48_sgpr49_sgpr50_sgpr51_sgpr52_sgpr53_sgpr54_sgpr55_sgpr56_sgpr57_sgpr58_sgpr59_sgpr60_sgpr61_sgpr62_sgpr63, implicit-def $sgpr64_sgpr65_sgpr66_sgpr67_sgpr68_sgpr69_sgpr70_sgpr71_sgpr72_sgpr73_sgpr74_sgpr75_sgpr76_sgpr77_sgpr78_sgpr79_sgpr80_sgpr81_sgpr82_sgpr83_sgpr84_sgpr85_sgpr86_sgpr87_sgpr88_sgpr89_sgpr90_sgpr91_sgpr92_sgpr93_sgpr94_sgpr95, implicit-def $sgpr96_sgpr97_sgpr98_sgpr99_sgpr100_sgpr101_sgpr102_sgpr103
	$sgpr105 = S_AND_B32 %0.sub1, %0.sub1, implicit-def $scc			$sgpr105 = S_AND_B32 %0.sub1, %0.sub1, implicit-def $scc
	S_NOP 0, implicit $sgpr104, implicit $sgpr105			S_NOP 0, implicit $sgpr104, implicit $sgpr105
	...			...

llvm/test/CodeGen/AMDGPU/splitkit.mir

	Show All 33 Lines
	# allocated to sgpr0_sgpr1 and the first to something else so we see two copies			# allocated to sgpr0_sgpr1 and the first to something else so we see two copies
	# in between for the two subregisters that are alive.			# in between for the two subregisters that are alive.
	# CHECK-LABEL: name: func1			# CHECK-LABEL: name: func1
	# CHECK: [[REG0:\$sgpr[0-9]+]] = COPY $sgpr0			# CHECK: [[REG0:\$sgpr[0-9]+]] = COPY $sgpr0
	# CHECK: [[REG1:\$sgpr[0-9]+]] = COPY $sgpr2			# CHECK: [[REG1:\$sgpr[0-9]+]] = COPY $sgpr2
	# CHECK: S_NOP 0			# CHECK: S_NOP 0
	# CHECK: S_NOP 0, implicit renamable [[REG0]]			# CHECK: S_NOP 0, implicit renamable [[REG0]]
	# CHECK: S_NOP 0, implicit renamable [[REG1]]			# CHECK: S_NOP 0, implicit renamable [[REG1]]
	# CHECK: $sgpr0 = COPY renamable [[REG0]]			# CHECK: $sgpr0 = COPY killed renamable [[REG0]]
	# CHECK: $sgpr2 = COPY renamable [[REG1]]			# CHECK: $sgpr2 = COPY renamable [[REG1]]
	# CHECK: S_NOP			# CHECK: S_NOP
	# CHECK: S_NOP 0, implicit renamable $sgpr0			# CHECK: S_NOP 0, implicit renamable $sgpr0
	# CHECK: S_NOP 0, implicit renamable $sgpr2			# CHECK: S_NOP 0, implicit killed renamable $sgpr2
	name: func1			name: func1
	tracksRegLiveness: true			tracksRegLiveness: true
	body: \|			body: \|
	bb.0:			bb.0:
	liveins: $sgpr0, $sgpr1, $sgpr2			liveins: $sgpr0, $sgpr1, $sgpr2
	undef %0.sub0 : sgpr_128 = COPY $sgpr0			undef %0.sub0 : sgpr_128 = COPY $sgpr0
	%0.sub2 = COPY $sgpr2			%0.sub2 = COPY $sgpr2

	▲ Show 20 Lines • Show All 51 Lines • Show Last 20 Lines

llvm/test/CodeGen/AMDGPU/subreg_interference.mir

	Show All 10 Lines
	# We should not detect any interference between v0/v1 here and only allocate			# We should not detect any interference between v0/v1 here and only allocate
	# sgpr0-sgpr3.			# sgpr0-sgpr3.
	#			#
	# CHECK-LABEL: func0			# CHECK-LABEL: func0
	# CHECK: S_NOP 0, implicit-def renamable $sgpr0			# CHECK: S_NOP 0, implicit-def renamable $sgpr0
	# CHECK: S_NOP 0, implicit-def renamable $sgpr3			# CHECK: S_NOP 0, implicit-def renamable $sgpr3
	# CHECK: S_NOP 0, implicit-def renamable $sgpr1			# CHECK: S_NOP 0, implicit-def renamable $sgpr1
	# CHECK: S_NOP 0, implicit-def renamable $sgpr2			# CHECK: S_NOP 0, implicit-def renamable $sgpr2
	# CHECK: S_NOP 0, implicit renamable $sgpr0, implicit renamable $sgpr3			# CHECK: S_NOP 0, implicit killed renamable $sgpr0, implicit renamable $sgpr3
	# CHECK: S_NOP 0, implicit renamable $sgpr1, implicit renamable $sgpr2			# CHECK: S_NOP 0, implicit killed renamable $sgpr1, implicit renamable $sgpr2
	name: func0			name: func0
	body: \|			body: \|
	bb.0:			bb.0:
	S_NOP 0, implicit-def undef %0.sub0 : sgpr_128			S_NOP 0, implicit-def undef %0.sub0 : sgpr_128
	S_NOP 0, implicit-def %0.sub3			S_NOP 0, implicit-def %0.sub3
	S_NOP 0, implicit-def undef %1.sub1 : sgpr_128			S_NOP 0, implicit-def undef %1.sub1 : sgpr_128
	S_NOP 0, implicit-def %1.sub2			S_NOP 0, implicit-def %1.sub2


	S_NOP 0, implicit %0.sub0, implicit %0.sub3			S_NOP 0, implicit %0.sub0, implicit %0.sub3
	S_NOP 0, implicit %1.sub1, implicit %1.sub2			S_NOP 0, implicit %1.sub1, implicit %1.sub2
	...			...

llvm/test/CodeGen/AMDGPU/unallocatable-bundle-regression.mir

Show All 34 Lines	bb.0:
; CHECK: renamable $sgpr8 = COPY renamable $sgpr5		; CHECK: renamable $sgpr8 = COPY renamable $sgpr5
; CHECK: renamable $sgpr9 = COPY renamable $sgpr5		; CHECK: renamable $sgpr9 = COPY renamable $sgpr5
; CHECK: renamable $sgpr10 = COPY renamable $sgpr5		; CHECK: renamable $sgpr10 = COPY renamable $sgpr5
; CHECK: renamable $sgpr11 = COPY renamable $sgpr5		; CHECK: renamable $sgpr11 = COPY renamable $sgpr5
; CHECK: renamable $sgpr12 = COPY renamable $sgpr5		; CHECK: renamable $sgpr12 = COPY renamable $sgpr5
; CHECK: renamable $sgpr13 = COPY renamable $sgpr5		; CHECK: renamable $sgpr13 = COPY renamable $sgpr5
; CHECK: renamable $sgpr14 = COPY renamable $sgpr5		; CHECK: renamable $sgpr14 = COPY renamable $sgpr5
; CHECK: renamable $sgpr15 = COPY renamable $sgpr5		; CHECK: renamable $sgpr15 = COPY renamable $sgpr5
; CHECK: renamable $vgpr5_vgpr6 = COPY renamable $sgpr0_sgpr1		; CHECK: renamable $vgpr5_vgpr6 = COPY killed renamable $sgpr0_sgpr1
; CHECK: renamable $sgpr16_sgpr17_sgpr18_sgpr19_sgpr20_sgpr21_sgpr22_sgpr23 = S_LOAD_DWORDX8_IMM renamable $sgpr4_sgpr5, 1088, 0, 0 :: (dereferenceable load 32, addrspace 6)		; CHECK: renamable $sgpr16_sgpr17_sgpr18_sgpr19_sgpr20_sgpr21_sgpr22_sgpr23 = S_LOAD_DWORDX8_IMM renamable $sgpr4_sgpr5, 1088, 0, 0 :: (dereferenceable load 32, addrspace 6)
; CHECK: renamable $sgpr80_sgpr81_sgpr82_sgpr83 = S_LOAD_DWORDX4_IMM renamable $sgpr4_sgpr5, 0, 0, 0 :: (load 16, addrspace 6)		; CHECK: renamable $sgpr80_sgpr81_sgpr82_sgpr83 = S_LOAD_DWORDX4_IMM renamable $sgpr4_sgpr5, 0, 0, 0 :: (load 16, addrspace 6)
; CHECK: renamable $sgpr0 = S_MOV_B32 1200		; CHECK: renamable $sgpr0 = S_MOV_B32 1200
; CHECK: renamable $sgpr1 = COPY renamable $sgpr5		; CHECK: renamable $sgpr1 = COPY renamable $sgpr5
; CHECK: renamable $sgpr24_sgpr25_sgpr26_sgpr27_sgpr28_sgpr29_sgpr30_sgpr31 = S_LOAD_DWORDX8_IMM renamable $sgpr4_sgpr5, 1152, 0, 0 :: (dereferenceable load 32, addrspace 6)		; CHECK: renamable $sgpr24_sgpr25_sgpr26_sgpr27_sgpr28_sgpr29_sgpr30_sgpr31 = S_LOAD_DWORDX8_IMM renamable $sgpr4_sgpr5, 1152, 0, 0 :: (dereferenceable load 32, addrspace 6)
; CHECK: renamable $sgpr84_sgpr85_sgpr86_sgpr87 = S_LOAD_DWORDX4_IMM renamable $sgpr0_sgpr1, 0, 0, 0 :: (load 16, addrspace 6)		; CHECK: renamable $sgpr84_sgpr85_sgpr86_sgpr87 = S_LOAD_DWORDX4_IMM renamable $sgpr0_sgpr1, 0, 0, 0 :: (load 16, addrspace 6)
; CHECK: KILL renamable $sgpr0, renamable $sgpr1		; CHECK: KILL killed renamable $sgpr0, renamable $sgpr1
; CHECK: renamable $sgpr0 = S_MOV_B32 1264		; CHECK: renamable $sgpr0 = S_MOV_B32 1264
; CHECK: renamable $sgpr1 = COPY renamable $sgpr5		; CHECK: renamable $sgpr1 = COPY renamable $sgpr5
; CHECK: renamable $sgpr36_sgpr37_sgpr38_sgpr39_sgpr40_sgpr41_sgpr42_sgpr43 = S_LOAD_DWORDX8_IMM renamable $sgpr4_sgpr5, 1216, 0, 0 :: (dereferenceable load 32, addrspace 6)		; CHECK: renamable $sgpr36_sgpr37_sgpr38_sgpr39_sgpr40_sgpr41_sgpr42_sgpr43 = S_LOAD_DWORDX8_IMM renamable $sgpr4_sgpr5, 1216, 0, 0 :: (dereferenceable load 32, addrspace 6)
; CHECK: renamable $sgpr88_sgpr89_sgpr90_sgpr91 = S_LOAD_DWORDX4_IMM renamable $sgpr0_sgpr1, 0, 0, 0 :: (load 16, addrspace 6)		; CHECK: renamable $sgpr88_sgpr89_sgpr90_sgpr91 = S_LOAD_DWORDX4_IMM renamable $sgpr0_sgpr1, 0, 0, 0 :: (load 16, addrspace 6)
; CHECK: KILL renamable $sgpr0, renamable $sgpr1		; CHECK: KILL killed renamable $sgpr0, renamable $sgpr1
; CHECK: renamable $sgpr0 = S_MOV_B32 1328		; CHECK: renamable $sgpr0 = S_MOV_B32 1328
; CHECK: renamable $sgpr1 = COPY renamable $sgpr5		; CHECK: renamable $sgpr1 = COPY renamable $sgpr5
; CHECK: renamable $sgpr44_sgpr45_sgpr46_sgpr47_sgpr48_sgpr49_sgpr50_sgpr51 = S_LOAD_DWORDX8_IMM renamable $sgpr4_sgpr5, 1280, 0, 0 :: (dereferenceable load 32, addrspace 6)		; CHECK: renamable $sgpr44_sgpr45_sgpr46_sgpr47_sgpr48_sgpr49_sgpr50_sgpr51 = S_LOAD_DWORDX8_IMM renamable $sgpr4_sgpr5, 1280, 0, 0 :: (dereferenceable load 32, addrspace 6)
; CHECK: renamable $sgpr92_sgpr93_sgpr94_sgpr95 = S_LOAD_DWORDX4_IMM renamable $sgpr0_sgpr1, 0, 0, 0 :: (load 16, addrspace 6)		; CHECK: renamable $sgpr92_sgpr93_sgpr94_sgpr95 = S_LOAD_DWORDX4_IMM renamable $sgpr0_sgpr1, 0, 0, 0 :: (load 16, addrspace 6)
; CHECK: KILL renamable $sgpr0, renamable $sgpr1		; CHECK: KILL killed renamable $sgpr0, renamable $sgpr1
; CHECK: renamable $sgpr52_sgpr53_sgpr54_sgpr55_sgpr56_sgpr57_sgpr58_sgpr59 = S_LOAD_DWORDX8_IMM renamable $sgpr4_sgpr5, 1344, 0, 0 :: (dereferenceable load 32, addrspace 6)		; CHECK: renamable $sgpr52_sgpr53_sgpr54_sgpr55_sgpr56_sgpr57_sgpr58_sgpr59 = S_LOAD_DWORDX8_IMM renamable $sgpr4_sgpr5, 1344, 0, 0 :: (dereferenceable load 32, addrspace 6)
; CHECK: renamable $sgpr0 = S_MOV_B32 1392		; CHECK: renamable $sgpr0 = S_MOV_B32 1392
; CHECK: renamable $sgpr1 = COPY renamable $sgpr5		; CHECK: renamable $sgpr1 = COPY renamable $sgpr5
; CHECK: renamable $sgpr60_sgpr61_sgpr62_sgpr63_sgpr64_sgpr65_sgpr66_sgpr67 = S_LOAD_DWORDX8_IMM renamable $sgpr4_sgpr5, 0, 0, 0 :: (load 32, addrspace 6)		; CHECK: renamable $sgpr60_sgpr61_sgpr62_sgpr63_sgpr64_sgpr65_sgpr66_sgpr67 = S_LOAD_DWORDX8_IMM renamable $sgpr4_sgpr5, 0, 0, 0 :: (load 32, addrspace 6)
; CHECK: renamable $sgpr2 = S_MOV_B32 1456		; CHECK: renamable $sgpr2 = S_MOV_B32 1456
; CHECK: renamable $sgpr3 = COPY renamable $sgpr5		; CHECK: renamable $sgpr3 = COPY renamable $sgpr5
; CHECK: renamable $sgpr68_sgpr69_sgpr70_sgpr71_sgpr72_sgpr73_sgpr74_sgpr75 = S_LOAD_DWORDX8_IMM renamable $sgpr4_sgpr5, 1472, 0, 0 :: (dereferenceable load 32, addrspace 6)		; CHECK: renamable $sgpr68_sgpr69_sgpr70_sgpr71_sgpr72_sgpr73_sgpr74_sgpr75 = S_LOAD_DWORDX8_IMM renamable $sgpr4_sgpr5, 1472, 0, 0 :: (dereferenceable load 32, addrspace 6)
; CHECK: renamable $sgpr4 = S_MOV_B32 1520		; CHECK: renamable $sgpr4 = S_MOV_B32 1520
; CHECK: renamable $sgpr96_sgpr97_sgpr98_sgpr99 = S_LOAD_DWORDX4_IMM renamable $sgpr2_sgpr3, 0, 0, 0 :: (load 16, addrspace 6)		; CHECK: renamable $sgpr96_sgpr97_sgpr98_sgpr99 = S_LOAD_DWORDX4_IMM killed renamable $sgpr2_sgpr3, 0, 0, 0 :: (load 16, addrspace 6)
; CHECK: renamable $sgpr4_sgpr5_sgpr6_sgpr7 = S_LOAD_DWORDX4_IMM renamable $sgpr4_sgpr5, 0, 0, 0 :: (load 16, addrspace 6)		; CHECK: renamable $sgpr4_sgpr5_sgpr6_sgpr7 = S_LOAD_DWORDX4_IMM killed renamable $sgpr4_sgpr5, 0, 0, 0 :: (load 16, addrspace 6)
; CHECK: renamable $sgpr0_sgpr1_sgpr2_sgpr3 = S_LOAD_DWORDX4_IMM renamable $sgpr0_sgpr1, 0, 0, 0 :: (load 16, addrspace 6)		; CHECK: renamable $sgpr0_sgpr1_sgpr2_sgpr3 = S_LOAD_DWORDX4_IMM killed renamable $sgpr0_sgpr1, 0, 0, 0 :: (load 16, addrspace 6)
; CHECK: renamable $vgpr7 = IMAGE_SAMPLE_LZ_V1_V2_gfx10 renamable $vgpr5_vgpr6, renamable $sgpr8_sgpr9_sgpr10_sgpr11_sgpr12_sgpr13_sgpr14_sgpr15, renamable $sgpr76_sgpr77_sgpr78_sgpr79, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, implicit $exec :: (dereferenceable load 16 from custom "ImageResource")		; CHECK: renamable $vgpr7 = IMAGE_SAMPLE_LZ_V1_V2_gfx10 renamable $vgpr5_vgpr6, killed renamable $sgpr8_sgpr9_sgpr10_sgpr11_sgpr12_sgpr13_sgpr14_sgpr15, killed renamable $sgpr76_sgpr77_sgpr78_sgpr79, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, implicit $exec :: (dereferenceable load 16 from custom "ImageResource")
; CHECK: renamable $vgpr8 = IMAGE_SAMPLE_LZ_V1_V2_gfx10 renamable $vgpr5_vgpr6, killed renamable $sgpr16_sgpr17_sgpr18_sgpr19_sgpr20_sgpr21_sgpr22_sgpr23, killed renamable $sgpr80_sgpr81_sgpr82_sgpr83, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, implicit $exec :: (dereferenceable load 16 from custom "ImageResource")		; CHECK: renamable $vgpr8 = IMAGE_SAMPLE_LZ_V1_V2_gfx10 renamable $vgpr5_vgpr6, killed renamable $sgpr16_sgpr17_sgpr18_sgpr19_sgpr20_sgpr21_sgpr22_sgpr23, killed renamable $sgpr80_sgpr81_sgpr82_sgpr83, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, implicit $exec :: (dereferenceable load 16 from custom "ImageResource")
; CHECK: renamable $vgpr9 = IMAGE_SAMPLE_LZ_V1_V2_gfx10 renamable $vgpr5_vgpr6, killed renamable $sgpr24_sgpr25_sgpr26_sgpr27_sgpr28_sgpr29_sgpr30_sgpr31, killed renamable $sgpr84_sgpr85_sgpr86_sgpr87, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, implicit $exec :: (dereferenceable load 16 from custom "ImageResource")		; CHECK: renamable $vgpr9 = IMAGE_SAMPLE_LZ_V1_V2_gfx10 renamable $vgpr5_vgpr6, killed renamable $sgpr24_sgpr25_sgpr26_sgpr27_sgpr28_sgpr29_sgpr30_sgpr31, killed renamable $sgpr84_sgpr85_sgpr86_sgpr87, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, implicit $exec :: (dereferenceable load 16 from custom "ImageResource")
; CHECK: renamable $vgpr10 = IMAGE_SAMPLE_LZ_V1_V2_gfx10 renamable $vgpr5_vgpr6, renamable $sgpr36_sgpr37_sgpr38_sgpr39_sgpr40_sgpr41_sgpr42_sgpr43, renamable $sgpr88_sgpr89_sgpr90_sgpr91, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, implicit $exec :: (dereferenceable load 16 from custom "ImageResource")		; CHECK: renamable $vgpr10 = IMAGE_SAMPLE_LZ_V1_V2_gfx10 renamable $vgpr5_vgpr6, renamable $sgpr36_sgpr37_sgpr38_sgpr39_sgpr40_sgpr41_sgpr42_sgpr43, renamable $sgpr88_sgpr89_sgpr90_sgpr91, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, implicit $exec :: (dereferenceable load 16 from custom "ImageResource")
; CHECK: renamable $vgpr11 = IMAGE_SAMPLE_LZ_V1_V2_gfx10 renamable $vgpr5_vgpr6, renamable $sgpr44_sgpr45_sgpr46_sgpr47_sgpr48_sgpr49_sgpr50_sgpr51, renamable $sgpr92_sgpr93_sgpr94_sgpr95, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, implicit $exec :: (dereferenceable load 16 from custom "ImageResource")		; CHECK: renamable $vgpr11 = IMAGE_SAMPLE_LZ_V1_V2_gfx10 renamable $vgpr5_vgpr6, renamable $sgpr44_sgpr45_sgpr46_sgpr47_sgpr48_sgpr49_sgpr50_sgpr51, renamable $sgpr92_sgpr93_sgpr94_sgpr95, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, implicit $exec :: (dereferenceable load 16 from custom "ImageResource")
; CHECK: renamable $vgpr12 = IMAGE_SAMPLE_LZ_V1_V2_gfx10 renamable $vgpr5_vgpr6, renamable $sgpr60_sgpr61_sgpr62_sgpr63_sgpr64_sgpr65_sgpr66_sgpr67, renamable $sgpr96_sgpr97_sgpr98_sgpr99, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, implicit $exec :: (dereferenceable load 16 from custom "ImageResource")		; CHECK: renamable $vgpr12 = IMAGE_SAMPLE_LZ_V1_V2_gfx10 renamable $vgpr5_vgpr6, renamable $sgpr60_sgpr61_sgpr62_sgpr63_sgpr64_sgpr65_sgpr66_sgpr67, renamable $sgpr96_sgpr97_sgpr98_sgpr99, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, implicit $exec :: (dereferenceable load 16 from custom "ImageResource")
; CHECK: renamable $vgpr13 = IMAGE_SAMPLE_LZ_V1_V2_gfx10 renamable $vgpr5_vgpr6, renamable $sgpr68_sgpr69_sgpr70_sgpr71_sgpr72_sgpr73_sgpr74_sgpr75, renamable $sgpr4_sgpr5_sgpr6_sgpr7, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, implicit $exec :: (dereferenceable load 16 from custom "ImageResource")		; CHECK: renamable $vgpr13 = IMAGE_SAMPLE_LZ_V1_V2_gfx10 renamable $vgpr5_vgpr6, renamable $sgpr68_sgpr69_sgpr70_sgpr71_sgpr72_sgpr73_sgpr74_sgpr75, renamable $sgpr4_sgpr5_sgpr6_sgpr7, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, implicit $exec :: (dereferenceable load 16 from custom "ImageResource")
; CHECK: renamable $vgpr14 = IMAGE_SAMPLE_LZ_V1_V2_gfx10 renamable $vgpr5_vgpr6, renamable $sgpr52_sgpr53_sgpr54_sgpr55_sgpr56_sgpr57_sgpr58_sgpr59, renamable $sgpr0_sgpr1_sgpr2_sgpr3, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, implicit $exec :: (dereferenceable load 16 from custom "ImageResource")		; CHECK: renamable $vgpr14 = IMAGE_SAMPLE_LZ_V1_V2_gfx10 renamable $vgpr5_vgpr6, renamable $sgpr52_sgpr53_sgpr54_sgpr55_sgpr56_sgpr57_sgpr58_sgpr59, renamable $sgpr0_sgpr1_sgpr2_sgpr3, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, implicit $exec :: (dereferenceable load 16 from custom "ImageResource")
; CHECK: renamable $sgpr8_sgpr9_sgpr10_sgpr11 = SI_SPILL_S128_RESTORE %stack.0, implicit $exec, implicit $sgpr32 :: (load 16 from %stack.0, align 4, addrspace 5)		; CHECK: renamable $sgpr8_sgpr9_sgpr10_sgpr11 = SI_SPILL_S128_RESTORE %stack.0, implicit $exec, implicit $sgpr32 :: (load 16 from %stack.0, align 4, addrspace 5)
Show All 14 Lines	bb.0:
; CHECK: renamable $vgpr0 = nofpexcept V_MAX_F32_e32 killed $vgpr7, killed $vgpr8, implicit $mode, implicit $exec		; CHECK: renamable $vgpr0 = nofpexcept V_MAX_F32_e32 killed $vgpr7, killed $vgpr8, implicit $mode, implicit $exec
; CHECK: renamable $vgpr0 = V_MAX3_F32_e64 0, killed $vgpr0, 0, killed $vgpr9, 0, killed $vgpr10, 0, 0, implicit $mode, implicit $exec		; CHECK: renamable $vgpr0 = V_MAX3_F32_e64 0, killed $vgpr0, 0, killed $vgpr9, 0, killed $vgpr10, 0, 0, implicit $mode, implicit $exec
; CHECK: renamable $vgpr1 = nofpexcept V_ADD_F32_e32 -1083321614, killed $vgpr12, implicit $mode, implicit $exec		; CHECK: renamable $vgpr1 = nofpexcept V_ADD_F32_e32 -1083321614, killed $vgpr12, implicit $mode, implicit $exec
; CHECK: renamable $vgpr3 = nofpexcept V_ADD_F32_e32 -1090988802, killed $vgpr13, implicit $mode, implicit $exec		; CHECK: renamable $vgpr3 = nofpexcept V_ADD_F32_e32 -1090988802, killed $vgpr13, implicit $mode, implicit $exec
; CHECK: renamable $vgpr0 = V_MAX3_F32_e64 0, killed $vgpr0, 0, killed $vgpr11, 0, killed $vgpr14, 0, 0, implicit $mode, implicit $exec		; CHECK: renamable $vgpr0 = V_MAX3_F32_e64 0, killed $vgpr0, 0, killed $vgpr11, 0, killed $vgpr14, 0, 0, implicit $mode, implicit $exec
; CHECK: renamable $vgpr0 = V_MAX3_F32_e64 0, killed $vgpr0, 0, killed $vgpr1, 0, killed $vgpr3, 0, 0, implicit $mode, implicit $exec		; CHECK: renamable $vgpr0 = V_MAX3_F32_e64 0, killed $vgpr0, 0, killed $vgpr1, 0, killed $vgpr3, 0, 0, implicit $mode, implicit $exec
; CHECK: renamable $sgpr0 = nofpexcept V_CMP_GT_F32_e64 0, 1028443341, 0, killed $vgpr0, 0, implicit $mode, implicit $exec		; CHECK: renamable $sgpr0 = nofpexcept V_CMP_GT_F32_e64 0, 1028443341, 0, killed $vgpr0, 0, implicit $mode, implicit $exec
; CHECK: renamable $vgpr0 = V_CNDMASK_B32_e64 0, 0, 0, 1065353216, killed $sgpr0, implicit $exec		; CHECK: renamable $vgpr0 = V_CNDMASK_B32_e64 0, 0, 0, 1065353216, killed $sgpr0, implicit $exec
; CHECK: EXP_DONE 12, killed renamable $vgpr0, renamable $vgpr2, undef renamable $vgpr0, undef renamable $vgpr0, -1, 0, 15, implicit $exec		; CHECK: EXP_DONE 12, killed renamable $vgpr0, killed renamable $vgpr2, undef renamable $vgpr0, undef renamable $vgpr0, -1, 0, 15, implicit $exec
; CHECK: S_ENDPGM 0		; CHECK: S_ENDPGM 0
%0:vgpr_32 = COPY $vgpr0		%0:vgpr_32 = COPY $vgpr0
undef %1.sub0:sgpr_64 = COPY $sgpr0		undef %1.sub0:sgpr_64 = COPY $sgpr0
%2:sgpr_128 = COPY $sgpr0_sgpr1_sgpr2_sgpr3		%2:sgpr_128 = COPY $sgpr0_sgpr1_sgpr2_sgpr3
%1.sub1:sgpr_64 = S_MOV_B32 0		%1.sub1:sgpr_64 = S_MOV_B32 0
undef %3.sub0:sgpr_128 = COPY %1.sub1		undef %3.sub0:sgpr_128 = COPY %1.sub1
%3.sub1:sgpr_128 = COPY %1.sub1		%3.sub1:sgpr_128 = COPY %1.sub1
%3.sub2:sgpr_128 = COPY %1.sub1		%3.sub2:sgpr_128 = COPY %1.sub1
▲ Show 20 Lines • Show All 58 Lines • Show Last 20 Lines

llvm/test/CodeGen/AMDGPU/virtregrewrite-undef-identity-copy.mir

Show All 34 Lines	bb.0:
; CHECK: $sgpr4 = COPY $sgpr95		; CHECK: $sgpr4 = COPY $sgpr95
; CHECK: dead $sgpr30_sgpr31 = SI_CALL killed renamable $sgpr6_sgpr7, @foo, csr_amdgpu_highregs, implicit $sgpr0_sgpr1_sgpr2_sgpr3, implicit $sgpr4		; CHECK: dead $sgpr30_sgpr31 = SI_CALL killed renamable $sgpr6_sgpr7, @foo, csr_amdgpu_highregs, implicit $sgpr0_sgpr1_sgpr2_sgpr3, implicit $sgpr4
; CHECK: ADJCALLSTACKDOWN 0, 4, implicit-def $scc, implicit-def $sgpr32, implicit $sgpr32, implicit $sgpr95		; CHECK: ADJCALLSTACKDOWN 0, 4, implicit-def $scc, implicit-def $sgpr32, implicit $sgpr32, implicit $sgpr95
; CHECK: renamable $sgpr6_sgpr7 = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-rel32-lo) @bar + 4, target-flags(amdgpu-rel32-hi) @bar + 4, implicit-def dead $scc		; CHECK: renamable $sgpr6_sgpr7 = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-rel32-lo) @bar + 4, target-flags(amdgpu-rel32-hi) @bar + 4, implicit-def dead $scc
; CHECK: ADJCALLSTACKUP 0, 0, implicit-def $scc, implicit-def $sgpr32, implicit $sgpr32, implicit $sgpr95		; CHECK: ADJCALLSTACKUP 0, 0, implicit-def $scc, implicit-def $sgpr32, implicit $sgpr32, implicit $sgpr95
; CHECK: $sgpr4 = COPY $sgpr95		; CHECK: $sgpr4 = COPY $sgpr95
; CHECK: $vgpr0 = COPY renamable $vgpr40		; CHECK: $vgpr0 = COPY renamable $vgpr40
; CHECK: $vgpr1 = COPY renamable $vgpr41		; CHECK: $vgpr1 = COPY renamable $vgpr41
; CHECK: $vgpr2 = COPY renamable $vgpr42		; CHECK: $vgpr2 = COPY killed renamable $vgpr42
; CHECK: $vgpr3 = KILL undef renamable $vgpr3		; CHECK: $vgpr3 = KILL undef renamable $vgpr3
; CHECK: dead $sgpr30_sgpr31 = SI_CALL killed renamable $sgpr6_sgpr7, @bar, csr_amdgpu_highregs, implicit $sgpr0_sgpr1_sgpr2_sgpr3, implicit $sgpr4, implicit $vgpr0, implicit killed $vgpr1, implicit killed $vgpr2, implicit killed $vgpr3, implicit-def $vgpr0		; CHECK: dead $sgpr30_sgpr31 = SI_CALL killed renamable $sgpr6_sgpr7, @bar, csr_amdgpu_highregs, implicit $sgpr0_sgpr1_sgpr2_sgpr3, implicit $sgpr4, implicit $vgpr0, implicit killed $vgpr1, implicit killed $vgpr2, implicit killed $vgpr3, implicit-def $vgpr0
; CHECK: ADJCALLSTACKDOWN 0, 4, implicit-def $scc, implicit-def $sgpr32, implicit $sgpr32, implicit $sgpr95		; CHECK: ADJCALLSTACKDOWN 0, 4, implicit-def $scc, implicit-def $sgpr32, implicit $sgpr32, implicit $sgpr95
; CHECK: FLAT_STORE_DWORD undef renamable $vgpr0_vgpr1, killed renamable $vgpr0, 0, 0, 0, 0, 0, implicit $exec, implicit $flat_scr :: (store 4, addrspace 1)		; CHECK: FLAT_STORE_DWORD undef renamable $vgpr0_vgpr1, killed renamable $vgpr0, 0, 0, 0, 0, 0, implicit $exec, implicit $flat_scr :: (store 4, addrspace 1)
; CHECK: S_ENDPGM 0		; CHECK: S_ENDPGM 0
%0:vreg_128 = FLAT_LOAD_DWORDX4 undef %1:vreg_64, 0, 0, 0, 0, 0, implicit $exec, implicit $flat_scr :: (load 16, addrspace 1)		%0:vreg_128 = FLAT_LOAD_DWORDX4 undef %1:vreg_64, 0, 0, 0, 0, 0, implicit $exec, implicit $flat_scr :: (load 16, addrspace 1)
%2:sreg_64 = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-rel32-lo) @foo + 4, target-flags(amdgpu-rel32-hi) @foo + 4, implicit-def dead $scc		%2:sreg_64 = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-rel32-lo) @foo + 4, target-flags(amdgpu-rel32-hi) @foo + 4, implicit-def dead $scc
ADJCALLSTACKUP 0, 0, implicit-def $sgpr32, implicit $sgpr32, implicit $sgpr95, implicit-def $scc		ADJCALLSTACKUP 0, 0, implicit-def $sgpr32, implicit $sgpr32, implicit $sgpr95, implicit-def $scc
Show All 17 Lines

llvm/test/CodeGen/PowerPC/subreg-killed.mir

This file was added.

				# RUN: llc -mcpu=pwr10 -O3 -ppc-track-subreg-liveness -verify-machineinstrs \
				# RUN: -mtriple=powerpc64le-unknown-linux-gnu -run-pass=greedy,virtregrewriter \
				# RUN: -o - %s | FileCheck %s

				# This test case checks that the 'killed' flag is properly added when using
				# subregisters.

				# CHECK-LABEL: test
				# CHECK: KILL_PAIR killed
				# CHECK-NEXT: COPY killed
				# CHECK-NEXT: KILL_PAIR killed
				# CHECK-NEXT: COPY killed
				# CHECK-NEXT: BUILD_UACC killed
				# CHECK-NEXT: XXMTACC killed
				# CHECK-NEXT: SPILL_ACC killed

				---
				name: test
				tracksRegLiveness: true
				fixedStack:
				- { id: 0, size: 8 }
				stack:
				- { id: 0, size: 64 }
				body: \|
				bb.0:
				liveins: $v2, $v3, $v4, $v5
				undef %4.sub_vsx1:vsrprc_with_sub_64_in_vfrc = COPY $v5
				%4.sub_vsx0:vsrprc_with_sub_64_in_vfrc = COPY $v4
				undef %5.sub_vsx1:vsrprc_with_sub_64_in_vfrc = COPY $v3
				%5.sub_vsx0:vsrprc_with_sub_64_in_vfrc = COPY $v2
				%6:g8rc_and_g8rc_nox0 = LD 0, %fixed-stack.0
				arsenm (inline comment, unsubmitted, done): Don't need the IR section.
				%5:vsrprc_with_sub_64_in_vfrc = KILL_PAIR %5
				undef %7.sub_pair0:uaccrc = COPY %5
				%4:vsrprc_with_sub_64_in_vfrc = KILL_PAIR %4
				%7.sub_pair1:uaccrc = COPY %4
				%8:accrc = BUILD_UACC %7
				%8:accrc = XXMTACC %8
				SPILL_ACC %8, 0, %stack.0

				...
				arsenm (inline comment, unsubmitted, done): Can you simplify this at all? -run-pass=none after deleting the register section will also compact these vreg numbers.

This is an archive of the discontinued LLVM Phabricator instance.

[VirtRegRewriter] Insert missing killed flags when tracking subregister liveness
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 327818

llvm/lib/CodeGen/LiveIntervals.cpp

llvm/test/CodeGen/AMDGPU/load-global-i16.ll

llvm/test/CodeGen/AMDGPU/regbank-reassign-wave64.mir

llvm/test/CodeGen/AMDGPU/regbank-reassign.mir

llvm/test/CodeGen/AMDGPU/spill-scavenge-offset.ll

llvm/test/CodeGen/AMDGPU/splitkit-nolivesubranges.mir

llvm/test/CodeGen/AMDGPU/splitkit.mir

llvm/test/CodeGen/AMDGPU/subreg_interference.mir

llvm/test/CodeGen/AMDGPU/unallocatable-bundle-regression.mir

llvm/test/CodeGen/AMDGPU/virtregrewrite-undef-identity-copy.mir

llvm/test/CodeGen/PowerPC/subreg-killed.mir

This is an archive of the discontinued LLVM Phabricator instance.

[VirtRegRewriter] Insert missing killed flags when tracking subregister liveness
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 327818

llvm/lib/CodeGen/LiveIntervals.cpp

llvm/test/CodeGen/AMDGPU/load-global-i16.ll

llvm/test/CodeGen/AMDGPU/regbank-reassign-wave64.mir

llvm/test/CodeGen/AMDGPU/regbank-reassign.mir

llvm/test/CodeGen/AMDGPU/spill-scavenge-offset.ll

llvm/test/CodeGen/AMDGPU/splitkit-nolivesubranges.mir

llvm/test/CodeGen/AMDGPU/splitkit.mir

llvm/test/CodeGen/AMDGPU/subreg_interference.mir

llvm/test/CodeGen/AMDGPU/unallocatable-bundle-regression.mir

llvm/test/CodeGen/AMDGPU/virtregrewrite-undef-identity-copy.mir

llvm/test/CodeGen/PowerPC/subreg-killed.mir

[VirtRegRewriter] Insert missing killed flags when tracking subregister liveness
ClosedPublic