Diff 358174

llvm/lib/Target/AMDGPU/SIInstrInfo.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 101 Lines • ▼ Show 20 Lines	static bool nodesHaveSameOperandValue(SDNode N0, SDNode N1, unsigned OpName) {
--Op0Idx;		--Op0Idx;
--Op1Idx;		--Op1Idx;

return N0->getOperand(Op0Idx) == N1->getOperand(Op1Idx);		return N0->getOperand(Op0Idx) == N1->getOperand(Op1Idx);
}		}

bool SIInstrInfo::isReallyTriviallyReMaterializable(const MachineInstr &MI,		bool SIInstrInfo::isReallyTriviallyReMaterializable(const MachineInstr &MI,
AAResults *AA) const {		AAResults *AA) const {
// TODO: The generic check fails for VALU instructions that should be		if (isVOP1(MI) \|\| isVOP3(MI) \|\| isSDWA(MI)) {
		arsenmUnsubmitted Done Reply Inline Actions Braces arsenm: Braces
		arsenmUnsubmitted Not Done Reply Inline Actions What about VOP2? arsenm: What about VOP2?
		rampitecAuthorUnsubmitted Done Reply Inline Actions There are no supported VOP2 yet. Only two VOP1 conversions and their promoted VOP3 forms. rampitec: There are no supported VOP2 yet. Only two VOP1 conversions and their promoted VOP3 forms.
// rematerializable due to implicit reads of exec. We really want all of the		// Normally VALU use of exec would block the rematerialization, but that
// generic logic for this except for this.		// is OK in this case to have an implicit exec read as all VALU do.
switch (MI.getOpcode()) {		// We really want all of the generic logic for this except for this.
case AMDGPU::V_MOV_B32_e32:
case AMDGPU::V_MOV_B32_e64:		// Another potential implicit use is mode register. The core logic of
case AMDGPU::V_MOV_B64_PSEUDO:		// the RA will not attempt rematerialization if mode is set anywhere
case AMDGPU::V_ACCVGPR_READ_B32_e64:		// in the function, otherwise it is safe since mode is not changed.
case AMDGPU::V_ACCVGPR_WRITE_B32_e64:		return !MI.hasImplicitDef() &&
// No non-standard implicit operands.		MI.getNumImplicitOperands() == MI.getDesc().getNumImplicitUses();
		arsenmUnsubmitted Done Reply Inline Actions Probably should get a comment about how normally exec would block rematerialization but should be OK, plus mode arsenm: Probably should get a comment about how normally exec would block rematerialization but should…
assert(MI.getDesc().getNumOperands() == 2);
assert(MI.getDesc().getNumImplicitDefs() == 0);
assert(MI.getDesc().getNumImplicitUses() == 1);
return MI.getNumOperands() == 3;
default:
return false;
}		}

		return false;
}		}

bool SIInstrInfo::areLoadsFromSameBasePtr(SDNode Load0, SDNode Load1,		bool SIInstrInfo::areLoadsFromSameBasePtr(SDNode Load0, SDNode Load1,
int64_t &Offset0,		int64_t &Offset0,
int64_t &Offset1) const {		int64_t &Offset1) const {
if (!Load0->isMachineOpcode() \|\| !Load1->isMachineOpcode())		if (!Load0->isMachineOpcode() \|\| !Load1->isMachineOpcode())
return false;		return false;

▲ Show 20 Lines • Show All 7,775 Lines • Show Last 20 Lines

llvm/lib/Target/AMDGPU/VOP1Instructions.td

Show First 20 Lines • Show All 197 Lines • ▼ Show 20 Lines	def V_READFIRSTLANE_B32 :
bits<9> src0;		bits<9> src0;

let Inst{8-0} = src0;		let Inst{8-0} = src0;
let Inst{16-9} = 0x2;		let Inst{16-9} = 0x2;
let Inst{24-17} = vdst;		let Inst{24-17} = vdst;
let Inst{31-25} = 0x3f; //encoding		let Inst{31-25} = 0x3f; //encoding
}		}

		let isReMaterializable = 1 in {
let SchedRW = [WriteDoubleCvt] in {		let SchedRW = [WriteDoubleCvt] in {
// OMod clears exceptions when set in this instruction		// OMod clears exceptions when set in this instruction
defm V_CVT_I32_F64 : VOP1Inst <"v_cvt_i32_f64", VOP_I32_F64_SPECIAL_OMOD, fp_to_sint>;		defm V_CVT_I32_F64 : VOP1Inst <"v_cvt_i32_f64", VOP_I32_F64_SPECIAL_OMOD, fp_to_sint>;

let mayRaiseFPException = 0 in {		let mayRaiseFPException = 0 in {
defm V_CVT_F64_I32 : VOP1Inst <"v_cvt_f64_i32", VOP1_F64_I32, sint_to_fp>;		defm V_CVT_F64_I32 : VOP1Inst <"v_cvt_f64_i32", VOP1_F64_I32, sint_to_fp>;
}		}

Show All 27 Lines
defm V_CVT_F32_F16 : VOP1Inst <"v_cvt_f32_f16", VOP_F32_F16, fpextend>;		defm V_CVT_F32_F16 : VOP1Inst <"v_cvt_f32_f16", VOP_F32_F16, fpextend>;

let ReadsModeReg = 0, mayRaiseFPException = 0 in {		let ReadsModeReg = 0, mayRaiseFPException = 0 in {
defm V_CVT_RPI_I32_F32 : VOP1Inst <"v_cvt_rpi_i32_f32", VOP_I32_F32, cvt_rpi_i32_f32>;		defm V_CVT_RPI_I32_F32 : VOP1Inst <"v_cvt_rpi_i32_f32", VOP_I32_F32, cvt_rpi_i32_f32>;
defm V_CVT_FLR_I32_F32 : VOP1Inst <"v_cvt_flr_i32_f32", VOP_I32_F32, cvt_flr_i32_f32>;		defm V_CVT_FLR_I32_F32 : VOP1Inst <"v_cvt_flr_i32_f32", VOP_I32_F32, cvt_flr_i32_f32>;
defm V_CVT_OFF_F32_I4 : VOP1Inst <"v_cvt_off_f32_i4", VOP1_F32_I32>;		defm V_CVT_OFF_F32_I4 : VOP1Inst <"v_cvt_off_f32_i4", VOP1_F32_I32>;
} // End ReadsModeReg = 0, mayRaiseFPException = 0		} // End ReadsModeReg = 0, mayRaiseFPException = 0
} // End SchedRW = [WriteFloatCvt]		} // End SchedRW = [WriteFloatCvt]
		} // End isReMaterializable = 1

let ReadsModeReg = 0, mayRaiseFPException = 0 in {		let ReadsModeReg = 0, mayRaiseFPException = 0 in {
defm V_CVT_F32_UBYTE0 : VOP1Inst <"v_cvt_f32_ubyte0", VOP1_F32_I32, AMDGPUcvt_f32_ubyte0>;		defm V_CVT_F32_UBYTE0 : VOP1Inst <"v_cvt_f32_ubyte0", VOP1_F32_I32, AMDGPUcvt_f32_ubyte0>;
defm V_CVT_F32_UBYTE1 : VOP1Inst <"v_cvt_f32_ubyte1", VOP1_F32_I32, AMDGPUcvt_f32_ubyte1>;		defm V_CVT_F32_UBYTE1 : VOP1Inst <"v_cvt_f32_ubyte1", VOP1_F32_I32, AMDGPUcvt_f32_ubyte1>;
defm V_CVT_F32_UBYTE2 : VOP1Inst <"v_cvt_f32_ubyte2", VOP1_F32_I32, AMDGPUcvt_f32_ubyte2>;		defm V_CVT_F32_UBYTE2 : VOP1Inst <"v_cvt_f32_ubyte2", VOP1_F32_I32, AMDGPUcvt_f32_ubyte2>;
defm V_CVT_F32_UBYTE3 : VOP1Inst <"v_cvt_f32_ubyte3", VOP1_F32_I32, AMDGPUcvt_f32_ubyte3>;		defm V_CVT_F32_UBYTE3 : VOP1Inst <"v_cvt_f32_ubyte3", VOP1_F32_I32, AMDGPUcvt_f32_ubyte3>;
} // ReadsModeReg = 0, mayRaiseFPException = 0		} // ReadsModeReg = 0, mayRaiseFPException = 0

▲ Show 20 Lines • Show All 692 Lines • Show Last 20 Lines

llvm/test/CodeGen/AMDGPU/remat-vop.mir

# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py		# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
# RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx908 -verify-machineinstrs --stress-regalloc=2 -start-before=greedy -stop-after=virtregrewriter -o - %s \| FileCheck -check-prefix=GCN %s		# RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx90a -verify-machineinstrs --stress-regalloc=2 -start-before=greedy -stop-after=virtregrewriter -o - %s \| FileCheck -check-prefix=GCN %s

---		---
name: test_remat_v_mov_b32_e32		name: test_remat_v_mov_b32_e32
tracksRegLiveness: true		tracksRegLiveness: true
body: \|		body: \|
bb.0:		bb.0:
; GCN-LABEL: name: test_remat_v_mov_b32_e32		; GCN-LABEL: name: test_remat_v_mov_b32_e32
; GCN: renamable $vgpr0 = V_MOV_B32_e32 1, implicit $exec		; GCN: renamable $vgpr0 = V_MOV_B32_e32 1, implicit $exec
▲ Show 20 Lines • Show All 57 Lines • ▼ Show 20 Lines	bb.0:
%1:vgpr_32 = V_MOV_B32_e64 2, implicit $exec		%1:vgpr_32 = V_MOV_B32_e64 2, implicit $exec
%2:vgpr_32 = V_MOV_B32_e64 3, implicit $exec		%2:vgpr_32 = V_MOV_B32_e64 3, implicit $exec
S_NOP 0, implicit %0		S_NOP 0, implicit %0
S_NOP 0, implicit %1		S_NOP 0, implicit %1
S_NOP 0, implicit %2		S_NOP 0, implicit %2
S_ENDPGM 0		S_ENDPGM 0
...		...
---		---
		name: test_no_remat_v_mov_b32_dpp
		tracksRegLiveness: true
		machineFunctionInfo:
		stackPtrOffsetReg: $sgpr32
		body: \|
		bb.0:
		; GCN-LABEL: name: test_no_remat_v_mov_b32_dpp
		; GCN: renamable $vgpr0 = V_MOV_B32_dpp undef $vgpr0, undef $vgpr0, 1, 15, 15, 1, implicit $exec
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.1, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.1, addrspace 5)
		; GCN: renamable $vgpr1 = V_MOV_B32_dpp undef $vgpr1, undef $vgpr0, 1, 15, 15, 1, implicit $exec
		; GCN: renamable $vgpr0 = V_MOV_B32_dpp undef $vgpr0, undef $vgpr0, 1, 15, 15, 1, implicit $exec
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.0, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.0, addrspace 5)
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.1, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.1, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.0, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.0, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_MOV_B32_dpp undef %1:vgpr_32, undef %0:vgpr_32, 1, 15, 15, 1, implicit $exec
		%2:vgpr_32 = V_MOV_B32_dpp undef %2:vgpr_32, undef %0:vgpr_32, 1, 15, 15, 1, implicit $exec
		%3:vgpr_32 = V_MOV_B32_dpp undef %3:vgpr_32, undef %0:vgpr_32, 1, 15, 15, 1, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
name: test_remat_v_accvgpr_read_b32		name: test_remat_v_accvgpr_read_b32
tracksRegLiveness: true		tracksRegLiveness: true
body: \|		body: \|
bb.0:		bb.0:
; GCN-LABEL: name: test_remat_v_accvgpr_read_b32		; GCN-LABEL: name: test_remat_v_accvgpr_read_b32
; GCN: renamable $vgpr0 = V_ACCVGPR_READ_B32_e64 undef $agpr0, implicit $exec		; GCN: renamable $vgpr0 = V_ACCVGPR_READ_B32_e64 undef $agpr0, implicit $exec
; GCN: renamable $vgpr1 = V_ACCVGPR_READ_B32_e64 undef $agpr0, implicit $exec		; GCN: renamable $vgpr1 = V_ACCVGPR_READ_B32_e64 undef $agpr0, implicit $exec
; GCN: S_NOP 0, implicit killed renamable $vgpr0		; GCN: S_NOP 0, implicit killed renamable $vgpr0
Show All 32 Lines
...		...
---		---
name: test_remat_v_mov_b64_pseudo		name: test_remat_v_mov_b64_pseudo
tracksRegLiveness: true		tracksRegLiveness: true
body: \|		body: \|
bb.0:		bb.0:
; GCN-LABEL: name: test_remat_v_mov_b64_pseudo		; GCN-LABEL: name: test_remat_v_mov_b64_pseudo
; GCN: renamable $vgpr0_vgpr1 = V_MOV_B64_PSEUDO 1, implicit $exec		; GCN: renamable $vgpr0_vgpr1 = V_MOV_B64_PSEUDO 1, implicit $exec
		; GCN: renamable $vgpr2_vgpr3 = V_MOV_B64_PSEUDO 2, implicit $exec
; GCN: S_NOP 0, implicit killed renamable $vgpr0_vgpr1		; GCN: S_NOP 0, implicit killed renamable $vgpr0_vgpr1
; GCN: renamable $vgpr0_vgpr1 = V_MOV_B64_PSEUDO 2, implicit $exec		; GCN: S_NOP 0, implicit killed renamable $vgpr2_vgpr3
; GCN: S_NOP 0, implicit killed renamable $vgpr0_vgpr1
; GCN: renamable $vgpr0_vgpr1 = V_MOV_B64_PSEUDO 3, implicit $exec		; GCN: renamable $vgpr0_vgpr1 = V_MOV_B64_PSEUDO 3, implicit $exec
; GCN: S_NOP 0, implicit killed renamable $vgpr0_vgpr1		; GCN: S_NOP 0, implicit killed renamable $vgpr0_vgpr1
; GCN: S_ENDPGM 0		; GCN: S_ENDPGM 0
%0:vreg_64 = V_MOV_B64_PSEUDO 1, implicit $exec		%0:vreg_64_align2 = V_MOV_B64_PSEUDO 1, implicit $exec
%1:vreg_64 = V_MOV_B64_PSEUDO 2, implicit $exec		%1:vreg_64_align2 = V_MOV_B64_PSEUDO 2, implicit $exec
%2:vreg_64 = V_MOV_B64_PSEUDO 3, implicit $exec		%2:vreg_64_align2 = V_MOV_B64_PSEUDO 3, implicit $exec
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_i32_f64_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_i32_f64_e32
		; GCN: dead renamable $vgpr0 = V_CVT_I32_F64_e32 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = V_CVT_I32_F64_e32 2, implicit $exec, implicit $mode
		; GCN: dead renamable $vgpr0 = V_CVT_I32_F64_e32 3, implicit $exec, implicit $mode
		; GCN: renamable $vgpr0 = V_CVT_I32_F64_e32 1, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_I32_F64_e32 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%0:vgpr_32 = V_CVT_I32_F64_e32 1, implicit $exec, implicit $mode
		%1:vgpr_32 = V_CVT_I32_F64_e32 2, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_I32_F64_e32 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		# Cannot rematerialize if MODE register is modified anywhere
		name: test_no_remat_v_cvt_i32_f64_e32_mode_def
		tracksRegLiveness: true
		machineFunctionInfo:
		stackPtrOffsetReg: $sgpr32
		body: \|
		bb.0:
		; GCN-LABEL: name: test_no_remat_v_cvt_i32_f64_e32_mode_def
		; GCN: $mode = IMPLICIT_DEF
		; GCN: renamable $vgpr0 = V_CVT_I32_F64_e32 1, implicit $exec, implicit $mode
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.1, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.1, addrspace 5)
		; GCN: renamable $vgpr1 = V_CVT_I32_F64_e32 2, implicit $exec, implicit $mode
		; GCN: renamable $vgpr0 = V_CVT_I32_F64_e32 3, implicit $exec, implicit $mode
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.0, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.0, addrspace 5)
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.1, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.1, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.0, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.0, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		$mode = IMPLICIT_DEF
		%0:vgpr_32 = V_CVT_I32_F64_e32 1, implicit $exec, implicit $mode
		%1:vgpr_32 = V_CVT_I32_F64_e32 2, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_I32_F64_e32 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_i32_f64_e64
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_i32_f64_e64
		; GCN: dead renamable $vgpr0 = V_CVT_I32_F64_e64 0, 1, 0, 0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = V_CVT_I32_F64_e64 0, 2, 0, 0, implicit $exec, implicit $mode
		; GCN: dead renamable $vgpr0 = V_CVT_I32_F64_e64 0, 3, 0, 0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr0 = V_CVT_I32_F64_e64 0, 1, 0, 0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_I32_F64_e64 0, 3, 0, 0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%0:vgpr_32 = V_CVT_I32_F64_e64 0, 1, 0, 0, implicit $exec, implicit $mode
		%1:vgpr_32 = V_CVT_I32_F64_e64 0, 2, 0, 0, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_I32_F64_e64 0, 3, 0, 0, implicit $exec, implicit $mode
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_i32_f64_e64_undef
		tracksRegLiveness: true
		machineFunctionInfo:
		stackPtrOffsetReg: $sgpr32
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_i32_f64_e64_undef
		; GCN: dead renamable $vgpr0 = V_CVT_I32_F64_e64 0, undef $vgpr0_vgpr1, 0, 0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = V_CVT_I32_F64_e64 0, undef $vgpr0_vgpr1, 0, 0, implicit $exec, implicit $mode
		; GCN: dead renamable $vgpr0 = V_CVT_I32_F64_e64 0, undef $vgpr0_vgpr1, 0, 0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr0 = V_CVT_I32_F64_e64 0, undef $vgpr0_vgpr1, 0, 0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_I32_F64_e64 0, undef $vgpr0_vgpr1, 0, 0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_CVT_I32_F64_e64 0, undef %0:vreg_64, 0, 0, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_I32_F64_e64 0, undef %0:vreg_64, 0, 0, implicit $exec, implicit $mode
		%3:vgpr_32 = V_CVT_I32_F64_e64 0, undef %0:vreg_64, 0, 0, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		name: test_no_remat_v_cvt_i32_f64_dpp
		tracksRegLiveness: true
		machineFunctionInfo:
		stackPtrOffsetReg: $sgpr32
		body: \|
		bb.0:
		; GCN-LABEL: name: test_no_remat_v_cvt_i32_f64_dpp
		; GCN: renamable $vgpr0 = V_CVT_I32_F64_dpp undef $vgpr0, 0, undef $vgpr0_vgpr1, 336, 0, 0, 0, implicit $exec, implicit $mode
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.1, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.1, addrspace 5)
		; GCN: renamable $vgpr1 = V_CVT_I32_F64_dpp undef $vgpr1, 0, undef $vgpr0_vgpr1, 336, 0, 0, 0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr0 = V_CVT_I32_F64_dpp undef $vgpr0, 0, undef $vgpr0_vgpr1, 336, 0, 0, 0, implicit $exec, implicit $mode
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.0, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.0, addrspace 5)
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.1, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.1, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.0, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.0, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_CVT_I32_F64_dpp undef %1:vgpr_32, 0, undef %0:vreg_64_align2, 336, 0, 0, 0, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_I32_F64_dpp undef %2:vgpr_32, 0, undef %0:vreg_64_align2, 336, 0, 0, 0, implicit $exec, implicit $mode
		%3:vgpr_32 = V_CVT_I32_F64_dpp undef %3:vgpr_32, 0, undef %0:vreg_64_align2, 336, 0, 0, 0, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		name: test_no_remat_v_cvt_i32_f64_e32_imp_def
		tracksRegLiveness: true
		machineFunctionInfo:
		stackPtrOffsetReg: $sgpr32
		body: \|
		bb.0:
		; GCN-LABEL: name: test_no_remat_v_cvt_i32_f64_e32_imp_def
		; GCN: renamable $vgpr0 = V_CVT_I32_F64_e32 1, implicit $exec, implicit $mode, implicit-def $m0
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.1, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.1, addrspace 5)
		; GCN: renamable $vgpr1 = V_CVT_I32_F64_e32 2, implicit $exec, implicit $mode, implicit-def $m0
		; GCN: renamable $vgpr0 = V_CVT_I32_F64_e32 3, implicit $exec, implicit $mode, implicit-def $m0
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.0, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.0, addrspace 5)
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.1, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.1, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.0, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.0, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%0:vgpr_32 = V_CVT_I32_F64_e32 1, implicit $exec, implicit $mode, implicit-def $m0
		%1:vgpr_32 = V_CVT_I32_F64_e32 2, implicit $exec, implicit $mode, implicit-def $m0
		%2:vgpr_32 = V_CVT_I32_F64_e32 3, implicit $exec, implicit $mode, implicit-def $m0
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_no_remat_v_cvt_i32_f64_e32_imp_use
		tracksRegLiveness: true
		machineFunctionInfo:
		stackPtrOffsetReg: $sgpr32
		body: \|
		bb.0:
		; GCN-LABEL: name: test_no_remat_v_cvt_i32_f64_e32_imp_use
		; GCN: renamable $vgpr0 = V_CVT_I32_F64_e32 1, implicit $exec, implicit $mode, implicit $m0
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.1, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.1, addrspace 5)
		; GCN: renamable $vgpr1 = V_CVT_I32_F64_e32 2, implicit $exec, implicit $mode, implicit $m0
		; GCN: renamable $vgpr0 = V_CVT_I32_F64_e32 3, implicit $exec, implicit $mode, implicit $m0
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.0, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.0, addrspace 5)
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.1, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.1, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.0, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.0, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%0:vgpr_32 = V_CVT_I32_F64_e32 1, implicit $exec, implicit $mode, implicit $m0
		%1:vgpr_32 = V_CVT_I32_F64_e32 2, implicit $exec, implicit $mode, implicit $m0
		%2:vgpr_32 = V_CVT_I32_F64_e32 3, implicit $exec, implicit $mode, implicit $m0
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_f64_i32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_f64_i32_e32
		; GCN: renamable $vgpr0_vgpr1 = V_CVT_F64_I32_e32 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr2_vgpr3 = V_CVT_F64_I32_e32 2, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0_vgpr1
		; GCN: S_NOP 0, implicit killed renamable $vgpr2_vgpr3
		; GCN: renamable $vgpr0_vgpr1 = V_CVT_F64_I32_e32 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0_vgpr1
		; GCN: S_ENDPGM 0
		%0:vreg_64_align2 = V_CVT_F64_I32_e32 1, implicit $exec, implicit $mode
		%1:vreg_64_align2 = V_CVT_F64_I32_e32 2, implicit $exec, implicit $mode
		%2:vreg_64_align2 = V_CVT_F64_I32_e32 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_f32_f64_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_f32_f64_e32
		; GCN: dead renamable $vgpr0 = V_CVT_F32_F64_e32 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = V_CVT_F32_F64_e32 2, implicit $exec, implicit $mode
		; GCN: dead renamable $vgpr0 = V_CVT_F32_F64_e32 3, implicit $exec, implicit $mode
		; GCN: renamable $vgpr0 = V_CVT_F32_F64_e32 1, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_F32_F64_e32 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%0:vgpr_32 = V_CVT_F32_F64_e32 1, implicit $exec, implicit $mode
		%1:vgpr_32 = V_CVT_F32_F64_e32 2, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_F32_F64_e32 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_f64_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_f64_f32_e32
		; GCN: dead renamable $vgpr0_vgpr1 = V_CVT_F64_F32_e32 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr2_vgpr3 = V_CVT_F64_F32_e32 2, implicit $exec, implicit $mode
		; GCN: dead renamable $vgpr0_vgpr1 = V_CVT_F64_F32_e32 3, implicit $exec, implicit $mode
		; GCN: renamable $vgpr0_vgpr1 = V_CVT_F64_F32_e32 1, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0_vgpr1
		; GCN: S_NOP 0, implicit killed renamable $vgpr2_vgpr3
		; GCN: renamable $vgpr0_vgpr1 = V_CVT_F64_F32_e32 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0_vgpr1
		; GCN: S_ENDPGM 0
		%0:vreg_64_align2 = V_CVT_F64_F32_e32 1, implicit $exec, implicit $mode
		%1:vreg_64_align2 = V_CVT_F64_F32_e32 2, implicit $exec, implicit $mode
		%2:vreg_64_align2 = V_CVT_F64_F32_e32 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_u32_f64_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_u32_f64_e32
		; GCN: dead renamable $vgpr0 = V_CVT_U32_F64_e32 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = V_CVT_U32_F64_e32 2, implicit $exec, implicit $mode
		; GCN: dead renamable $vgpr0 = V_CVT_U32_F64_e32 3, implicit $exec, implicit $mode
		; GCN: renamable $vgpr0 = V_CVT_U32_F64_e32 1, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_U32_F64_e32 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%0:vgpr_32 = V_CVT_U32_F64_e32 1, implicit $exec, implicit $mode
		%1:vgpr_32 = V_CVT_U32_F64_e32 2, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_U32_F64_e32 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_f64_u32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_f64_u32_e32
		; GCN: renamable $vgpr0_vgpr1 = V_CVT_F64_U32_e32 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr2_vgpr3 = V_CVT_F64_U32_e32 2, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0_vgpr1
		; GCN: S_NOP 0, implicit killed renamable $vgpr2_vgpr3
		; GCN: renamable $vgpr0_vgpr1 = V_CVT_F64_U32_e32 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0_vgpr1
		; GCN: S_ENDPGM 0
		%0:vreg_64_align2 = V_CVT_F64_U32_e32 1, implicit $exec, implicit $mode
		%1:vreg_64_align2 = V_CVT_F64_U32_e32 2, implicit $exec, implicit $mode
		%2:vreg_64_align2 = V_CVT_F64_U32_e32 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_f32_i32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_f32_i32_e32
		; GCN: renamable $vgpr0 = V_CVT_F32_I32_e32 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = V_CVT_F32_I32_e32 2, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_F32_I32_e32 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%0:vgpr_32 = V_CVT_F32_I32_e32 1, implicit $exec, implicit $mode
		%1:vgpr_32 = V_CVT_F32_I32_e32 2, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_F32_I32_e32 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_f32_i32_sdwa
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_f32_i32_sdwa
		; GCN: renamable $vgpr0 = V_CVT_F32_I32_sdwa 0, undef $vgpr0, 0, 0, 0, 0, 0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = V_CVT_F32_I32_sdwa 0, undef $vgpr0, 0, 0, 0, 0, 0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_F32_I32_sdwa 0, undef $vgpr0, 0, 0, 0, 0, 0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_CVT_F32_I32_sdwa 0, undef %0:vgpr_32, 0, 0, 0, 0, 0, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_F32_I32_sdwa 0, undef %0:vgpr_32, 0, 0, 0, 0, 0, implicit $exec, implicit $mode
		%3:vgpr_32 = V_CVT_F32_I32_sdwa 0, undef %0:vgpr_32, 0, 0, 0, 0, 0, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		# SDWA instruction with UNUSED_PRESERVE cannot be rematerialized due to partial
		# dst write. This is handled because it always has a tied-def implicit operand.
		name: test_no_remat_v_cvt_f32_i32_sdwa_dst_unused_preserve
		tracksRegLiveness: true
		machineFunctionInfo:
		stackPtrOffsetReg: $sgpr32
		body: \|
		bb.0:
		; GCN-LABEL: name: test_no_remat_v_cvt_f32_i32_sdwa_dst_unused_preserve
		; GCN: renamable $vgpr0 = V_CVT_F32_I32_sdwa 0, undef $vgpr0, 0, 0, 0, 2, 0, implicit $exec, implicit $mode, implicit undef $vgpr0(tied-def 0)
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.1, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.1, addrspace 5)
		; GCN: renamable $vgpr1 = V_CVT_F32_I32_sdwa 0, undef $vgpr0, 0, 0, 0, 2, 0, implicit $exec, implicit $mode, implicit undef $vgpr1(tied-def 0)
		; GCN: renamable $vgpr0 = V_CVT_F32_I32_sdwa 0, undef $vgpr0, 0, 0, 0, 2, 0, implicit $exec, implicit $mode, implicit undef $vgpr0(tied-def 0)
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.0, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.0, addrspace 5)
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.1, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.1, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.0, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.0, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_CVT_F32_I32_sdwa 0, undef %0:vgpr_32, 0, 0, 0, 2, 0, implicit $exec, implicit $mode, implicit undef %1:vgpr_32(tied-def 0)
		%2:vgpr_32 = V_CVT_F32_I32_sdwa 0, undef %0:vgpr_32, 0, 0, 0, 2, 0, implicit $exec, implicit $mode, implicit undef %2:vgpr_32(tied-def 0)
		%3:vgpr_32 = V_CVT_F32_I32_sdwa 0, undef %0:vgpr_32, 0, 0, 0, 2, 0, implicit $exec, implicit $mode, implicit undef %3:vgpr_32(tied-def 0)
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_f32_u32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_f32_u32_e32
		; GCN: renamable $vgpr0 = V_CVT_F32_U32_e32 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = V_CVT_F32_U32_e32 2, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_F32_U32_e32 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%0:vgpr_32 = V_CVT_F32_U32_e32 1, implicit $exec, implicit $mode
		%1:vgpr_32 = V_CVT_F32_U32_e32 2, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_F32_U32_e32 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_u32_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_u32_f32_e32
		; GCN: dead renamable $vgpr0 = V_CVT_U32_F32_e32 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = V_CVT_U32_F32_e32 2, implicit $exec, implicit $mode
		; GCN: dead renamable $vgpr0 = V_CVT_U32_F32_e32 3, implicit $exec, implicit $mode
		; GCN: renamable $vgpr0 = V_CVT_U32_F32_e32 1, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_U32_F32_e32 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%0:vgpr_32 = V_CVT_U32_F32_e32 1, implicit $exec, implicit $mode
		%1:vgpr_32 = V_CVT_U32_F32_e32 2, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_U32_F32_e32 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_i32_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_i32_f32_e32
		; GCN: dead renamable $vgpr0 = V_CVT_I32_F32_e32 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = V_CVT_I32_F32_e32 2, implicit $exec, implicit $mode
		; GCN: dead renamable $vgpr0 = V_CVT_I32_F32_e32 3, implicit $exec, implicit $mode
		; GCN: renamable $vgpr0 = V_CVT_I32_F32_e32 1, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_I32_F32_e32 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%0:vgpr_32 = V_CVT_I32_F32_e32 1, implicit $exec, implicit $mode
		%1:vgpr_32 = V_CVT_I32_F32_e32 2, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_I32_F32_e32 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_f16_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_f16_f32_e32
		; GCN: dead renamable $vgpr0 = V_CVT_F16_F32_e32 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = V_CVT_F16_F32_e32 2, implicit $exec, implicit $mode
		; GCN: dead renamable $vgpr0 = V_CVT_F16_F32_e32 3, implicit $exec, implicit $mode
		; GCN: renamable $vgpr0 = V_CVT_F16_F32_e32 1, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_F16_F32_e32 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%0:vgpr_32 = V_CVT_F16_F32_e32 1, implicit $exec, implicit $mode
		%1:vgpr_32 = V_CVT_F16_F32_e32 2, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_F16_F32_e32 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_f32_f16_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_f32_f16_e32
		; GCN: dead renamable $vgpr0 = V_CVT_F32_F16_e32 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = V_CVT_F32_F16_e32 2, implicit $exec, implicit $mode
		; GCN: dead renamable $vgpr0 = V_CVT_F32_F16_e32 3, implicit $exec, implicit $mode
		; GCN: renamable $vgpr0 = V_CVT_F32_F16_e32 1, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_F32_F16_e32 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%0:vgpr_32 = V_CVT_F32_F16_e32 1, implicit $exec, implicit $mode
		%1:vgpr_32 = V_CVT_F32_F16_e32 2, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_F32_F16_e32 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_rpi_i32_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_rpi_i32_f32_e32
		; GCN: renamable $vgpr0 = V_CVT_RPI_I32_F32_e32 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = V_CVT_RPI_I32_F32_e32 2, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_RPI_I32_F32_e32 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%0:vgpr_32 = V_CVT_RPI_I32_F32_e32 1, implicit $exec, implicit $mode
		%1:vgpr_32 = V_CVT_RPI_I32_F32_e32 2, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_RPI_I32_F32_e32 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_flr_i32_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_flr_i32_f32_e32
		; GCN: renamable $vgpr0 = V_CVT_FLR_I32_F32_e32 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = V_CVT_FLR_I32_F32_e32 2, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_FLR_I32_F32_e32 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%0:vgpr_32 = V_CVT_FLR_I32_F32_e32 1, implicit $exec, implicit $mode
		%1:vgpr_32 = V_CVT_FLR_I32_F32_e32 2, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_FLR_I32_F32_e32 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %0
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cvt_off_f32_i4_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_off_f32_i4_e32
		; GCN: renamable $vgpr0 = V_CVT_OFF_F32_I4_e32 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = V_CVT_OFF_F32_I4_e32 2, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_OFF_F32_I4_e32 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%0:vgpr_32 = V_CVT_OFF_F32_I4_e32 1, implicit $exec, implicit $mode
		%1:vgpr_32 = V_CVT_OFF_F32_I4_e32 2, implicit $exec, implicit $mode
		%2:vgpr_32 = V_CVT_OFF_F32_I4_e32 3, implicit $exec, implicit $mode
S_NOP 0, implicit %0		S_NOP 0, implicit %0
S_NOP 0, implicit %1		S_NOP 0, implicit %1
S_NOP 0, implicit %2		S_NOP 0, implicit %2
S_ENDPGM 0		S_ENDPGM 0
...		...
		arsenmUnsubmitted Done Reply Inline Actions Can you add a test with a mode def that blocks rematerialization? arsenm: Can you add a test with a mode def that blocks rematerialization?
		rampitecAuthorUnsubmitted Done Reply Inline Actions It is exist in `remat-vop.mir`, test `test_no_remat_v_cvt_i32_f64_e32_mode_def`. rampitec: It is exist in `remat-vop.mir`, test `test_no_remat_v_cvt_i32_f64_e32_mode_def`.

This is an archive of the discontinued LLVM Phabricator instance.

[AMDGPU] Make some VOP1 instructions rematerializable
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 358174

llvm/lib/Target/AMDGPU/SIInstrInfo.cpp

llvm/lib/Target/AMDGPU/VOP1Instructions.td

llvm/test/CodeGen/AMDGPU/remat-vop.mir

This is an archive of the discontinued LLVM Phabricator instance.

[AMDGPU] Make some VOP1 instructions rematerializableClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 358174

llvm/lib/Target/AMDGPU/SIInstrInfo.cpp

llvm/lib/Target/AMDGPU/VOP1Instructions.td

llvm/test/CodeGen/AMDGPU/remat-vop.mir

[AMDGPU] Make some VOP1 instructions rematerializable
ClosedPublic