Diff 359162

llvm/lib/Target/AMDGPU/SIInstrInfo.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 101 Lines • ▼ Show 20 Lines	static bool nodesHaveSameOperandValue(SDNode N0, SDNode N1, unsigned OpName) {
--Op0Idx;		--Op0Idx;
--Op1Idx;		--Op1Idx;

return N0->getOperand(Op0Idx) == N1->getOperand(Op1Idx);		return N0->getOperand(Op0Idx) == N1->getOperand(Op1Idx);
}		}

bool SIInstrInfo::isReallyTriviallyReMaterializable(const MachineInstr &MI,		bool SIInstrInfo::isReallyTriviallyReMaterializable(const MachineInstr &MI,
AAResults *AA) const {		AAResults *AA) const {
if (isVOP1(MI) \|\| isVOP3(MI) \|\| isSDWA(MI)) {		if (isVOP1(MI) \|\| isVOP2(MI) \|\| isVOP3(MI) \|\| isSDWA(MI)) {
// Normally VALU use of exec would block the rematerialization, but that		// Normally VALU use of exec would block the rematerialization, but that
// is OK in this case to have an implicit exec read as all VALU do.		// is OK in this case to have an implicit exec read as all VALU do.
// We really want all of the generic logic for this except for this.		// We really want all of the generic logic for this except for this.

// Another potential implicit use is mode register. The core logic of		// Another potential implicit use is mode register. The core logic of
// the RA will not attempt rematerialization if mode is set anywhere		// the RA will not attempt rematerialization if mode is set anywhere
// in the function, otherwise it is safe since mode is not changed.		// in the function, otherwise it is safe since mode is not changed.
return !MI.hasImplicitDef() &&		return !MI.hasImplicitDef() &&
▲ Show 20 Lines • Show All 7,791 Lines • Show Last 20 Lines

llvm/lib/Target/AMDGPU/VOP2Instructions.td

Show First 20 Lines • Show All 237 Lines • ▼ Show 20 Lines	let Uses = !if(useSGPRInput, [VCC, EXEC], [EXEC]) in {
let AsmMatchConverter = "cvtSdwaVOP2e";		let AsmMatchConverter = "cvtSdwaVOP2e";
}		}

foreach _ = BoolToList<P.HasExtDPP>.ret in		foreach _ = BoolToList<P.HasExtDPP>.ret in
def _dpp : VOP2_DPP_Pseudo <opName, P>;		def _dpp : VOP2_DPP_Pseudo <opName, P>;
}		}

def _e64 : VOP3_Pseudo <opName, P, getVOP2Pat64<node, P>.ret>,		def _e64 : VOP3_Pseudo <opName, P, getVOP2Pat64<node, P>.ret>,
Commutable_REV<revOp#"_e64", !eq(revOp, opName)>;		Commutable_REV<revOp#"_e64", !eq(revOp, opName)> {
		let isReMaterializable = 1;
		}
}		}
}		}

class VOP2eInstAlias <VOP2_Pseudo ps, Instruction inst, string opnd = ""> :		class VOP2eInstAlias <VOP2_Pseudo ps, Instruction inst, string opnd = ""> :
InstAlias <ps.OpName#" "#ps.Pfl.Asm32#", "#opnd,		InstAlias <ps.OpName#" "#ps.Pfl.Asm32#", "#opnd,
(inst ps.Pfl.DstRC:$vdst, ps.Pfl.Src0RC32:$src0,		(inst ps.Pfl.DstRC:$vdst, ps.Pfl.Src0RC32:$src0,
ps.Pfl.Src1RC32:$src1)>, PredicateControl;		ps.Pfl.Src1RC32:$src1)>, PredicateControl;

▲ Show 20 Lines • Show All 223 Lines • ▼ Show 20 Lines	def VOP_WRITELANE : VOPProfile<[i32, i32, i32, i32]> {
let HasExtSDWA9 = 0;		let HasExtSDWA9 = 0;
}		}

//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//
// VOP2 Instructions		// VOP2 Instructions
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//

defm V_CNDMASK_B32 : VOP2eInst <"v_cndmask_b32", VOP2e_I32_I32_I32_I1>;		defm V_CNDMASK_B32 : VOP2eInst <"v_cndmask_b32", VOP2e_I32_I32_I32_I1>;
let SubtargetPredicate = HasMadMacF32Insts in		let SubtargetPredicate = HasMadMacF32Insts, isReMaterializable = 1 in
def V_MADMK_F32 : VOP2_Pseudo <"v_madmk_f32", VOP_MADMK_F32, []>;		def V_MADMK_F32 : VOP2_Pseudo <"v_madmk_f32", VOP_MADMK_F32, []>;

let isCommutable = 1 in {		let isCommutable = 1 in {
		let isReMaterializable = 1 in {
defm V_ADD_F32 : VOP2Inst <"v_add_f32", VOP_F32_F32_F32, any_fadd>;		defm V_ADD_F32 : VOP2Inst <"v_add_f32", VOP_F32_F32_F32, any_fadd>;
defm V_SUB_F32 : VOP2Inst <"v_sub_f32", VOP_F32_F32_F32, any_fsub>;		defm V_SUB_F32 : VOP2Inst <"v_sub_f32", VOP_F32_F32_F32, any_fsub>;
defm V_SUBREV_F32 : VOP2Inst <"v_subrev_f32", VOP_F32_F32_F32, null_frag, "v_sub_f32">;		defm V_SUBREV_F32 : VOP2Inst <"v_subrev_f32", VOP_F32_F32_F32, null_frag, "v_sub_f32">;
defm V_MUL_LEGACY_F32 : VOP2Inst <"v_mul_legacy_f32", VOP_F32_F32_F32, AMDGPUfmul_legacy>;		defm V_MUL_LEGACY_F32 : VOP2Inst <"v_mul_legacy_f32", VOP_F32_F32_F32, AMDGPUfmul_legacy>;
defm V_MUL_F32 : VOP2Inst <"v_mul_f32", VOP_F32_F32_F32, any_fmul>;		defm V_MUL_F32 : VOP2Inst <"v_mul_f32", VOP_F32_F32_F32, any_fmul>;
defm V_MUL_I32_I24 : VOP2Inst <"v_mul_i32_i24", VOP_I32_I32_I32_ARITH, AMDGPUmul_i24>;		defm V_MUL_I32_I24 : VOP2Inst <"v_mul_i32_i24", VOP_I32_I32_I32_ARITH, AMDGPUmul_i24>;
defm V_MUL_HI_I32_I24 : VOP2Inst <"v_mul_hi_i32_i24", VOP_PAT_GEN<VOP_I32_I32_I32, 2>, AMDGPUmulhi_i24>;		defm V_MUL_HI_I32_I24 : VOP2Inst <"v_mul_hi_i32_i24", VOP_PAT_GEN<VOP_I32_I32_I32, 2>, AMDGPUmulhi_i24>;
defm V_MUL_U32_U24 : VOP2Inst <"v_mul_u32_u24", VOP_I32_I32_I32_ARITH, AMDGPUmul_u24>;		defm V_MUL_U32_U24 : VOP2Inst <"v_mul_u32_u24", VOP_I32_I32_I32_ARITH, AMDGPUmul_u24>;
defm V_MUL_HI_U32_U24 : VOP2Inst <"v_mul_hi_u32_u24", VOP_PAT_GEN<VOP_I32_I32_I32, 2>, AMDGPUmulhi_u24>;		defm V_MUL_HI_U32_U24 : VOP2Inst <"v_mul_hi_u32_u24", VOP_PAT_GEN<VOP_I32_I32_I32, 2>, AMDGPUmulhi_u24>;
defm V_MIN_F32 : VOP2Inst <"v_min_f32", VOP_F32_F32_F32, fminnum_like>;		defm V_MIN_F32 : VOP2Inst <"v_min_f32", VOP_F32_F32_F32, fminnum_like>;
defm V_MAX_F32 : VOP2Inst <"v_max_f32", VOP_F32_F32_F32, fmaxnum_like>;		defm V_MAX_F32 : VOP2Inst <"v_max_f32", VOP_F32_F32_F32, fmaxnum_like>;
defm V_MIN_I32 : VOP2Inst <"v_min_i32", VOP_PAT_GEN<VOP_I32_I32_I32>, smin>;		defm V_MIN_I32 : VOP2Inst <"v_min_i32", VOP_PAT_GEN<VOP_I32_I32_I32>, smin>;
defm V_MAX_I32 : VOP2Inst <"v_max_i32", VOP_PAT_GEN<VOP_I32_I32_I32>, smax>;		defm V_MAX_I32 : VOP2Inst <"v_max_i32", VOP_PAT_GEN<VOP_I32_I32_I32>, smax>;
defm V_MIN_U32 : VOP2Inst <"v_min_u32", VOP_PAT_GEN<VOP_I32_I32_I32>, umin>;		defm V_MIN_U32 : VOP2Inst <"v_min_u32", VOP_PAT_GEN<VOP_I32_I32_I32>, umin>;
defm V_MAX_U32 : VOP2Inst <"v_max_u32", VOP_PAT_GEN<VOP_I32_I32_I32>, umax>;		defm V_MAX_U32 : VOP2Inst <"v_max_u32", VOP_PAT_GEN<VOP_I32_I32_I32>, umax>;
defm V_LSHRREV_B32 : VOP2Inst <"v_lshrrev_b32", VOP_I32_I32_I32, lshr_rev, "v_lshr_b32">;		defm V_LSHRREV_B32 : VOP2Inst <"v_lshrrev_b32", VOP_I32_I32_I32, lshr_rev, "v_lshr_b32">;
defm V_ASHRREV_I32 : VOP2Inst <"v_ashrrev_i32", VOP_I32_I32_I32, ashr_rev, "v_ashr_i32">;		defm V_ASHRREV_I32 : VOP2Inst <"v_ashrrev_i32", VOP_I32_I32_I32, ashr_rev, "v_ashr_i32">;
defm V_LSHLREV_B32 : VOP2Inst <"v_lshlrev_b32", VOP_I32_I32_I32, lshl_rev, "v_lshl_b32">;		defm V_LSHLREV_B32 : VOP2Inst <"v_lshlrev_b32", VOP_I32_I32_I32, lshl_rev, "v_lshl_b32">;
defm V_AND_B32 : VOP2Inst <"v_and_b32", VOP_PAT_GEN<VOP_I32_I32_I32>, and>;		defm V_AND_B32 : VOP2Inst <"v_and_b32", VOP_PAT_GEN<VOP_I32_I32_I32>, and>;
defm V_OR_B32 : VOP2Inst <"v_or_b32", VOP_PAT_GEN<VOP_I32_I32_I32>, or>;		defm V_OR_B32 : VOP2Inst <"v_or_b32", VOP_PAT_GEN<VOP_I32_I32_I32>, or>;
defm V_XOR_B32 : VOP2Inst <"v_xor_b32", VOP_PAT_GEN<VOP_I32_I32_I32>, xor>;		defm V_XOR_B32 : VOP2Inst <"v_xor_b32", VOP_PAT_GEN<VOP_I32_I32_I32>, xor>;
		} // End isReMaterializable = 1

let mayRaiseFPException = 0 in {		let mayRaiseFPException = 0 in {
let OtherPredicates = [HasMadMacF32Insts] in {		let OtherPredicates = [HasMadMacF32Insts] in {
let Constraints = "$vdst = $src2", DisableEncoding="$src2",		let Constraints = "$vdst = $src2", DisableEncoding="$src2",
isConvertibleToThreeAddress = 1 in {		isConvertibleToThreeAddress = 1 in {
defm V_MAC_F32 : VOP2Inst <"v_mac_f32", VOP_MAC_F32>;		defm V_MAC_F32 : VOP2Inst <"v_mac_f32", VOP_MAC_F32>;

let SubtargetPredicate = isGFX6GFX7GFX10 in		let SubtargetPredicate = isGFX6GFX7GFX10 in
defm V_MAC_LEGACY_F32 : VOP2Inst <"v_mac_legacy_f32", VOP_MAC_LEGACY_F32>;		defm V_MAC_LEGACY_F32 : VOP2Inst <"v_mac_legacy_f32", VOP_MAC_LEGACY_F32>;
} // End Constraints = "$vdst = $src2", DisableEncoding="$src2",		} // End Constraints = "$vdst = $src2", DisableEncoding="$src2",
// isConvertibleToThreeAddress = 1		// isConvertibleToThreeAddress = 1

		let isReMaterializable = 1 in
def V_MADAK_F32 : VOP2_Pseudo <"v_madak_f32", VOP_MADAK_F32, []>;		def V_MADAK_F32 : VOP2_Pseudo <"v_madak_f32", VOP_MADAK_F32, []>;
} // End OtherPredicates = [HasMadMacF32Insts]		} // End OtherPredicates = [HasMadMacF32Insts]
} // End mayRaiseFPException = 0		} // End mayRaiseFPException = 0

// No patterns so that the scalar instructions are always selected.		// No patterns so that the scalar instructions are always selected.
// The scalar versions will be replaced with vector when needed later.		// The scalar versions will be replaced with vector when needed later.
defm V_ADD_CO_U32 : VOP2bInst <"v_add_co_u32", VOP2b_I32_I1_I32_I32, null_frag, "v_add_co_u32", 1>;		defm V_ADD_CO_U32 : VOP2bInst <"v_add_co_u32", VOP2b_I32_I1_I32_I32, null_frag, "v_add_co_u32", 1>;
defm V_SUB_CO_U32 : VOP2bInst <"v_sub_co_u32", VOP2b_I32_I1_I32_I32, null_frag, "v_sub_co_u32", 1>;		defm V_SUB_CO_U32 : VOP2bInst <"v_sub_co_u32", VOP2b_I32_I1_I32_I32, null_frag, "v_sub_co_u32", 1>;
defm V_SUBREV_CO_U32 : VOP2bInst <"v_subrev_co_u32", VOP2b_I32_I1_I32_I32, null_frag, "v_sub_co_u32", 1>;		defm V_SUBREV_CO_U32 : VOP2bInst <"v_subrev_co_u32", VOP2b_I32_I1_I32_I32, null_frag, "v_sub_co_u32", 1>;
defm V_ADDC_U32 : VOP2bInst <"v_addc_u32", VOP2b_I32_I1_I32_I32_I1, null_frag, "v_addc_u32", 1>;		defm V_ADDC_U32 : VOP2bInst <"v_addc_u32", VOP2b_I32_I1_I32_I32_I1, null_frag, "v_addc_u32", 1>;
defm V_SUBB_U32 : VOP2bInst <"v_subb_u32", VOP2b_I32_I1_I32_I32_I1, null_frag, "v_subb_u32", 1>;		defm V_SUBB_U32 : VOP2bInst <"v_subb_u32", VOP2b_I32_I1_I32_I32_I1, null_frag, "v_subb_u32", 1>;
defm V_SUBBREV_U32 : VOP2bInst <"v_subbrev_u32", VOP2b_I32_I1_I32_I32_I1, null_frag, "v_subb_u32", 1>;		defm V_SUBBREV_U32 : VOP2bInst <"v_subbrev_u32", VOP2b_I32_I1_I32_I32_I1, null_frag, "v_subb_u32", 1>;


let SubtargetPredicate = HasAddNoCarryInsts in {		let SubtargetPredicate = HasAddNoCarryInsts, isReMaterializable = 1 in {
defm V_ADD_U32 : VOP2Inst <"v_add_u32", VOP_I32_I32_I32_ARITH, null_frag, "v_add_u32", 1>;		defm V_ADD_U32 : VOP2Inst <"v_add_u32", VOP_I32_I32_I32_ARITH, null_frag, "v_add_u32", 1>;
defm V_SUB_U32 : VOP2Inst <"v_sub_u32", VOP_I32_I32_I32_ARITH, null_frag, "v_sub_u32", 1>;		defm V_SUB_U32 : VOP2Inst <"v_sub_u32", VOP_I32_I32_I32_ARITH, null_frag, "v_sub_u32", 1>;
defm V_SUBREV_U32 : VOP2Inst <"v_subrev_u32", VOP_I32_I32_I32_ARITH, null_frag, "v_sub_u32", 1>;		defm V_SUBREV_U32 : VOP2Inst <"v_subrev_u32", VOP_I32_I32_I32_ARITH, null_frag, "v_sub_u32", 1>;
}		}

} // End isCommutable = 1		} // End isCommutable = 1

// These are special and do not read the exec mask.		// These are special and do not read the exec mask.
let isConvergent = 1, Uses = []<Register> in {		let isConvergent = 1, Uses = []<Register> in {
def V_READLANE_B32 : VOP2_Pseudo<"v_readlane_b32", VOP_READLANE,		def V_READLANE_B32 : VOP2_Pseudo<"v_readlane_b32", VOP_READLANE,
[(set i32:$vdst, (int_amdgcn_readlane i32:$src0, i32:$src1))]>;		[(set i32:$vdst, (int_amdgcn_readlane i32:$src0, i32:$src1))]>;

let Constraints = "$vdst = $vdst_in", DisableEncoding="$vdst_in" in {		let Constraints = "$vdst = $vdst_in", DisableEncoding="$vdst_in" in {
def V_WRITELANE_B32 : VOP2_Pseudo<"v_writelane_b32", VOP_WRITELANE,		def V_WRITELANE_B32 : VOP2_Pseudo<"v_writelane_b32", VOP_WRITELANE,
[(set i32:$vdst, (int_amdgcn_writelane i32:$src0, i32:$src1, i32:$vdst_in))]>;		[(set i32:$vdst, (int_amdgcn_writelane i32:$src0, i32:$src1, i32:$vdst_in))]>;
} // End $vdst = $vdst_in, DisableEncoding $vdst_in		} // End $vdst = $vdst_in, DisableEncoding $vdst_in
} // End isConvergent = 1		} // End isConvergent = 1

		let isReMaterializable = 1 in {
defm V_BFM_B32 : VOP2Inst <"v_bfm_b32", VOP_NO_EXT<VOP_I32_I32_I32>>;		defm V_BFM_B32 : VOP2Inst <"v_bfm_b32", VOP_NO_EXT<VOP_I32_I32_I32>>;
defm V_BCNT_U32_B32 : VOP2Inst <"v_bcnt_u32_b32", VOP_NO_EXT<VOP_I32_I32_I32>, add_ctpop>;		defm V_BCNT_U32_B32 : VOP2Inst <"v_bcnt_u32_b32", VOP_NO_EXT<VOP_I32_I32_I32>, add_ctpop>;
defm V_MBCNT_LO_U32_B32 : VOP2Inst <"v_mbcnt_lo_u32_b32", VOP_NO_EXT<VOP_I32_I32_I32>, int_amdgcn_mbcnt_lo>;		defm V_MBCNT_LO_U32_B32 : VOP2Inst <"v_mbcnt_lo_u32_b32", VOP_NO_EXT<VOP_I32_I32_I32>, int_amdgcn_mbcnt_lo>;
defm V_MBCNT_HI_U32_B32 : VOP2Inst <"v_mbcnt_hi_u32_b32", VOP_NO_EXT<VOP_I32_I32_I32>, int_amdgcn_mbcnt_hi>;		defm V_MBCNT_HI_U32_B32 : VOP2Inst <"v_mbcnt_hi_u32_b32", VOP_NO_EXT<VOP_I32_I32_I32>, int_amdgcn_mbcnt_hi>;
defm V_LDEXP_F32 : VOP2Inst <"v_ldexp_f32", VOP_NO_EXT<VOP_F32_F32_I32>, AMDGPUldexp>;		defm V_LDEXP_F32 : VOP2Inst <"v_ldexp_f32", VOP_NO_EXT<VOP_F32_F32_I32>, AMDGPUldexp>;
defm V_CVT_PKACCUM_U8_F32 : VOP2Inst <"v_cvt_pkaccum_u8_f32", VOP_NO_EXT<VOP_I32_F32_I32>>; // TODO: set "Uses = dst"

let ReadsModeReg = 0, mayRaiseFPException = 0 in {		let ReadsModeReg = 0, mayRaiseFPException = 0 in {
defm V_CVT_PKNORM_I16_F32 : VOP2Inst <"v_cvt_pknorm_i16_f32", VOP_NO_EXT<VOP_V2I16_F32_F32>, AMDGPUpknorm_i16_f32>;		defm V_CVT_PKNORM_I16_F32 : VOP2Inst <"v_cvt_pknorm_i16_f32", VOP_NO_EXT<VOP_V2I16_F32_F32>, AMDGPUpknorm_i16_f32>;
defm V_CVT_PKNORM_U16_F32 : VOP2Inst <"v_cvt_pknorm_u16_f32", VOP_NO_EXT<VOP_V2I16_F32_F32>, AMDGPUpknorm_u16_f32>;		defm V_CVT_PKNORM_U16_F32 : VOP2Inst <"v_cvt_pknorm_u16_f32", VOP_NO_EXT<VOP_V2I16_F32_F32>, AMDGPUpknorm_u16_f32>;
}		}

defm V_CVT_PKRTZ_F16_F32 : VOP2Inst <"v_cvt_pkrtz_f16_f32", VOP_NO_EXT<VOP_V2F16_F32_F32>, AMDGPUpkrtz_f16_f32>;		defm V_CVT_PKRTZ_F16_F32 : VOP2Inst <"v_cvt_pkrtz_f16_f32", VOP_NO_EXT<VOP_V2F16_F32_F32>, AMDGPUpkrtz_f16_f32>;
defm V_CVT_PK_U16_U32 : VOP2Inst <"v_cvt_pk_u16_u32", VOP_NO_EXT<VOP_V2I16_I32_I32>, AMDGPUpk_u16_u32>;		defm V_CVT_PK_U16_U32 : VOP2Inst <"v_cvt_pk_u16_u32", VOP_NO_EXT<VOP_V2I16_I32_I32>, AMDGPUpk_u16_u32>;
defm V_CVT_PK_I16_I32 : VOP2Inst <"v_cvt_pk_i16_i32", VOP_NO_EXT<VOP_V2I16_I32_I32>, AMDGPUpk_i16_i32>;		defm V_CVT_PK_I16_I32 : VOP2Inst <"v_cvt_pk_i16_i32", VOP_NO_EXT<VOP_V2I16_I32_I32>, AMDGPUpk_i16_i32>;


let SubtargetPredicate = isGFX6GFX7 in {		let SubtargetPredicate = isGFX6GFX7 in {
defm V_MIN_LEGACY_F32 : VOP2Inst <"v_min_legacy_f32", VOP_F32_F32_F32, AMDGPUfmin_legacy>;		defm V_MIN_LEGACY_F32 : VOP2Inst <"v_min_legacy_f32", VOP_F32_F32_F32, AMDGPUfmin_legacy>;
defm V_MAX_LEGACY_F32 : VOP2Inst <"v_max_legacy_f32", VOP_F32_F32_F32, AMDGPUfmax_legacy>;		defm V_MAX_LEGACY_F32 : VOP2Inst <"v_max_legacy_f32", VOP_F32_F32_F32, AMDGPUfmax_legacy>;
} // End SubtargetPredicate = isGFX6GFX7		} // End SubtargetPredicate = isGFX6GFX7

let isCommutable = 1 in {		let isCommutable = 1 in {
let SubtargetPredicate = isGFX6GFX7 in {		let SubtargetPredicate = isGFX6GFX7 in {
defm V_LSHR_B32 : VOP2Inst <"v_lshr_b32", VOP_PAT_GEN<VOP_I32_I32_I32>, srl>;		defm V_LSHR_B32 : VOP2Inst <"v_lshr_b32", VOP_PAT_GEN<VOP_I32_I32_I32>, srl>;
defm V_ASHR_I32 : VOP2Inst <"v_ashr_i32", VOP_PAT_GEN<VOP_I32_I32_I32>, sra>;		defm V_ASHR_I32 : VOP2Inst <"v_ashr_i32", VOP_PAT_GEN<VOP_I32_I32_I32>, sra>;
defm V_LSHL_B32 : VOP2Inst <"v_lshl_b32", VOP_PAT_GEN<VOP_I32_I32_I32>, shl>;		defm V_LSHL_B32 : VOP2Inst <"v_lshl_b32", VOP_PAT_GEN<VOP_I32_I32_I32>, shl>;
} // End SubtargetPredicate = isGFX6GFX7		} // End SubtargetPredicate = isGFX6GFX7
} // End isCommutable = 1		} // End isCommutable = 1
		} // End isReMaterializable = 1

		defm V_CVT_PKACCUM_U8_F32 : VOP2Inst <"v_cvt_pkaccum_u8_f32", VOP_NO_EXT<VOP_I32_F32_I32>>; // TODO: set "Uses = dst"

class DivergentBinOp<SDPatternOperator Op, VOP_Pseudo Inst> :		class DivergentBinOp<SDPatternOperator Op, VOP_Pseudo Inst> :
GCNPat<		GCNPat<
(getDivergentFrag<Op>.ret Inst.Pfl.Src0VT:$src0, Inst.Pfl.Src1VT:$src1),		(getDivergentFrag<Op>.ret Inst.Pfl.Src0VT:$src0, Inst.Pfl.Src1VT:$src1),
!if(!cast<Commutable_REV>(Inst).IsOrig,		!if(!cast<Commutable_REV>(Inst).IsOrig,
(Inst $src0, $src1),		(Inst $src0, $src1),
(Inst $src1, $src0)		(Inst $src1, $src0)
)		)
▲ Show 20 Lines • Show All 42 Lines • ▼ Show 20 Lines

def : divergent_i64_BinOp <and, V_AND_B32_e32>;		def : divergent_i64_BinOp <and, V_AND_B32_e32>;
def : divergent_i64_BinOp <or, V_OR_B32_e32>;		def : divergent_i64_BinOp <or, V_OR_B32_e32>;
def : divergent_i64_BinOp <xor, V_XOR_B32_e32>;		def : divergent_i64_BinOp <xor, V_XOR_B32_e32>;

let SubtargetPredicate = Has16BitInsts in {		let SubtargetPredicate = Has16BitInsts in {

let FPDPRounding = 1 in {		let FPDPRounding = 1 in {
def V_MADMK_F16 : VOP2_Pseudo <"v_madmk_f16", VOP_MADMK_F16, [], "">;		def V_MADMK_F16 : VOP2_Pseudo <"v_madmk_f16", VOP_MADMK_F16, [], "">;
		arsenm: This preserves high bits on gfx9.
		rampitec (author): GFX9 manual: VOP1/VOP2 will write zero to unused bits unless SDWA specifies otherwise, and VOP1/VOP2 ops encoded as VOP3 will write zero. So I assume it does not.
defm V_LDEXP_F16 : VOP2Inst <"v_ldexp_f16", VOP_F16_F16_I32, AMDGPUldexp>;		defm V_LDEXP_F16 : VOP2Inst <"v_ldexp_f16", VOP_F16_F16_I32, AMDGPUldexp>;
		arsenm: This one does not (but does on gfx10).
		rampitec (author): Thanks for catching!
} // End FPDPRounding = 1		} // End FPDPRounding = 1

defm V_LSHLREV_B16 : VOP2Inst <"v_lshlrev_b16", VOP_I16_I16_I16, lshl_rev>;		defm V_LSHLREV_B16 : VOP2Inst <"v_lshlrev_b16", VOP_I16_I16_I16, lshl_rev>;
defm V_LSHRREV_B16 : VOP2Inst <"v_lshrrev_b16", VOP_I16_I16_I16, lshr_rev>;		defm V_LSHRREV_B16 : VOP2Inst <"v_lshrrev_b16", VOP_I16_I16_I16, lshr_rev>;
defm V_ASHRREV_I16 : VOP2Inst <"v_ashrrev_i16", VOP_I16_I16_I16, ashr_rev>;		defm V_ASHRREV_I16 : VOP2Inst <"v_ashrrev_i16", VOP_I16_I16_I16, ashr_rev>;

let isCommutable = 1 in {		let isCommutable = 1 in {
let FPDPRounding = 1 in {		let FPDPRounding = 1 in {
Show All 23 Lines
defm V_MAC_F16 : VOP2Inst <"v_mac_f16", VOP_MAC_F16>;		defm V_MAC_F16 : VOP2Inst <"v_mac_f16", VOP_MAC_F16>;
}		}
} // End isCommutable = 1		} // End isCommutable = 1

} // End SubtargetPredicate = Has16BitInsts		} // End SubtargetPredicate = Has16BitInsts

let SubtargetPredicate = HasDLInsts in {		let SubtargetPredicate = HasDLInsts in {

		let isReMaterializable = 1 in
defm V_XNOR_B32 : VOP2Inst <"v_xnor_b32", VOP_I32_I32_I32, xnor>;		defm V_XNOR_B32 : VOP2Inst <"v_xnor_b32", VOP_I32_I32_I32, xnor>;

let Constraints = "$vdst = $src2",		let Constraints = "$vdst = $src2",
DisableEncoding = "$src2",		DisableEncoding = "$src2",
isConvertibleToThreeAddress = 1,		isConvertibleToThreeAddress = 1,
isCommutable = 1 in		isCommutable = 1 in
defm V_FMAC_F32 : VOP2Inst <"v_fmac_f32", VOP_MAC_F32>;		defm V_FMAC_F32 : VOP2Inst <"v_fmac_f32", VOP_MAC_F32>;

▲ Show 20 Lines • Show All 55 Lines • ▼ Show 20 Lines	let AddedComplexity = 30 in {
def : GCNPat<		def : GCNPat<
(i32 (int_amdgcn_sdot8 i32:$src0, i32:$src1, i32:$src2, (i1 DSTCLAMP.NONE))),		(i32 (int_amdgcn_sdot8 i32:$src0, i32:$src1, i32:$src2, (i1 DSTCLAMP.NONE))),
(i32 (V_DOT8C_I32_I4_e32 $src0, $src1, $src2))		(i32 (V_DOT8C_I32_I4_e32 $src0, $src1, $src2))
> {		> {
let SubtargetPredicate = HasDot3Insts;		let SubtargetPredicate = HasDot3Insts;
}		}
} // End AddedComplexity = 30		} // End AddedComplexity = 30

let SubtargetPredicate = HasFmaakFmamkF32Insts in {		let SubtargetPredicate = HasFmaakFmamkF32Insts, isReMaterializable = 1 in {
def V_FMAMK_F32 : VOP2_Pseudo<"v_fmamk_f32", VOP_MADMK_F32, [], "">;		def V_FMAMK_F32 : VOP2_Pseudo<"v_fmamk_f32", VOP_MADMK_F32, [], "">;
		arsenm: This and the other fma flavors preserve the high bits on gfx9.
		rampitec (author): This is f32; both f16 fma shall also zero hi bits because these are VOP2 only.
		arsenm: I wrote inline asm tests a few weeks ago for all of these. The gfx9 manual says it didn't change the existing instruction behavior, but I think this was wrong. mad/mac/fma all seem to preserve (see GCNSubtarget::zeroesHigh16BitsOfDest).
		rampitec (author): Sigh. There are some VOP1 in that list too. I probably need to avoid any 16 bit dst completely.

let isCommutable = 1 in		let isCommutable = 1 in
def V_FMAAK_F32 : VOP2_Pseudo<"v_fmaak_f32", VOP_MADAK_F32, [], "">;		def V_FMAAK_F32 : VOP2_Pseudo<"v_fmaak_f32", VOP_MADAK_F32, [], "">;
}		}

let SubtargetPredicate = isGFX10Plus in {		let SubtargetPredicate = isGFX10Plus in {

let FPDPRounding = 1 in {		let FPDPRounding = 1 in {
def V_FMAMK_F16 : VOP2_Pseudo <"v_fmamk_f16", VOP_MADMK_F16, [], "">;		def V_FMAMK_F16 : VOP2_Pseudo <"v_fmamk_f16", VOP_MADMK_F16, [], "">;

let isCommutable = 1 in		let isCommutable = 1 in
def V_FMAAK_F16 : VOP2_Pseudo <"v_fmaak_f16", VOP_MADAK_F16, [], "">;		def V_FMAAK_F16 : VOP2_Pseudo <"v_fmaak_f16", VOP_MADAK_F16, [], "">;
} // End FPDPRounding = 1		} // End FPDPRounding = 1
		foad: Update comment?

let Constraints = "$vdst = $src2",		let Constraints = "$vdst = $src2",
DisableEncoding="$src2",		DisableEncoding="$src2",
isConvertibleToThreeAddress = 1,		isConvertibleToThreeAddress = 1,
isCommutable = 1 in {		isCommutable = 1 in {
defm V_FMAC_F16 : VOP2Inst <"v_fmac_f16", VOP_MAC_F16>;		defm V_FMAC_F16 : VOP2Inst <"v_fmac_f16", VOP_MAC_F16>;
}		}

▲ Show 20 Lines • Show All 963 Lines • Show Last 20 Lines

llvm/test/CodeGen/AMDGPU/remat-vop.mir

Show First 20 Lines • Show All 1,358 Lines • ▼ Show 20 Lines	bb.0:
%0:agpr_32 = V_ACCVGPR_MOV_B32 undef $agpr0, implicit $exec		%0:agpr_32 = V_ACCVGPR_MOV_B32 undef $agpr0, implicit $exec
%1:agpr_32 = V_ACCVGPR_MOV_B32 undef $agpr0, implicit $exec		%1:agpr_32 = V_ACCVGPR_MOV_B32 undef $agpr0, implicit $exec
%2:agpr_32 = V_ACCVGPR_MOV_B32 undef $agpr0, implicit $exec		%2:agpr_32 = V_ACCVGPR_MOV_B32 undef $agpr0, implicit $exec
S_NOP 0, implicit %0		S_NOP 0, implicit %0
S_NOP 0, implicit %1		S_NOP 0, implicit %1
S_NOP 0, implicit %2		S_NOP 0, implicit %2
S_ENDPGM 0		S_ENDPGM 0
...		...
		---
		name: test_no_remat_v_cndmask_b32_e32
		tracksRegLiveness: true
		machineFunctionInfo:
		stackPtrOffsetReg: $sgpr32
		body: \|
		bb.0:
		; GCN-LABEL: name: test_no_remat_v_cndmask_b32_e32
		; GCN: renamable $vgpr0 = V_CNDMASK_B32_e32 1, undef $vgpr0, implicit $exec, implicit undef $vcc
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.1, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.1, addrspace 5)
		; GCN: renamable $vgpr1 = V_CNDMASK_B32_e32 1, undef $vgpr0, implicit $exec, implicit undef $vcc
		; GCN: renamable $vgpr0 = V_CNDMASK_B32_e32 1, undef $vgpr0, implicit $exec, implicit undef $vcc
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.0, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.0, addrspace 5)
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.1, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.1, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.0, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.0, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_CNDMASK_B32_e32 1, undef %0:vgpr_32, implicit $exec, implicit undef $vcc
		%2:vgpr_32 = V_CNDMASK_B32_e32 1, undef %0:vgpr_32, implicit $exec, implicit undef $vcc
		%3:vgpr_32 = V_CNDMASK_B32_e32 1, undef %0:vgpr_32, implicit $exec, implicit undef $vcc
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		name: test_no_remat_v_cndmask_b32_sdwa
		tracksRegLiveness: true
		machineFunctionInfo:
		stackPtrOffsetReg: $sgpr32
		body: \|
		bb.0:
		; GCN-LABEL: name: test_no_remat_v_cndmask_b32_sdwa
		; GCN: renamable $vgpr0 = V_CNDMASK_B32_sdwa 0, undef $vgpr0, 0, undef $vgpr0, 0, 0, 0, 0, 0, implicit $exec, implicit undef $vcc
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.1, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.1, addrspace 5)
		; GCN: renamable $vgpr1 = V_CNDMASK_B32_sdwa 0, undef $vgpr0, 0, undef $vgpr0, 0, 0, 0, 0, 0, implicit $exec, implicit undef $vcc
		; GCN: renamable $vgpr0 = V_CNDMASK_B32_sdwa 0, undef $vgpr0, 0, undef $vgpr0, 0, 0, 0, 0, 0, implicit $exec, implicit undef $vcc
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.0, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.0, addrspace 5)
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.1, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.1, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.0, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.0, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_CNDMASK_B32_sdwa 0, undef %0:vgpr_32, 0, undef %0:vgpr_32, 0, 0, 0, 0, 0, implicit $exec, implicit undef $vcc
		%2:vgpr_32 = V_CNDMASK_B32_sdwa 0, undef %0:vgpr_32, 0, undef %0:vgpr_32, 0, 0, 0, 0, 0, implicit $exec, implicit undef $vcc
		%3:vgpr_32 = V_CNDMASK_B32_sdwa 0, undef %0:vgpr_32, 0, undef %0:vgpr_32, 0, 0, 0, 0, 0, implicit $exec, implicit undef $vcc
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		name: test_no_remat_v_cndmask_b32_dpp
		tracksRegLiveness: true
		machineFunctionInfo:
		stackPtrOffsetReg: $sgpr32
		body: \|
		bb.0:
		; GCN-LABEL: name: test_no_remat_v_cndmask_b32_dpp
		; GCN: renamable $vgpr0 = V_CNDMASK_B32_dpp undef $vgpr0, 0, undef $vgpr0, 0, undef $vgpr0, 1, 15, 15, 10, implicit $exec, implicit undef $vcc
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.1, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.1, addrspace 5)
		; GCN: renamable $vgpr1 = V_CNDMASK_B32_dpp undef $vgpr1, 0, undef $vgpr0, 0, undef $vgpr0, 1, 15, 15, 10, implicit $exec, implicit undef $vcc
		; GCN: renamable $vgpr0 = V_CNDMASK_B32_dpp undef $vgpr0, 0, undef $vgpr0, 0, undef $vgpr0, 1, 15, 15, 10, implicit $exec, implicit undef $vcc
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.0, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.0, addrspace 5)
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.1, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.1, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.0, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.0, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_CNDMASK_B32_dpp undef %1:vgpr_32, 0, undef %0:vgpr_32, 0, undef %0:vgpr_32, 1, 15, 15, 10, implicit $exec, implicit undef $vcc
		%2:vgpr_32 = V_CNDMASK_B32_dpp undef %2:vgpr_32, 0, undef %0:vgpr_32, 0, undef %0:vgpr_32, 1, 15, 15, 10, implicit $exec, implicit undef $vcc
		%3:vgpr_32 = V_CNDMASK_B32_dpp undef %3:vgpr_32, 0, undef %0:vgpr_32, 0, undef %0:vgpr_32, 1, 15, 15, 10, implicit $exec, implicit undef $vcc
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		name: test_remat_v_cndmask_b32_e64
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cndmask_b32_e64
		; GCN: renamable $vgpr0 = V_CNDMASK_B32_e64 0, 1, 0, 2, undef $sgpr0_sgpr1, implicit $exec
		; GCN: renamable $vgpr1 = V_CNDMASK_B32_e64 0, 1, 0, 2, undef $sgpr0_sgpr1, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CNDMASK_B32_e64 0, 1, 0, 2, undef $sgpr0_sgpr1, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_CNDMASK_B32_e64 0, 1, 0, 2, undef %0:sreg_64_xexec, implicit $exec
		%2:vgpr_32 = V_CNDMASK_B32_e64 0, 1, 0, 2, undef %0:sreg_64_xexec, implicit $exec
		%3:vgpr_32 = V_CNDMASK_B32_e64 0, 1, 0, 2, undef %0:sreg_64_xexec, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		name: test_remat_v_madmk_f32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_madmk_f32
		; GCN: renamable $vgpr0 = nofpexcept V_MADMK_F32 1, 1, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_MADMK_F32 2, 2, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_MADMK_F32 3, 3, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_MADMK_F32 1, 1, undef %0:vgpr_32, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_MADMK_F32 2, 2, undef %0:vgpr_32, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_MADMK_F32 3, 3, undef %0:vgpr_32, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		name: test_remat_v_add_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_add_f32_e32
		; GCN: renamable $vgpr0 = nofpexcept V_ADD_F32_e32 1, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_ADD_F32_e32 2, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_ADD_F32_e32 3, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_ADD_F32_e32 1, undef %0:vgpr_32, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_ADD_F32_e32 2, undef %0:vgpr_32, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_ADD_F32_e32 3, undef %0:vgpr_32, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		name: test_remat_v_add_f32_e64
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_add_f32_e64
		; GCN: renamable $vgpr0 = nofpexcept V_ADD_F32_e64 0, 1, 0, undef $vgpr0, 0, 0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_ADD_F32_e64 0, 2, 0, undef $vgpr0, 0, 0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_ADD_F32_e64 0, 3, 0, undef $vgpr0, 0, 0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_ADD_F32_e64 0, 1, 0, undef %0:vgpr_32, 0, 0, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_ADD_F32_e64 0, 2, 0, undef %0:vgpr_32, 0, 0, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_ADD_F32_e64 0, 3, 0, undef %0:vgpr_32, 0, 0, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_ADD_F32_sdwa: three defs with identical operand lists (both sources are undef %0),
		# each read by a single S_NOP. The GCN lines expect the third def to be emitted after
		# the first two S_NOPs, reusing $vgpr0.
		# NOTE(review): the RUN line that sets the register budget is outside this view.
		---
		name: test_remat_v_add_f32_sdwa
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_add_f32_sdwa
		; GCN: renamable $vgpr0 = nofpexcept V_ADD_F32_sdwa 0, undef $vgpr0, 0, undef $vgpr0, 0, 0, 0, 0, 0, 0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_ADD_F32_sdwa 0, undef $vgpr0, 0, undef $vgpr0, 0, 0, 0, 0, 0, 0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_ADD_F32_sdwa 0, undef $vgpr0, 0, undef $vgpr0, 0, 0, 0, 0, 0, 0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_ADD_F32_sdwa 0, undef %0:vgpr_32, 0, undef %0:vgpr_32, 0, 0, 0, 0, 0, 0, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_ADD_F32_sdwa 0, undef %0:vgpr_32, 0, undef %0:vgpr_32, 0, 0, 0, 0, 0, 0, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_ADD_F32_sdwa 0, undef %0:vgpr_32, 0, undef %0:vgpr_32, 0, 0, 0, 0, 0, 0, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# Negative case for V_ADD_F32_dpp: each def's first source is an undef use of the very
		# register it defines (%1/%2/%3). Unlike the neighbouring tests, the GCN lines expect
		# SI_SPILL_V32_SAVE / SI_SPILL_V32_RESTORE through %stack.0 and %stack.1 rather than a
		# re-emitted V_ADD_F32_dpp before the later S_NOPs.
		# stackPtrOffsetReg is set to $sgpr32, which the expected spill pseudos take as an operand.
		# NOTE(review): the RUN line that sets the register budget is outside this view.
		---
		name: test_no_remat_v_add_f32_dpp
		tracksRegLiveness: true
		machineFunctionInfo:
		stackPtrOffsetReg: $sgpr32
		body: \|
		bb.0:
		; GCN-LABEL: name: test_no_remat_v_add_f32_dpp
		; GCN: renamable $vgpr0 = nofpexcept V_ADD_F32_dpp undef $vgpr0, 0, undef $vgpr0, 0, undef $vgpr0, 1, 15, 15, 10, implicit $exec, implicit $mode
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.1, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.1, addrspace 5)
		; GCN: renamable $vgpr1 = nofpexcept V_ADD_F32_dpp undef $vgpr1, 0, undef $vgpr0, 0, undef $vgpr0, 1, 15, 15, 10, implicit $exec, implicit $mode
		; GCN: renamable $vgpr0 = nofpexcept V_ADD_F32_dpp undef $vgpr0, 0, undef $vgpr0, 0, undef $vgpr0, 1, 15, 15, 10, implicit $exec, implicit $mode
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.0, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.0, addrspace 5)
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.1, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.1, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.0, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.0, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_ADD_F32_dpp undef %1:vgpr_32, 0, undef %0:vgpr_32, 0, undef %0:vgpr_32, 1, 15, 15, 10, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_ADD_F32_dpp undef %2:vgpr_32, 0, undef %0:vgpr_32, 0, undef %0:vgpr_32, 1, 15, 15, 10, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_ADD_F32_dpp undef %3:vgpr_32, 0, undef %0:vgpr_32, 0, undef %0:vgpr_32, 1, 15, 15, 10, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_SUB_F32_e32 (nofpexcept, implicit $exec and $mode reads): three defs that differ only
		# in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_sub_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_sub_f32_e32
		; GCN: renamable $vgpr0 = nofpexcept V_SUB_F32_e32 1, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_SUB_F32_e32 2, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_SUB_F32_e32 3, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_SUB_F32_e32 1, undef %0:vgpr_32, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_SUB_F32_e32 2, undef %0:vgpr_32, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_SUB_F32_e32 3, undef %0:vgpr_32, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_SUBREV_F32_e32 (nofpexcept, implicit $exec and $mode reads): three defs that differ
		# only in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN
		# lines expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_subrev_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_subrev_f32_e32
		; GCN: renamable $vgpr0 = nofpexcept V_SUBREV_F32_e32 1, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_SUBREV_F32_e32 2, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_SUBREV_F32_e32 3, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_SUBREV_F32_e32 1, undef %0:vgpr_32, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_SUBREV_F32_e32 2, undef %0:vgpr_32, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_SUBREV_F32_e32 3, undef %0:vgpr_32, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_MUL_LEGACY_F32_e32 (nofpexcept, implicit $exec and $mode reads): three defs that
		# differ only in the immediate first source (1, 2, 3), each read by a single S_NOP. The
		# GCN lines expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_mul_legacy_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_mul_legacy_f32_e32
		; GCN: renamable $vgpr0 = nofpexcept V_MUL_LEGACY_F32_e32 1, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_MUL_LEGACY_F32_e32 2, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_MUL_LEGACY_F32_e32 3, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_MUL_LEGACY_F32_e32 1, undef %0:vgpr_32, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_MUL_LEGACY_F32_e32 2, undef %0:vgpr_32, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_MUL_LEGACY_F32_e32 3, undef %0:vgpr_32, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_MUL_F32_e32 (nofpexcept, implicit $exec and $mode reads): three defs that differ only
		# in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_mul_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_mul_f32_e32
		; GCN: renamable $vgpr0 = nofpexcept V_MUL_F32_e32 1, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_MUL_F32_e32 2, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_MUL_F32_e32 3, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_MUL_F32_e32 1, undef %0:vgpr_32, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_MUL_F32_e32 2, undef %0:vgpr_32, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_MUL_F32_e32 3, undef %0:vgpr_32, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_MUL_I32_I24_e32 (only an implicit $exec read is listed): three defs that differ only
		# in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_mul_i32_i24_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_mul_i32_i24_e32
		; GCN: renamable $vgpr0 = V_MUL_I32_I24_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_MUL_I32_I24_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_MUL_I32_I24_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_MUL_I32_I24_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_MUL_I32_I24_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_MUL_I32_I24_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_MUL_HI_I32_I24_e32 (only an implicit $exec read is listed): three defs that differ
		# only in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN
		# lines expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_mul_hi_i32_i24_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_mul_hi_i32_i24_e32
		; GCN: renamable $vgpr0 = V_MUL_HI_I32_I24_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_MUL_HI_I32_I24_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_MUL_HI_I32_I24_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_MUL_HI_I32_I24_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_MUL_HI_I32_I24_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_MUL_HI_I32_I24_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_MUL_U32_U24_e32 (only an implicit $exec read is listed): three defs that differ only
		# in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_mul_u32_u24_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_mul_u32_u24_e32
		; GCN: renamable $vgpr0 = V_MUL_U32_U24_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_MUL_U32_U24_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_MUL_U32_U24_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_MUL_U32_U24_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_MUL_U32_U24_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_MUL_U32_U24_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_MUL_HI_U32_U24_e32 (only an implicit $exec read is listed): three defs that differ
		# only in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN
		# lines expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_mul_hi_u32_u24_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_mul_hi_u32_u24_e32
		; GCN: renamable $vgpr0 = V_MUL_HI_U32_U24_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_MUL_HI_U32_U24_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_MUL_HI_U32_U24_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_MUL_HI_U32_U24_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_MUL_HI_U32_U24_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_MUL_HI_U32_U24_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_MIN_F32_e32 (nofpexcept, implicit $exec and $mode reads): three defs that differ only
		# in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_min_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_min_f32_e32
		; GCN: renamable $vgpr0 = nofpexcept V_MIN_F32_e32 1, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_MIN_F32_e32 2, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_MIN_F32_e32 3, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_MIN_F32_e32 1, undef %0:vgpr_32, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_MIN_F32_e32 2, undef %0:vgpr_32, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_MIN_F32_e32 3, undef %0:vgpr_32, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_MAX_F32_e32 (nofpexcept, implicit $exec and $mode reads): three defs that differ only
		# in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_max_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_max_f32_e32
		; GCN: renamable $vgpr0 = nofpexcept V_MAX_F32_e32 1, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_MAX_F32_e32 2, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_MAX_F32_e32 3, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_MAX_F32_e32 1, undef %0:vgpr_32, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_MAX_F32_e32 2, undef %0:vgpr_32, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_MAX_F32_e32 3, undef %0:vgpr_32, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_MIN_I32_e32 (only an implicit $exec read is listed): three defs that differ only in
		# the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_min_i32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_min_i32_e32
		; GCN: renamable $vgpr0 = V_MIN_I32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_MIN_I32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_MIN_I32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_MIN_I32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_MIN_I32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_MIN_I32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_MAX_I32_e32 (only an implicit $exec read is listed): three defs that differ only in
		# the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_max_i32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_max_i32_e32
		; GCN: renamable $vgpr0 = V_MAX_I32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_MAX_I32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_MAX_I32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_MAX_I32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_MAX_I32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_MAX_I32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_MIN_U32_e32 (only an implicit $exec read is listed): three defs that differ only in
		# the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_min_u32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_min_u32_e32
		; GCN: renamable $vgpr0 = V_MIN_U32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_MIN_U32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_MIN_U32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_MIN_U32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_MIN_U32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_MIN_U32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_MAX_U32_e32 (only an implicit $exec read is listed): three defs that differ only in
		# the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_max_u32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_max_u32_e32
		; GCN: renamable $vgpr0 = V_MAX_U32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_MAX_U32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_MAX_U32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_MAX_U32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_MAX_U32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_MAX_U32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_LSHRREV_B32_e32 (only an implicit $exec read is listed): three defs that differ only
		# in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_lshrrev_b32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_lshrrev_b32_e32
		; GCN: renamable $vgpr0 = V_LSHRREV_B32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_LSHRREV_B32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_LSHRREV_B32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_LSHRREV_B32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_LSHRREV_B32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_LSHRREV_B32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_LSHLREV_B32_e32 (only an implicit $exec read is listed): three defs that differ only
		# in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_lshlrev_b32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_lshlrev_b32_e32
		; GCN: renamable $vgpr0 = V_LSHLREV_B32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_LSHLREV_B32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_LSHLREV_B32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_LSHLREV_B32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_LSHLREV_B32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_LSHLREV_B32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_ASHRREV_I32_e32 (only an implicit $exec read is listed): three defs that differ only
		# in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_ashrrev_i32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_ashrrev_i32_e32
		; GCN: renamable $vgpr0 = V_ASHRREV_I32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_ASHRREV_I32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_ASHRREV_I32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_ASHRREV_I32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_ASHRREV_I32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_ASHRREV_I32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_AND_B32_e32 (only an implicit $exec read is listed): three defs that differ only in
		# the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_and_b32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_and_b32_e32
		; GCN: renamable $vgpr0 = V_AND_B32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_AND_B32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_AND_B32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_AND_B32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_AND_B32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_AND_B32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_OR_B32_e32 (only an implicit $exec read is listed): three defs that differ only in
		# the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_or_b32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_or_b32_e32
		; GCN: renamable $vgpr0 = V_OR_B32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_OR_B32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_OR_B32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_OR_B32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_OR_B32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_OR_B32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_XOR_B32_e32 (only an implicit $exec read is listed): three defs that differ only in
		# the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_xor_b32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_xor_b32_e32
		; GCN: renamable $vgpr0 = V_XOR_B32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_XOR_B32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_XOR_B32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_XOR_B32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_XOR_B32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_XOR_B32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_MADAK_F32 (nofpexcept, implicit $exec and $mode reads): three defs whose first and
		# trailing immediate operands both step through 1, 2, 3; each def is read by a single
		# S_NOP. The GCN lines expect the third def to be emitted after the first two S_NOPs,
		# reusing $vgpr0.
		---
		name: test_remat_v_madak_f32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_madak_f32
		; GCN: renamable $vgpr0 = nofpexcept V_MADAK_F32 1, undef $vgpr0, 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_MADAK_F32 2, undef $vgpr0, 2, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_MADAK_F32 3, undef $vgpr0, 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_MADAK_F32 1, undef %0:vgpr_32, 1, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_MADAK_F32 2, undef %0:vgpr_32, 2, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_MADAK_F32 3, undef %0:vgpr_32, 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_ADD_U32_e32 (only an implicit $exec read is listed): three defs that differ only in
		# the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_add_u32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_add_u32_e32
		; GCN: renamable $vgpr0 = V_ADD_U32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_ADD_U32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_ADD_U32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_ADD_U32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_ADD_U32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_ADD_U32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_SUB_U32_e32 (only an implicit $exec read is listed): three defs that differ only in
		# the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_sub_u32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_sub_u32_e32
		; GCN: renamable $vgpr0 = V_SUB_U32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_SUB_U32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_SUB_U32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_SUB_U32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_SUB_U32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_SUB_U32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_SUBREV_U32_e32 (only an implicit $exec read is listed): three defs that differ only
		# in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_subrev_u32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_subrev_u32_e32
		; GCN: renamable $vgpr0 = V_SUBREV_U32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_SUBREV_U32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_SUBREV_U32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_SUBREV_U32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_SUBREV_U32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_SUBREV_U32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_BFM_B32_e32 (only an implicit $exec read is listed): three defs that differ only in
		# the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_bfm_b32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_bfm_b32_e32
		; GCN: renamable $vgpr0 = V_BFM_B32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_BFM_B32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_BFM_B32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_BFM_B32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_BFM_B32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_BFM_B32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_BCNT_U32_B32_e32 (only an implicit $exec read is listed): three defs that differ only
		# in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN lines
		# expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_bcnt_u32_b32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_bcnt_u32_b32_e32
		; GCN: renamable $vgpr0 = V_BCNT_U32_B32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_BCNT_U32_B32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_BCNT_U32_B32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_BCNT_U32_B32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_BCNT_U32_B32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_BCNT_U32_B32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_MBCNT_LO_U32_B32_e32 (only an implicit $exec read is listed): three defs that differ
		# only in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN
		# lines expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_mbcnt_lo_u32_b32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_mbcnt_lo_u32_b32_e32
		; GCN: renamable $vgpr0 = V_MBCNT_LO_U32_B32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_MBCNT_LO_U32_B32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_MBCNT_LO_U32_B32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_MBCNT_LO_U32_B32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_MBCNT_LO_U32_B32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_MBCNT_LO_U32_B32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_MBCNT_HI_U32_B32_e32 (only an implicit $exec read is listed): three defs that differ
		# only in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN
		# lines expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_mbcnt_hi_u32_b32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_mbcnt_hi_u32_b32_e32
		; GCN: renamable $vgpr0 = V_MBCNT_HI_U32_B32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_MBCNT_HI_U32_B32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_MBCNT_HI_U32_B32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_MBCNT_HI_U32_B32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_MBCNT_HI_U32_B32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_MBCNT_HI_U32_B32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_LDEXP_F32_e32 (nofpexcept, implicit $exec and $mode reads): three defs that differ
		# only in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN
		# lines expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_ldexp_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_ldexp_f32_e32
		; GCN: renamable $vgpr0 = nofpexcept V_LDEXP_F32_e32 1, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_LDEXP_F32_e32 2, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_LDEXP_F32_e32 3, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_LDEXP_F32_e32 1, undef %0:vgpr_32, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_LDEXP_F32_e32 2, undef %0:vgpr_32, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_LDEXP_F32_e32 3, undef %0:vgpr_32, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_CVT_PKNORM_I16_F32_e32 (only an implicit $exec read is listed here, no $mode): three
		# defs that differ only in the immediate first source (1, 2, 3), each read by a single
		# S_NOP. The GCN lines expect the third def to be emitted after the first two S_NOPs,
		# reusing $vgpr0.
		---
		name: test_remat_v_cvt_pknorm_i16_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_pknorm_i16_f32_e32
		; GCN: renamable $vgpr0 = V_CVT_PKNORM_I16_F32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_CVT_PKNORM_I16_F32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_PKNORM_I16_F32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_CVT_PKNORM_I16_F32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_CVT_PKNORM_I16_F32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_CVT_PKNORM_I16_F32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_CVT_PKNORM_U16_F32_e32 (only an implicit $exec read is listed here, no $mode): three
		# defs that differ only in the immediate first source (1, 2, 3), each read by a single
		# S_NOP. The GCN lines expect the third def to be emitted after the first two S_NOPs,
		# reusing $vgpr0.
		---
		name: test_remat_v_cvt_pknorm_u16_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_pknorm_u16_f32_e32
		; GCN: renamable $vgpr0 = V_CVT_PKNORM_U16_F32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_CVT_PKNORM_U16_F32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_PKNORM_U16_F32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_CVT_PKNORM_U16_F32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_CVT_PKNORM_U16_F32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_CVT_PKNORM_U16_F32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_CVT_PKRTZ_F16_F32_e32 (nofpexcept, implicit $exec and $mode reads): three defs that
		# differ only in the immediate first source (1, 2, 3), each read by a single S_NOP. The
		# GCN lines expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_cvt_pkrtz_f16_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_pkrtz_f16_f32_e32
		; GCN: renamable $vgpr0 = nofpexcept V_CVT_PKRTZ_F16_F32_e32 1, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_CVT_PKRTZ_F16_F32_e32 2, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_CVT_PKRTZ_F16_F32_e32 3, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_CVT_PKRTZ_F16_F32_e32 1, undef %0:vgpr_32, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_CVT_PKRTZ_F16_F32_e32 2, undef %0:vgpr_32, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_CVT_PKRTZ_F16_F32_e32 3, undef %0:vgpr_32, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_CVT_PK_U16_U32_e32 (only an implicit $exec read is listed): three defs that differ
		# only in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN
		# lines expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_cvt_pk_u16_u32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_pk_u16_u32_e32
		; GCN: renamable $vgpr0 = V_CVT_PK_U16_U32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_CVT_PK_U16_U32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_PK_U16_U32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_CVT_PK_U16_U32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_CVT_PK_U16_U32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_CVT_PK_U16_U32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		# V_CVT_PK_I16_I32_e32 (only an implicit $exec read is listed): three defs that differ
		# only in the immediate first source (1, 2, 3), each read by a single S_NOP. The GCN
		# lines expect the third def to be emitted after the first two S_NOPs, reusing $vgpr0.
		---
		name: test_remat_v_cvt_pk_i16_i32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_cvt_pk_i16_i32_e32
		; GCN: renamable $vgpr0 = V_CVT_PK_I16_I32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_CVT_PK_I16_I32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_CVT_PK_I16_I32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_CVT_PK_I16_I32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_CVT_PK_I16_I32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_CVT_PK_I16_I32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		# Rematerialization test for V_MIN_LEGACY_F32_e32 (flagged nofpexcept, with
		# implicit $exec and $mode uses).
		# Input: three virtual registers defined with immediates 1, 2 and 3 (second
		# source is an undef vgpr), each then read by an S_NOP.
		# Expected (GCN checks): only $vgpr0 and $vgpr1 are used; the definition with
		# immediate 3 appears after the first two S_NOP uses and no spill is emitted.
		# NOTE(review): the RUN line is outside this view; presumably it restricts the
		# number of available VGPRs so all three values cannot be live at once - confirm.
		name: test_remat_v_min_legacy_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_min_legacy_f32_e32
		; GCN: renamable $vgpr0 = nofpexcept V_MIN_LEGACY_F32_e32 1, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_MIN_LEGACY_F32_e32 2, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_MIN_LEGACY_F32_e32 3, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_MIN_LEGACY_F32_e32 1, undef %0:vgpr_32, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_MIN_LEGACY_F32_e32 2, undef %0:vgpr_32, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_MIN_LEGACY_F32_e32 3, undef %0:vgpr_32, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		# Rematerialization test for V_MAX_LEGACY_F32_e32 (flagged nofpexcept, with
		# implicit $exec and $mode uses).
		# Input: three virtual registers defined with immediates 1, 2 and 3 (second
		# source is an undef vgpr), each then read by an S_NOP.
		# Expected (GCN checks): only $vgpr0 and $vgpr1 are used; the definition with
		# immediate 3 appears after the first two S_NOP uses and no spill is emitted.
		# NOTE(review): the RUN line is outside this view; presumably it restricts the
		# number of available VGPRs so all three values cannot be live at once - confirm.
		name: test_remat_v_max_legacy_f32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_max_legacy_f32_e32
		; GCN: renamable $vgpr0 = nofpexcept V_MAX_LEGACY_F32_e32 1, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_MAX_LEGACY_F32_e32 2, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_MAX_LEGACY_F32_e32 3, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_MAX_LEGACY_F32_e32 1, undef %0:vgpr_32, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_MAX_LEGACY_F32_e32 2, undef %0:vgpr_32, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_MAX_LEGACY_F32_e32 3, undef %0:vgpr_32, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		# Rematerialization test for V_LSHR_B32_e32.
		# Input: three virtual registers defined with immediates 1, 2 and 3 (second
		# source is an undef vgpr), each then read by an S_NOP.
		# Expected (GCN checks): only $vgpr0 and $vgpr1 are used; the definition with
		# immediate 3 appears after the first two S_NOP uses and no spill is emitted.
		# NOTE(review): the RUN line is outside this view; presumably it restricts the
		# number of available VGPRs so all three values cannot be live at once - confirm.
		name: test_remat_v_lshr_b32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_lshr_b32_e32
		; GCN: renamable $vgpr0 = V_LSHR_B32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_LSHR_B32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_LSHR_B32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_LSHR_B32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_LSHR_B32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_LSHR_B32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		# Rematerialization test for V_LSHL_B32_e32.
		# Input: three virtual registers defined with immediates 1, 2 and 3 (second
		# source is an undef vgpr), each then read by an S_NOP.
		# Expected (GCN checks): only $vgpr0 and $vgpr1 are used; the definition with
		# immediate 3 appears after the first two S_NOP uses and no spill is emitted.
		# NOTE(review): the RUN line is outside this view; presumably it restricts the
		# number of available VGPRs so all three values cannot be live at once - confirm.
		name: test_remat_v_lshl_b32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_lshl_b32_e32
		; GCN: renamable $vgpr0 = V_LSHL_B32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_LSHL_B32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_LSHL_B32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_LSHL_B32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_LSHL_B32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_LSHL_B32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		# Rematerialization test for V_ASHR_I32_e32.
		# Input: three virtual registers defined with immediates 1, 2 and 3 (second
		# source is an undef vgpr), each then read by an S_NOP.
		# Expected (GCN checks): only $vgpr0 and $vgpr1 are used; the definition with
		# immediate 3 appears after the first two S_NOP uses and no spill is emitted.
		# NOTE(review): the RUN line is outside this view; presumably it restricts the
		# number of available VGPRs so all three values cannot be live at once - confirm.
		name: test_remat_v_ashr_i32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_ashr_i32_e32
		; GCN: renamable $vgpr0 = V_ASHR_I32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_ASHR_I32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_ASHR_I32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_ASHR_I32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_ASHR_I32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_ASHR_I32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		# Negative rematerialization test for V_LDEXP_F16_e32 (flagged nofpexcept,
		# with implicit $exec and $mode uses).
		# Input: three virtual registers defined with immediates 1, 2 and 3 (second
		# source is an undef vgpr), each then read by an S_NOP.
		# Expected (GCN checks): all three definitions stay ahead of the uses, and two
		# of the values go through SI_SPILL_V32_SAVE / SI_SPILL_V32_RESTORE on
		# %stack.1 and %stack.0 instead of being defined again next to their use.
		# stackPtrOffsetReg is $sgpr32, which appears as an operand of the spill
		# pseudos in the checks.
		# NOTE(review): presumably this opcode is deliberately not marked as
		# rematerializable in the .td changes of this patch - confirm.
		name: test_no_remat_v_ldexp_f16_e32
		tracksRegLiveness: true
		machineFunctionInfo:
		stackPtrOffsetReg: $sgpr32
		body: \|
		bb.0:
		; GCN-LABEL: name: test_no_remat_v_ldexp_f16_e32
		; GCN: renamable $vgpr0 = nofpexcept V_LDEXP_F16_e32 1, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.1, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.1, addrspace 5)
		; GCN: renamable $vgpr1 = nofpexcept V_LDEXP_F16_e32 2, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr0 = nofpexcept V_LDEXP_F16_e32 3, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.0, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.0, addrspace 5)
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.1, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.1, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.0, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.0, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_LDEXP_F16_e32 1, undef %0:vgpr_32, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_LDEXP_F16_e32 2, undef %0:vgpr_32, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_LDEXP_F16_e32 3, undef %0:vgpr_32, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		# Negative rematerialization test for V_LSHRREV_B16_e32.
		# Input: three virtual registers defined with immediates 1, 2 and 3 (second
		# source is an undef vgpr), each then read by an S_NOP.
		# Expected (GCN checks): all three definitions stay ahead of the uses, and two
		# of the values go through SI_SPILL_V32_SAVE / SI_SPILL_V32_RESTORE on
		# %stack.1 and %stack.0 instead of being defined again next to their use.
		# stackPtrOffsetReg is $sgpr32, which appears as an operand of the spill
		# pseudos in the checks.
		# NOTE(review): presumably this opcode is deliberately not marked as
		# rematerializable in the .td changes of this patch - confirm.
		name: test_no_remat_v_lshrrev_b16_e32
		tracksRegLiveness: true
		machineFunctionInfo:
		stackPtrOffsetReg: $sgpr32
		body: \|
		bb.0:
		; GCN-LABEL: name: test_no_remat_v_lshrrev_b16_e32
		; GCN: renamable $vgpr0 = V_LSHRREV_B16_e32 1, undef $vgpr0, implicit $exec
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.1, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.1, addrspace 5)
		; GCN: renamable $vgpr1 = V_LSHRREV_B16_e32 2, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr0 = V_LSHRREV_B16_e32 3, undef $vgpr0, implicit $exec
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.0, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.0, addrspace 5)
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.1, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.1, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.0, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.0, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_LSHRREV_B16_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_LSHRREV_B16_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_LSHRREV_B16_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		# Negative rematerialization test for V_LSHLREV_B16_e32.
		# Input: three virtual registers defined with immediates 1, 2 and 3 (second
		# source is an undef vgpr), each then read by an S_NOP.
		# Expected (GCN checks): all three definitions stay ahead of the uses, and two
		# of the values go through SI_SPILL_V32_SAVE / SI_SPILL_V32_RESTORE on
		# %stack.1 and %stack.0 instead of being defined again next to their use.
		# stackPtrOffsetReg is $sgpr32, which appears as an operand of the spill
		# pseudos in the checks.
		# NOTE(review): presumably this opcode is deliberately not marked as
		# rematerializable in the .td changes of this patch - confirm.
		name: test_no_remat_v_lshlrev_b16_e32
		tracksRegLiveness: true
		machineFunctionInfo:
		stackPtrOffsetReg: $sgpr32
		body: \|
		bb.0:
		; GCN-LABEL: name: test_no_remat_v_lshlrev_b16_e32
		; GCN: renamable $vgpr0 = V_LSHLREV_B16_e32 1, undef $vgpr0, implicit $exec
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.1, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.1, addrspace 5)
		; GCN: renamable $vgpr1 = V_LSHLREV_B16_e32 2, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr0 = V_LSHLREV_B16_e32 3, undef $vgpr0, implicit $exec
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.0, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.0, addrspace 5)
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.1, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.1, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.0, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.0, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_LSHLREV_B16_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_LSHLREV_B16_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_LSHLREV_B16_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		# Negative rematerialization test for V_ASHRREV_I16_e32.
		# Input: three virtual registers defined with immediates 1, 2 and 3 (second
		# source is an undef vgpr), each then read by an S_NOP.
		# Expected (GCN checks): all three definitions stay ahead of the uses, and two
		# of the values go through SI_SPILL_V32_SAVE / SI_SPILL_V32_RESTORE on
		# %stack.1 and %stack.0 instead of being defined again next to their use.
		# stackPtrOffsetReg is $sgpr32, which appears as an operand of the spill
		# pseudos in the checks.
		# NOTE(review): presumably this opcode is deliberately not marked as
		# rematerializable in the .td changes of this patch - confirm.
		name: test_no_remat_v_ashrrev_i16_e32
		tracksRegLiveness: true
		machineFunctionInfo:
		stackPtrOffsetReg: $sgpr32
		body: \|
		bb.0:
		; GCN-LABEL: name: test_no_remat_v_ashrrev_i16_e32
		; GCN: renamable $vgpr0 = V_ASHRREV_I16_e32 1, undef $vgpr0, implicit $exec
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.1, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.1, addrspace 5)
		; GCN: renamable $vgpr1 = V_ASHRREV_I16_e32 2, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr0 = V_ASHRREV_I16_e32 3, undef $vgpr0, implicit $exec
		; GCN: SI_SPILL_V32_SAVE killed $vgpr0, %stack.0, $sgpr32, 0, implicit $exec :: (store (s32) into %stack.0, addrspace 5)
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.1, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.1, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = SI_SPILL_V32_RESTORE %stack.0, $sgpr32, 0, implicit $exec :: (load (s32) from %stack.0, addrspace 5)
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_ASHRREV_I16_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_ASHRREV_I16_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_ASHRREV_I16_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		# Rematerialization test for V_XNOR_B32_e32.
		# Input: three virtual registers defined with immediates 1, 2 and 3 (second
		# source is an undef vgpr), each then read by an S_NOP.
		# Expected (GCN checks): only $vgpr0 and $vgpr1 are used; the definition with
		# immediate 3 appears after the first two S_NOP uses and no spill is emitted.
		# NOTE(review): the RUN line is outside this view; presumably it restricts the
		# number of available VGPRs so all three values cannot be live at once - confirm.
		name: test_remat_v_xnor_b32_e32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_xnor_b32_e32
		; GCN: renamable $vgpr0 = V_XNOR_B32_e32 1, undef $vgpr0, implicit $exec
		; GCN: renamable $vgpr1 = V_XNOR_B32_e32 2, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = V_XNOR_B32_e32 3, undef $vgpr0, implicit $exec
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = V_XNOR_B32_e32 1, undef %0:vgpr_32, implicit $exec
		%2:vgpr_32 = V_XNOR_B32_e32 2, undef %0:vgpr_32, implicit $exec
		%3:vgpr_32 = V_XNOR_B32_e32 3, undef %0:vgpr_32, implicit $exec
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		# Rematerialization test for V_FMAMK_F32 (flagged nofpexcept, with implicit
		# $exec and $mode uses).
		# Input: three virtual registers, each defined with the operand list
		# "N, N, undef vgpr" for N = 1, 2, 3, and each then read by an S_NOP.
		# Expected (GCN checks): only $vgpr0 and $vgpr1 are used; the N = 3 definition
		# appears after the first two S_NOP uses and no spill is emitted.
		# NOTE(review): the RUN line is outside this view; presumably it restricts the
		# number of available VGPRs so all three values cannot be live at once - confirm.
		name: test_remat_v_fmamk_f32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_fmamk_f32
		; GCN: renamable $vgpr0 = nofpexcept V_FMAMK_F32 1, 1, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_FMAMK_F32 2, 2, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_FMAMK_F32 3, 3, undef $vgpr0, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_FMAMK_F32 1, 1, undef %0:vgpr_32, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_FMAMK_F32 2, 2, undef %0:vgpr_32, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_FMAMK_F32 3, 3, undef %0:vgpr_32, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...
		---
		# Rematerialization test for V_FMAAK_F32 (flagged nofpexcept, with implicit
		# $exec and $mode uses).
		# Input: three virtual registers, each defined with the operand list
		# "N, undef vgpr, N" for N = 1, 2, 3, and each then read by an S_NOP.
		# Expected (GCN checks): only $vgpr0 and $vgpr1 are used; the N = 3 definition
		# appears after the first two S_NOP uses and no spill is emitted.
		# NOTE(review): the RUN line is outside this view; presumably it restricts the
		# number of available VGPRs so all three values cannot be live at once - confirm.
		name: test_remat_v_fmaak_f32
		tracksRegLiveness: true
		body: \|
		bb.0:
		; GCN-LABEL: name: test_remat_v_fmaak_f32
		; GCN: renamable $vgpr0 = nofpexcept V_FMAAK_F32 1, undef $vgpr0, 1, implicit $exec, implicit $mode
		; GCN: renamable $vgpr1 = nofpexcept V_FMAAK_F32 2, undef $vgpr0, 2, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_NOP 0, implicit killed renamable $vgpr1
		; GCN: renamable $vgpr0 = nofpexcept V_FMAAK_F32 3, undef $vgpr0, 3, implicit $exec, implicit $mode
		; GCN: S_NOP 0, implicit killed renamable $vgpr0
		; GCN: S_ENDPGM 0
		%1:vgpr_32 = nofpexcept V_FMAAK_F32 1, undef %0:vgpr_32, 1, implicit $exec, implicit $mode
		%2:vgpr_32 = nofpexcept V_FMAAK_F32 2, undef %0:vgpr_32, 2, implicit $exec, implicit $mode
		%3:vgpr_32 = nofpexcept V_FMAAK_F32 3, undef %0:vgpr_32, 3, implicit $exec, implicit $mode
		S_NOP 0, implicit %1
		S_NOP 0, implicit %2
		S_NOP 0, implicit %3
		S_ENDPGM 0
		...

This is an archive of the discontinued LLVM Phabricator instance.

[AMDGPU] Mark relevant rematerializable VOP2 instructions
Closed, Public

Details

Diff Detail

Unit Tests: Failed

Event Timeline

Revision Contents

Diff 359162

llvm/lib/Target/AMDGPU/SIInstrInfo.cpp

llvm/lib/Target/AMDGPU/VOP2Instructions.td

llvm/test/CodeGen/AMDGPU/remat-vop.mir

This is an archive of the discontinued LLVM Phabricator instance.

[AMDGPU] Mark relevant rematerializable VOP2 instructions (Closed, Public)

Details

Diff Detail

Unit Tests: Failed

Event Timeline

Revision Contents

Diff 359162

llvm/lib/Target/AMDGPU/SIInstrInfo.cpp

llvm/lib/Target/AMDGPU/VOP2Instructions.td

llvm/test/CodeGen/AMDGPU/remat-vop.mir

[AMDGPU] Mark relevant rematerializable VOP2 instructions
Closed, Public