This is an archive of the discontinued LLVM Phabricator instance.

Paths

Table of Contents

-
llvm/trunk/
-
trunk/
-
lib/Target/PowerPC/
-
Target/
-
PowerPC/
-
PPCISelDAGToDAG.cpp
-
PPCISelLowering.h
-
PPCISelLowering.cpp
-
PPCInstr64Bit.td
-
PPCInstrInfo.td
-
PPCInstrVSX.td
-
test/CodeGen/PowerPC/
-
CodeGen/
-
PowerPC/
-
build-vector-tests.ll
-
unaligned-addressing-mode.ll

Differential D62173

[PowerPC] [ISEL] select x-form instruction for unaligned offset
ClosedPublic

Authored by shchenz on May 20 2019, 10:52 PM.

Download Raw Diff

Details

Reviewers

hfinkel
jsji
nemanjai
steven.zhang

Commits

rL361346: [PowerPC] [ISEL] select x-form instruction for unaligned offset

Summary

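This patch fixes suboptimal instruction selection for a memory access whose constant offset is not a multiple of the alignment required by the displacement-form encoding, for example: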

t50: i64 = add t44:1, Constant:i64<3>
t16: i64,ch = load<(load 8 from %ir.uglygep910.cast, !tbaa !3)> t0, t50, undef:i64

Currently we generate:

t50: i64 = ADDI8 t55:1, TargetConstant:i64<3>
t16: i64,ch = LD<Mem:(load 8 from %ir.uglygep910.cast, !tbaa !3)> TargetConstant:i64<0>, t50, t0

But this is not optimal; we should use an x-form load here instead, like:

t46: i64 = LI8 TargetConstant:i64<3>
t18: i64,ch = LDX<Mem:(load 8 from %ir.uglygep910.cast, !tbaa !3)> t55:1, t46, t0

This is better because, if the above load is inside a loop, the LI8 can later be hoisted out of the loop by LICM, depending on register pressure.

This gains 10% on a small test case and 3% on 526.blender_r of SPEC 2017 on PWR8.

Diff Detail

Repository: rL LLVM

Event Timeline

shchenz created this revision.May 20 2019, 10:52 PM

Herald added a project: Restricted Project. · View Herald TranscriptMay 20 2019, 10:52 PM

Herald added subscribers: jfb, kosarev, hiraditya. · View Herald Transcript

LGTM

This revision is now accepted and ready to land.May 21 2019, 8:11 AM

Closed by commit rL361346: [PowerPC] [ISEL] select x-form instruction for unaligned offset (authored by shchenz). · Explain WhyMay 21 2019, 7:55 PM

This revision was automatically updated to reflect the committed changes.

Revision Contents

Path

Size

llvm/

trunk/

lib/

Target/

PowerPC/

56 lines

16 lines

21 lines

10 lines

21 lines

76 lines

test/

CodeGen/

PowerPC/

build-vector-tests.ll

32 lines

unaligned-addressing-mode.ll

19 lines

Diff 200629

llvm/trunk/lib/Target/PowerPC/PPCISelDAGToDAG.cpp

Show First 20 Lines • Show All 212 Lines • ▼ Show 20 Lines	public:
// an X-Form store instruction with the offset being a relocation coming from		// an X-Form store instruction with the offset being a relocation coming from
// the PPCISD::ADD_TLS.		// the PPCISD::ADD_TLS.
bool tryTLSXFormStore(StoreSDNode *N);		bool tryTLSXFormStore(StoreSDNode *N);
/// SelectCC - Select a comparison of the specified values with the		/// SelectCC - Select a comparison of the specified values with the
/// specified condition code, returning the CR# of the expression.		/// specified condition code, returning the CR# of the expression.
SDValue SelectCC(SDValue LHS, SDValue RHS, ISD::CondCode CC,		SDValue SelectCC(SDValue LHS, SDValue RHS, ISD::CondCode CC,
const SDLoc &dl);		const SDLoc &dl);

/// SelectAddrImm - Returns true if the address N can be represented by
/// a base register plus a signed 16-bit displacement [r+imm].
bool SelectAddrImm(SDValue N, SDValue &Disp,
SDValue &Base) {
return PPCLowering->SelectAddressRegImm(N, Disp, Base, *CurDAG, 0);
}

/// SelectAddrImmOffs - Return true if the operand is valid for a preinc		/// SelectAddrImmOffs - Return true if the operand is valid for a preinc
/// immediate field. Note that the operand at this point is already the		/// immediate field. Note that the operand at this point is already the
/// result of a prior SelectAddressRegImm call.		/// result of a prior SelectAddressRegImm call.
bool SelectAddrImmOffs(SDValue N, SDValue &Out) const {		bool SelectAddrImmOffs(SDValue N, SDValue &Out) const {
if (N.getOpcode() == ISD::TargetConstant \|\|		if (N.getOpcode() == ISD::TargetConstant \|\|
N.getOpcode() == ISD::TargetGlobalAddress) {		N.getOpcode() == ISD::TargetGlobalAddress) {
Out = N;		Out = N;
return true;		return true;
}		}

return false;		return false;
}		}

/// SelectAddrIdx - Given the specified addressed, check to see if it can be		/// SelectAddrIdx - Given the specified address, check to see if it can be
/// represented as an indexed [r+r] operation. Returns false if it can		/// represented as an indexed [r+r] operation.
/// be represented by [r+imm], which are preferred.		/// This is for xform instructions whose associated displacement form is D.
		/// The last parameter \p 0 means associated D form has no requirment for 16
		/// bit signed displacement.
		/// Returns false if it can be represented by [r+imm], which are preferred.
bool SelectAddrIdx(SDValue N, SDValue &Base, SDValue &Index) {		bool SelectAddrIdx(SDValue N, SDValue &Base, SDValue &Index) {
return PPCLowering->SelectAddressRegReg(N, Base, Index, *CurDAG);		return PPCLowering->SelectAddressRegReg(N, Base, Index, *CurDAG, 0);
		}

		/// SelectAddrIdx4 - Given the specified address, check to see if it can be
		/// represented as an indexed [r+r] operation.
		/// This is for xform instructions whose associated displacement form is DS.
		/// The last parameter \p 4 means associated DS form 16 bit signed
		/// displacement must be a multiple of 4.
		/// Returns false if it can be represented by [r+imm], which are preferred.
		bool SelectAddrIdxX4(SDValue N, SDValue &Base, SDValue &Index) {
		return PPCLowering->SelectAddressRegReg(N, Base, Index, *CurDAG, 4);
}		}

/// SelectAddrIdxOnly - Given the specified addressed, force it to be		/// SelectAddrIdx16 - Given the specified address, check to see if it can be
		/// represented as an indexed [r+r] operation.
		/// This is for xform instructions whose associated displacement form is DQ.
		/// The last parameter \p 16 means associated DQ form 16 bit signed
		/// displacement must be a multiple of 16.
		/// Returns false if it can be represented by [r+imm], which are preferred.
		bool SelectAddrIdxX16(SDValue N, SDValue &Base, SDValue &Index) {
		return PPCLowering->SelectAddressRegReg(N, Base, Index, *CurDAG, 16);
		}

		/// SelectAddrIdxOnly - Given the specified address, force it to be
/// represented as an indexed [r+r] operation.		/// represented as an indexed [r+r] operation.
bool SelectAddrIdxOnly(SDValue N, SDValue &Base, SDValue &Index) {		bool SelectAddrIdxOnly(SDValue N, SDValue &Base, SDValue &Index) {
return PPCLowering->SelectAddressRegRegOnly(N, Base, Index, *CurDAG);		return PPCLowering->SelectAddressRegRegOnly(N, Base, Index, *CurDAG);
}		}

		/// SelectAddrImm - Returns true if the address N can be represented by
		/// a base register plus a signed 16-bit displacement [r+imm].
		/// The last parameter \p 0 means D form has no requirment for 16 bit signed
		/// displacement.
		bool SelectAddrImm(SDValue N, SDValue &Disp,
		SDValue &Base) {
		return PPCLowering->SelectAddressRegImm(N, Disp, Base, *CurDAG, 0);
		}

/// SelectAddrImmX4 - Returns true if the address N can be represented by		/// SelectAddrImmX4 - Returns true if the address N can be represented by
/// a base register plus a signed 16-bit displacement that is a multiple of 4.		/// a base register plus a signed 16-bit displacement that is a multiple of
/// Suitable for use by STD and friends.		/// 4 (last parameter). Suitable for use by STD and friends.
bool SelectAddrImmX4(SDValue N, SDValue &Disp, SDValue &Base) {		bool SelectAddrImmX4(SDValue N, SDValue &Disp, SDValue &Base) {
return PPCLowering->SelectAddressRegImm(N, Disp, Base, *CurDAG, 4);		return PPCLowering->SelectAddressRegImm(N, Disp, Base, *CurDAG, 4);
}		}

		/// SelectAddrImmX16 - Returns true if the address N can be represented by
		/// a base register plus a signed 16-bit displacement that is a multiple of
		/// 16(last parameter). Suitable for use by STXV and friends.
bool SelectAddrImmX16(SDValue N, SDValue &Disp, SDValue &Base) {		bool SelectAddrImmX16(SDValue N, SDValue &Disp, SDValue &Base) {
return PPCLowering->SelectAddressRegImm(N, Disp, Base, *CurDAG, 16);		return PPCLowering->SelectAddressRegImm(N, Disp, Base, *CurDAG, 16);
}		}

// Select an address into a single register.		// Select an address into a single register.
bool SelectAddr(SDValue N, SDValue &Base) {		bool SelectAddr(SDValue N, SDValue &Base) {
Base = N;		Base = N;
return true;		return true;
▲ Show 20 Lines • Show All 6,254 Lines • Show Last 20 Lines

llvm/trunk/lib/Target/PowerPC/PPCISelLowering.h

Show First 20 Lines • Show All 654 Lines • ▼ Show 20 Lines	public:
/// offset pointer and addressing mode by reference if the node's address		/// offset pointer and addressing mode by reference if the node's address
/// can be legally represented as pre-indexed load / store address.		/// can be legally represented as pre-indexed load / store address.
bool getPreIndexedAddressParts(SDNode *N, SDValue &Base,		bool getPreIndexedAddressParts(SDNode *N, SDValue &Base,
SDValue &Offset,		SDValue &Offset,
ISD::MemIndexedMode &AM,		ISD::MemIndexedMode &AM,
SelectionDAG &DAG) const override;		SelectionDAG &DAG) const override;

/// SelectAddressRegReg - Given the specified addressed, check to see if it		/// SelectAddressRegReg - Given the specified addressed, check to see if it
/// can be represented as an indexed [r+r] operation. Returns false if it		/// can be more efficiently represented as [r+imm]. If \p EncodingAlignment
/// can be more efficiently represented with [r+imm].		/// is non-zero, only accept displacement which is not suitable for [r+imm].
		/// Returns false if it can be represented by [r+imm], which are preferred.
bool SelectAddressRegReg(SDValue N, SDValue &Base, SDValue &Index,		bool SelectAddressRegReg(SDValue N, SDValue &Base, SDValue &Index,
SelectionDAG &DAG) const;		SelectionDAG &DAG,
		unsigned EncodingAlignment = 0) const;

/// SelectAddressRegImm - Returns true if the address N can be represented		/// SelectAddressRegImm - Returns true if the address N can be represented
/// by a base register plus a signed 16-bit displacement [r+imm], and if it		/// by a base register plus a signed 16-bit displacement [r+imm], and if it
/// is not better represented as reg+reg. If Aligned is true, only accept		/// is not better represented as reg+reg. If \p EncodingAlignment is
/// displacements suitable for STD and friends, i.e. multiples of 4.		/// non-zero, only accept displacements suitable for instruction encoding
		/// requirement, i.e. multiples of 4 for DS form.
bool SelectAddressRegImm(SDValue N, SDValue &Disp, SDValue &Base,		bool SelectAddressRegImm(SDValue N, SDValue &Disp, SDValue &Base,
SelectionDAG &DAG, unsigned Alignment) const;		SelectionDAG &DAG,
		unsigned EncodingAlignment) const;

/// SelectAddressRegRegOnly - Given the specified addressed, force it to be		/// SelectAddressRegRegOnly - Given the specified addressed, force it to be
/// represented as an indexed [r+r] operation.		/// represented as an indexed [r+r] operation.
bool SelectAddressRegRegOnly(SDValue N, SDValue &Base, SDValue &Index,		bool SelectAddressRegRegOnly(SDValue N, SDValue &Base, SDValue &Index,
SelectionDAG &DAG) const;		SelectionDAG &DAG) const;

Sched::Preference getSchedulingPreference(SDNode *N) const override;		Sched::Preference getSchedulingPreference(SDNode *N) const override;

▲ Show 20 Lines • Show All 505 Lines • Show Last 20 Lines

llvm/trunk/lib/Target/PowerPC/PPCISelLowering.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 2,213 Lines • ▼ Show 20 Lines	else
return Imm == (int64_t)cast<ConstantSDNode>(N)->getZExtValue();		return Imm == (int64_t)cast<ConstantSDNode>(N)->getZExtValue();
}		}
bool llvm::isIntS16Immediate(SDValue Op, int16_t &Imm) {		bool llvm::isIntS16Immediate(SDValue Op, int16_t &Imm) {
return isIntS16Immediate(Op.getNode(), Imm);		return isIntS16Immediate(Op.getNode(), Imm);
}		}

/// SelectAddressRegReg - Given the specified addressed, check to see if it		/// SelectAddressRegReg - Given the specified addressed, check to see if it
/// can be represented as an indexed [r+r] operation. Returns false if it		/// can be represented as an indexed [r+r] operation. Returns false if it
/// can be more efficiently represented with [r+imm].		/// can be more efficiently represented as [r+imm]. If \p EncodingAlignment is
		/// non-zero and N can be represented by a base register plus a signed 16-bit
		/// displacement, make a more precise judgement by checking (displacement % \p
		/// EncodingAlignment).
bool PPCTargetLowering::SelectAddressRegReg(SDValue N, SDValue &Base,		bool PPCTargetLowering::SelectAddressRegReg(SDValue N, SDValue &Base,
SDValue &Index,		SDValue &Index, SelectionDAG &DAG,
SelectionDAG &DAG) const {		unsigned EncodingAlignment) const {
int16_t imm = 0;		int16_t imm = 0;
if (N.getOpcode() == ISD::ADD) {		if (N.getOpcode() == ISD::ADD) {
if (isIntS16Immediate(N.getOperand(1), imm))		if (isIntS16Immediate(N.getOperand(1), imm) &&
		(!EncodingAlignment \|\| !(imm % EncodingAlignment)))
return false; // r+i		return false; // r+i
if (N.getOperand(1).getOpcode() == PPCISD::Lo)		if (N.getOperand(1).getOpcode() == PPCISD::Lo)
return false; // r+i		return false; // r+i

Base = N.getOperand(0);		Base = N.getOperand(0);
Index = N.getOperand(1);		Index = N.getOperand(1);
return true;		return true;
} else if (N.getOpcode() == ISD::OR) {		} else if (N.getOpcode() == ISD::OR) {
if (isIntS16Immediate(N.getOperand(1), imm))		if (isIntS16Immediate(N.getOperand(1), imm) &&
		(!EncodingAlignment \|\| !(imm % EncodingAlignment)))
return false; // r+i can fold it if we can.		return false; // r+i can fold it if we can.

// If this is an or of disjoint bitfields, we can codegen this as an add		// If this is an or of disjoint bitfields, we can codegen this as an add
// (for better address arithmetic) if the LHS and RHS of the OR are provably		// (for better address arithmetic) if the LHS and RHS of the OR are provably
// disjoint.		// disjoint.
KnownBits LHSKnown = DAG.computeKnownBits(N.getOperand(0));		KnownBits LHSKnown = DAG.computeKnownBits(N.getOperand(0));

if (LHSKnown.Zero.getBoolValue()) {		if (LHSKnown.Zero.getBoolValue()) {
KnownBits RHSKnown = DAG.computeKnownBits(N.getOperand(1));		KnownBits RHSKnown = DAG.computeKnownBits(N.getOperand(1));
▲ Show 20 Lines • Show All 56 Lines • ▼ Show 20 Lines
/// displacements that are multiples of that value.		/// displacements that are multiples of that value.
bool PPCTargetLowering::SelectAddressRegImm(SDValue N, SDValue &Disp,		bool PPCTargetLowering::SelectAddressRegImm(SDValue N, SDValue &Disp,
SDValue &Base,		SDValue &Base,
SelectionDAG &DAG,		SelectionDAG &DAG,
unsigned EncodingAlignment) const {		unsigned EncodingAlignment) const {
// FIXME dl should come from parent load or store, not from address		// FIXME dl should come from parent load or store, not from address
SDLoc dl(N);		SDLoc dl(N);
// If this can be more profitably realized as r+r, fail.		// If this can be more profitably realized as r+r, fail.
if (SelectAddressRegReg(N, Disp, Base, DAG))		if (SelectAddressRegReg(N, Disp, Base, DAG, EncodingAlignment))
return false;		return false;

if (N.getOpcode() == ISD::ADD) {		if (N.getOpcode() == ISD::ADD) {
int16_t imm = 0;		int16_t imm = 0;
if (isIntS16Immediate(N.getOperand(1), imm) &&		if (isIntS16Immediate(N.getOperand(1), imm) &&
(!EncodingAlignment \|\| (imm % EncodingAlignment) == 0)) {		(!EncodingAlignment \|\| (imm % EncodingAlignment) == 0)) {
Disp = DAG.getTargetConstant(imm, dl, N.getValueType());		Disp = DAG.getTargetConstant(imm, dl, N.getValueType());
if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(N.getOperand(0))) {		if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(N.getOperand(0))) {
▲ Show 20 Lines • Show All 12,721 Lines • Show Last 20 Lines

llvm/trunk/lib/Target/PowerPC/PPCInstr64Bit.td

Show First 20 Lines • Show All 921 Lines • ▼ Show 20 Lines	def LWA : DSForm_1<58, 2, (outs g8rc:$rD), (ins memrix:$src),
PPC970_DGroup_Cracked;		PPC970_DGroup_Cracked;
let Interpretation64Bit = 1, isCodeGenOnly = 1 in		let Interpretation64Bit = 1, isCodeGenOnly = 1 in
def LHAX8: XForm_1_memOp<31, 343, (outs g8rc:$rD), (ins memrr:$src),		def LHAX8: XForm_1_memOp<31, 343, (outs g8rc:$rD), (ins memrr:$src),
"lhax $rD, $src", IIC_LdStLHA,		"lhax $rD, $src", IIC_LdStLHA,
[(set i64:$rD, (sextloadi16 xaddr:$src))]>,		[(set i64:$rD, (sextloadi16 xaddr:$src))]>,
PPC970_DGroup_Cracked;		PPC970_DGroup_Cracked;
def LWAX : XForm_1_memOp<31, 341, (outs g8rc:$rD), (ins memrr:$src),		def LWAX : XForm_1_memOp<31, 341, (outs g8rc:$rD), (ins memrr:$src),
"lwax $rD, $src", IIC_LdStLHA,		"lwax $rD, $src", IIC_LdStLHA,
[(set i64:$rD, (sextloadi32 xaddr:$src))]>, isPPC64,		[(set i64:$rD, (sextloadi32 xaddrX4:$src))]>, isPPC64,
PPC970_DGroup_Cracked;		PPC970_DGroup_Cracked;
// For fast-isel:		// For fast-isel:
let isCodeGenOnly = 1, mayLoad = 1 in {		let isCodeGenOnly = 1, mayLoad = 1 in {
def LWA_32 : DSForm_1<58, 2, (outs gprc:$rD), (ins memrix:$src),		def LWA_32 : DSForm_1<58, 2, (outs gprc:$rD), (ins memrix:$src),
"lwa $rD, $src", IIC_LdStLWA, []>, isPPC64,		"lwa $rD, $src", IIC_LdStLWA, []>, isPPC64,
PPC970_DGroup_Cracked;		PPC970_DGroup_Cracked;
def LWAX_32 : XForm_1_memOp<31, 341, (outs gprc:$rD), (ins memrr:$src),		def LWAX_32 : XForm_1_memOp<31, 341, (outs gprc:$rD), (ins memrr:$src),
"lwax $rD, $src", IIC_LdStLHA, []>, isPPC64,		"lwax $rD, $src", IIC_LdStLHA, []>, isPPC64,
▲ Show 20 Lines • Show All 108 Lines • ▼ Show 20 Lines	def LDtocCPT: PPCEmitTimePseudo<(outs g8rc:$rD), (ins tocentry:$disp, g8rc:$reg),
(PPCtoc_entry tconstpool:$disp, i64:$reg))]>, isPPC64;		(PPCtoc_entry tconstpool:$disp, i64:$reg))]>, isPPC64;
def LDtocBA: PPCEmitTimePseudo<(outs g8rc:$rD), (ins tocentry:$disp, g8rc:$reg),		def LDtocBA: PPCEmitTimePseudo<(outs g8rc:$rD), (ins tocentry:$disp, g8rc:$reg),
"#LDtocCPT",		"#LDtocCPT",
[(set i64:$rD,		[(set i64:$rD,
(PPCtoc_entry tblockaddress:$disp, i64:$reg))]>, isPPC64;		(PPCtoc_entry tblockaddress:$disp, i64:$reg))]>, isPPC64;

def LDX : XForm_1_memOp<31, 21, (outs g8rc:$rD), (ins memrr:$src),		def LDX : XForm_1_memOp<31, 21, (outs g8rc:$rD), (ins memrr:$src),
"ldx $rD, $src", IIC_LdStLD,		"ldx $rD, $src", IIC_LdStLD,
[(set i64:$rD, (load xaddr:$src))]>, isPPC64;		[(set i64:$rD, (load xaddrX4:$src))]>, isPPC64;
def LDBRX : XForm_1_memOp<31, 532, (outs g8rc:$rD), (ins memrr:$src),		def LDBRX : XForm_1_memOp<31, 532, (outs g8rc:$rD), (ins memrr:$src),
"ldbrx $rD, $src", IIC_LdStLoad,		"ldbrx $rD, $src", IIC_LdStLoad,
[(set i64:$rD, (PPClbrx xoaddr:$src, i64))]>, isPPC64;		[(set i64:$rD, (PPClbrx xoaddr:$src, i64))]>, isPPC64;

let mayLoad = 1, hasSideEffects = 0, isCodeGenOnly = 1 in {		let mayLoad = 1, hasSideEffects = 0, isCodeGenOnly = 1 in {
def LHBRX8 : XForm_1_memOp<31, 790, (outs g8rc:$rD), (ins memrr:$src),		def LHBRX8 : XForm_1_memOp<31, 790, (outs g8rc:$rD), (ins memrr:$src),
"lhbrx $rD, $src", IIC_LdStLoad, []>;		"lhbrx $rD, $src", IIC_LdStLoad, []>;
def LWBRX8 : XForm_1_memOp<31, 534, (outs g8rc:$rD), (ins memrr:$src),		def LWBRX8 : XForm_1_memOp<31, 534, (outs g8rc:$rD), (ins memrr:$src),
▲ Show 20 Lines • Show All 155 Lines • ▼ Show 20 Lines
} // Interpretation64Bit		} // Interpretation64Bit

// Normal 8-byte stores.		// Normal 8-byte stores.
def STD : DSForm_1<62, 0, (outs), (ins g8rc:$rS, memrix:$dst),		def STD : DSForm_1<62, 0, (outs), (ins g8rc:$rS, memrix:$dst),
"std $rS, $dst", IIC_LdStSTD,		"std $rS, $dst", IIC_LdStSTD,
[(aligned4store i64:$rS, ixaddr:$dst)]>, isPPC64;		[(aligned4store i64:$rS, ixaddr:$dst)]>, isPPC64;
def STDX : XForm_8_memOp<31, 149, (outs), (ins g8rc:$rS, memrr:$dst),		def STDX : XForm_8_memOp<31, 149, (outs), (ins g8rc:$rS, memrr:$dst),
"stdx $rS, $dst", IIC_LdStSTD,		"stdx $rS, $dst", IIC_LdStSTD,
[(store i64:$rS, xaddr:$dst)]>, isPPC64,		[(store i64:$rS, xaddrX4:$dst)]>, isPPC64,
PPC970_DGroup_Cracked;		PPC970_DGroup_Cracked;
def STDBRX: XForm_8_memOp<31, 660, (outs), (ins g8rc:$rS, memrr:$dst),		def STDBRX: XForm_8_memOp<31, 660, (outs), (ins g8rc:$rS, memrr:$dst),
"stdbrx $rS, $dst", IIC_LdStStore,		"stdbrx $rS, $dst", IIC_LdStStore,
[(PPCstbrx i64:$rS, xoaddr:$dst, i64)]>, isPPC64,		[(PPCstbrx i64:$rS, xoaddr:$dst, i64)]>, isPPC64,
PPC970_DGroup_Cracked;		PPC970_DGroup_Cracked;
}		}

// Stores with Update (pre-inc).		// Stores with Update (pre-inc).
▲ Show 20 Lines • Show All 200 Lines • ▼ Show 20 Lines	def : Pat<(i64 (unaligned4sextloadi32 xoaddr:$src)),
(LWAX xoaddr:$src)>;		(LWAX xoaddr:$src)>;
def : Pat<(i64 (unaligned4load xoaddr:$src)),		def : Pat<(i64 (unaligned4load xoaddr:$src)),
(LDX xoaddr:$src)>;		(LDX xoaddr:$src)>;
def : Pat<(unaligned4store i64:$rS, xoaddr:$dst),		def : Pat<(unaligned4store i64:$rS, xoaddr:$dst),
(STDX $rS, xoaddr:$dst)>;		(STDX $rS, xoaddr:$dst)>;

// 64-bits atomic loads and stores		// 64-bits atomic loads and stores
def : Pat<(atomic_load_64 ixaddr:$src), (LD memrix:$src)>;		def : Pat<(atomic_load_64 ixaddr:$src), (LD memrix:$src)>;
def : Pat<(atomic_load_64 xaddr:$src), (LDX memrr:$src)>;		def : Pat<(atomic_load_64 xaddrX4:$src), (LDX memrr:$src)>;

def : Pat<(atomic_store_64 ixaddr:$ptr, i64:$val), (STD g8rc:$val, memrix:$ptr)>;		def : Pat<(atomic_store_64 ixaddr:$ptr, i64:$val), (STD g8rc:$val, memrix:$ptr)>;
def : Pat<(atomic_store_64 xaddr:$ptr, i64:$val), (STDX g8rc:$val, memrr:$ptr)>;		def : Pat<(atomic_store_64 xaddrX4:$ptr, i64:$val), (STDX g8rc:$val, memrr:$ptr)>;

let Predicates = [IsISA3_0] in {		let Predicates = [IsISA3_0] in {

class X_L1_RA5_RB5<bits<6> opcode, bits<10> xo, string opc, RegisterOperand ty,		class X_L1_RA5_RB5<bits<6> opcode, bits<10> xo, string opc, RegisterOperand ty,
InstrItinClass itin, list<dag> pattern>		InstrItinClass itin, list<dag> pattern>
: X_L1_RS5_RS5<opcode, xo, (outs), (ins ty:$rA, ty:$rB, u1imm:$L),		: X_L1_RS5_RS5<opcode, xo, (outs), (ins ty:$rA, ty:$rB, u1imm:$L),
!strconcat(opc, " $rA, $rB, $L"), itin, pattern>;		!strconcat(opc, " $rA, $rB, $L"), itin, pattern>;

Show All 13 Lines

llvm/trunk/lib/Target/PowerPC/PPCInstrInfo.td

	Show First 20 Lines • Show All 887 Lines • ▼ Show 20 Lines

	// PowerPC Predicate operand.			// PowerPC Predicate operand.
	def pred : Operand<OtherVT> {			def pred : Operand<OtherVT> {
	let PrintMethod = "printPredicateOperand";			let PrintMethod = "printPredicateOperand";
	let MIOperandInfo = (ops i32imm:$bibo, crrc:$reg);			let MIOperandInfo = (ops i32imm:$bibo, crrc:$reg);
	}			}

	// Define PowerPC specific addressing mode.			// Define PowerPC specific addressing mode.
	def iaddr : ComplexPattern<iPTR, 2, "SelectAddrImm", [], []>;
	def xaddr : ComplexPattern<iPTR, 2, "SelectAddrIdx", [], []>;			// d-form
	def xoaddr : ComplexPattern<iPTR, 2, "SelectAddrIdxOnly",[], []>;			def iaddr : ComplexPattern<iPTR, 2, "SelectAddrImm", [], []>; // "stb"
				// ds-form
	def ixaddr : ComplexPattern<iPTR, 2, "SelectAddrImmX4", [], []>; // "std"			def ixaddr : ComplexPattern<iPTR, 2, "SelectAddrImmX4", [], []>; // "std"
				// dq-form
	def iqaddr : ComplexPattern<iPTR, 2, "SelectAddrImmX16", [], []>; // "stxv"			def iqaddr : ComplexPattern<iPTR, 2, "SelectAddrImmX16", [], []>; // "stxv"

				// Below forms are all x-form addressing mode, use three different ones so we
				// can make a accurate check for x-form instructions in ISEL.
				// x-form addressing mode whose associated diplacement form is D.
				def xaddr : ComplexPattern<iPTR, 2, "SelectAddrIdx", [], []>; // "stbx"
				// x-form addressing mode whose associated diplacement form is DS.
				def xaddrX4 : ComplexPattern<iPTR, 2, "SelectAddrIdxX4", [], []>; // "stdx"
				// x-form addressing mode whose associated diplacement form is DQ.
				def xaddrX16 : ComplexPattern<iPTR, 2, "SelectAddrIdxX16", [], []>; // "stxvx"

				def xoaddr : ComplexPattern<iPTR, 2, "SelectAddrIdxOnly",[], []>;

	// The address in a single register. This is used with the SjLj			// The address in a single register. This is used with the SjLj
	// pseudo-instructions.			// pseudo-instructions.
	def addr : ComplexPattern<iPTR, 1, "SelectAddr",[], []>;			def addr : ComplexPattern<iPTR, 1, "SelectAddr",[], []>;

	/// This is just the offset part of iaddr, used for preinc.			/// This is just the offset part of iaddr, used for preinc.
	def iaddroff : ComplexPattern<iPTR, 1, "SelectAddrImmOffs", [], []>;			def iaddroff : ComplexPattern<iPTR, 1, "SelectAddrImmOffs", [], []>;

	//===----------------------------------------------------------------------===//			//===----------------------------------------------------------------------===//
	▲ Show 20 Lines • Show All 4,074 Lines • Show Last 20 Lines

llvm/trunk/lib/Target/PowerPC/PPCInstrVSX.td

Show First 20 Lines • Show All 2,851 Lines • ▼ Show 20 Lines	def LXSIHZX : X_XT6_RA5_RB5<31, 813, "lxsihzx", vsfrc,
[(set f64:$XT, (PPClxsizx xoaddr:$src, 2))]>;		[(set f64:$XT, (PPClxsizx xoaddr:$src, 2))]>;

// Load Vector Halfword8/Byte16 Indexed		// Load Vector Halfword8/Byte16 Indexed
def LXVH8X : X_XT6_RA5_RB5<31, 812, "lxvh8x" , vsrc, []>;		def LXVH8X : X_XT6_RA5_RB5<31, 812, "lxvh8x" , vsrc, []>;
def LXVB16X : X_XT6_RA5_RB5<31, 876, "lxvb16x", vsrc, []>;		def LXVB16X : X_XT6_RA5_RB5<31, 876, "lxvb16x", vsrc, []>;

// Load Vector Indexed		// Load Vector Indexed
def LXVX : X_XT6_RA5_RB5<31, 268, "lxvx" , vsrc,		def LXVX : X_XT6_RA5_RB5<31, 268, "lxvx" , vsrc,
[(set v2f64:$XT, (load xaddr:$src))]>;		[(set v2f64:$XT, (load xaddrX16:$src))]>;
// Load Vector (Left-justified) with Length		// Load Vector (Left-justified) with Length
def LXVL : XX1Form_memOp<31, 269, (outs vsrc:$XT), (ins memr:$src, g8rc:$rB),		def LXVL : XX1Form_memOp<31, 269, (outs vsrc:$XT), (ins memr:$src, g8rc:$rB),
"lxvl $XT, $src, $rB", IIC_LdStLoad,		"lxvl $XT, $src, $rB", IIC_LdStLoad,
[(set v4i32:$XT, (int_ppc_vsx_lxvl addr:$src, i64:$rB))]>;		[(set v4i32:$XT, (int_ppc_vsx_lxvl addr:$src, i64:$rB))]>;
def LXVLL : XX1Form_memOp<31,301, (outs vsrc:$XT), (ins memr:$src, g8rc:$rB),		def LXVLL : XX1Form_memOp<31,301, (outs vsrc:$XT), (ins memr:$src, g8rc:$rB),
"lxvll $XT, $src, $rB", IIC_LdStLoad,		"lxvll $XT, $src, $rB", IIC_LdStLoad,
[(set v4i32:$XT, (int_ppc_vsx_lxvll addr:$src, i64:$rB))]>;		[(set v4i32:$XT, (int_ppc_vsx_lxvll addr:$src, i64:$rB))]>;

Show All 31 Lines	let AddedComplexity = 400, Predicates = [HasP9Vector] in {
}		}

// Store Vector Halfword8/Byte16 Indexed		// Store Vector Halfword8/Byte16 Indexed
def STXVH8X : X_XS6_RA5_RB5<31, 940, "stxvh8x" , vsrc, []>;		def STXVH8X : X_XS6_RA5_RB5<31, 940, "stxvh8x" , vsrc, []>;
def STXVB16X : X_XS6_RA5_RB5<31, 1004, "stxvb16x", vsrc, []>;		def STXVB16X : X_XS6_RA5_RB5<31, 1004, "stxvb16x", vsrc, []>;

// Store Vector Indexed		// Store Vector Indexed
def STXVX : X_XS6_RA5_RB5<31, 396, "stxvx" , vsrc,		def STXVX : X_XS6_RA5_RB5<31, 396, "stxvx" , vsrc,
[(store v2f64:$XT, xaddr:$dst)]>;		[(store v2f64:$XT, xaddrX16:$dst)]>;

// Store Vector (Left-justified) with Length		// Store Vector (Left-justified) with Length
def STXVL : XX1Form_memOp<31, 397, (outs),		def STXVL : XX1Form_memOp<31, 397, (outs),
(ins vsrc:$XT, memr:$dst, g8rc:$rB),		(ins vsrc:$XT, memr:$dst, g8rc:$rB),
"stxvl $XT, $dst, $rB", IIC_LdStLoad,		"stxvl $XT, $dst, $rB", IIC_LdStLoad,
[(int_ppc_vsx_stxvl v4i32:$XT, addr:$dst,		[(int_ppc_vsx_stxvl v4i32:$XT, addr:$dst,
i64:$rB)]>;		i64:$rB)]>;
def STXVLL : XX1Form_memOp<31, 429, (outs),		def STXVLL : XX1Form_memOp<31, 429, (outs),
▲ Show 20 Lines • Show All 371 Lines • ▼ Show 20 Lines	let AddedComplexity = 400, Predicates = [HasP9Vector] in {

let AddedComplexity = 400 in {		let AddedComplexity = 400 in {
// The following pseudoinstructions are used to ensure the utilization		// The following pseudoinstructions are used to ensure the utilization
// of all 64 VSX registers.		// of all 64 VSX registers.
let Predicates = [IsLittleEndian, HasP9Vector] in {		let Predicates = [IsLittleEndian, HasP9Vector] in {
def : Pat<(v2i64 (scalar_to_vector (i64 (load ixaddr:$src)))),		def : Pat<(v2i64 (scalar_to_vector (i64 (load ixaddr:$src)))),
(v2i64 (XXPERMDIs		(v2i64 (XXPERMDIs
(COPY_TO_REGCLASS (DFLOADf64 ixaddr:$src), VSRC), 2))>;		(COPY_TO_REGCLASS (DFLOADf64 ixaddr:$src), VSRC), 2))>;
def : Pat<(v2i64 (scalar_to_vector (i64 (load xaddr:$src)))),		def : Pat<(v2i64 (scalar_to_vector (i64 (load xaddrX4:$src)))),
(v2i64 (XXPERMDIs		(v2i64 (XXPERMDIs
(COPY_TO_REGCLASS (XFLOADf64 xaddr:$src), VSRC), 2))>;		(COPY_TO_REGCLASS (XFLOADf64 xaddrX4:$src), VSRC), 2))>;

def : Pat<(v2f64 (scalar_to_vector (f64 (load ixaddr:$src)))),		def : Pat<(v2f64 (scalar_to_vector (f64 (load ixaddr:$src)))),
(v2f64 (XXPERMDIs		(v2f64 (XXPERMDIs
(COPY_TO_REGCLASS (DFLOADf64 ixaddr:$src), VSRC), 2))>;		(COPY_TO_REGCLASS (DFLOADf64 ixaddr:$src), VSRC), 2))>;
def : Pat<(v2f64 (scalar_to_vector (f64 (load xaddr:$src)))),		def : Pat<(v2f64 (scalar_to_vector (f64 (load xaddrX4:$src)))),
(v2f64 (XXPERMDIs		(v2f64 (XXPERMDIs
(COPY_TO_REGCLASS (XFLOADf64 xaddr:$src), VSRC), 2))>;		(COPY_TO_REGCLASS (XFLOADf64 xaddrX4:$src), VSRC), 2))>;
def : Pat<(store (i64 (extractelt v2i64:$A, 0)), xaddr:$src),		def : Pat<(store (i64 (extractelt v2i64:$A, 0)), xaddrX4:$src),
(XFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),		(XFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),
sub_64), xaddr:$src)>;		sub_64), xaddrX4:$src)>;
def : Pat<(store (f64 (extractelt v2f64:$A, 0)), xaddr:$src),		def : Pat<(store (f64 (extractelt v2f64:$A, 0)), xaddrX4:$src),
(XFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),		(XFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),
sub_64), xaddr:$src)>;		sub_64), xaddrX4:$src)>;
def : Pat<(store (i64 (extractelt v2i64:$A, 1)), xaddr:$src),		def : Pat<(store (i64 (extractelt v2i64:$A, 1)), xaddrX4:$src),
(XFSTOREf64 (EXTRACT_SUBREG $A, sub_64), xaddr:$src)>;		(XFSTOREf64 (EXTRACT_SUBREG $A, sub_64), xaddrX4:$src)>;
def : Pat<(store (f64 (extractelt v2f64:$A, 1)), xaddr:$src),		def : Pat<(store (f64 (extractelt v2f64:$A, 1)), xaddrX4:$src),
(XFSTOREf64 (EXTRACT_SUBREG $A, sub_64), xaddr:$src)>;		(XFSTOREf64 (EXTRACT_SUBREG $A, sub_64), xaddrX4:$src)>;
def : Pat<(store (i64 (extractelt v2i64:$A, 0)), ixaddr:$src),		def : Pat<(store (i64 (extractelt v2i64:$A, 0)), ixaddr:$src),
(DFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),		(DFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),
sub_64), ixaddr:$src)>;		sub_64), ixaddr:$src)>;
def : Pat<(store (f64 (extractelt v2f64:$A, 0)), ixaddr:$src),		def : Pat<(store (f64 (extractelt v2f64:$A, 0)), ixaddr:$src),
(DFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2), sub_64),		(DFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2), sub_64),
ixaddr:$src)>;		ixaddr:$src)>;
def : Pat<(store (i64 (extractelt v2i64:$A, 1)), ixaddr:$src),		def : Pat<(store (i64 (extractelt v2i64:$A, 1)), ixaddr:$src),
(DFSTOREf64 (EXTRACT_SUBREG $A, sub_64), ixaddr:$src)>;		(DFSTOREf64 (EXTRACT_SUBREG $A, sub_64), ixaddr:$src)>;
def : Pat<(store (f64 (extractelt v2f64:$A, 1)), ixaddr:$src),		def : Pat<(store (f64 (extractelt v2f64:$A, 1)), ixaddr:$src),
(DFSTOREf64 (EXTRACT_SUBREG $A, sub_64), ixaddr:$src)>;		(DFSTOREf64 (EXTRACT_SUBREG $A, sub_64), ixaddr:$src)>;
} // IsLittleEndian, HasP9Vector		} // IsLittleEndian, HasP9Vector

let Predicates = [IsBigEndian, HasP9Vector] in {		let Predicates = [IsBigEndian, HasP9Vector] in {
def : Pat<(v2i64 (scalar_to_vector (i64 (load ixaddr:$src)))),		def : Pat<(v2i64 (scalar_to_vector (i64 (load ixaddr:$src)))),
(v2i64 (COPY_TO_REGCLASS (DFLOADf64 ixaddr:$src), VSRC))>;		(v2i64 (COPY_TO_REGCLASS (DFLOADf64 ixaddr:$src), VSRC))>;
def : Pat<(v2i64 (scalar_to_vector (i64 (load xaddr:$src)))),		def : Pat<(v2i64 (scalar_to_vector (i64 (load xaddrX4:$src)))),
(v2i64 (COPY_TO_REGCLASS (XFLOADf64 xaddr:$src), VSRC))>;		(v2i64 (COPY_TO_REGCLASS (XFLOADf64 xaddrX4:$src), VSRC))>;

def : Pat<(v2f64 (scalar_to_vector (f64 (load ixaddr:$src)))),		def : Pat<(v2f64 (scalar_to_vector (f64 (load ixaddr:$src)))),
(v2f64 (COPY_TO_REGCLASS (DFLOADf64 ixaddr:$src), VSRC))>;		(v2f64 (COPY_TO_REGCLASS (DFLOADf64 ixaddr:$src), VSRC))>;
def : Pat<(v2f64 (scalar_to_vector (f64 (load xaddr:$src)))),		def : Pat<(v2f64 (scalar_to_vector (f64 (load xaddrX4:$src)))),
(v2f64 (COPY_TO_REGCLASS (XFLOADf64 xaddr:$src), VSRC))>;		(v2f64 (COPY_TO_REGCLASS (XFLOADf64 xaddrX4:$src), VSRC))>;
def : Pat<(store (i64 (extractelt v2i64:$A, 1)), xaddr:$src),		def : Pat<(store (i64 (extractelt v2i64:$A, 1)), xaddrX4:$src),
(XFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),		(XFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),
sub_64), xaddr:$src)>;		sub_64), xaddrX4:$src)>;
def : Pat<(store (f64 (extractelt v2f64:$A, 1)), xaddr:$src),		def : Pat<(store (f64 (extractelt v2f64:$A, 1)), xaddrX4:$src),
(XFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),		(XFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),
sub_64), xaddr:$src)>;		sub_64), xaddrX4:$src)>;
def : Pat<(store (i64 (extractelt v2i64:$A, 0)), xaddr:$src),		def : Pat<(store (i64 (extractelt v2i64:$A, 0)), xaddrX4:$src),
(XFSTOREf64 (EXTRACT_SUBREG $A, sub_64), xaddr:$src)>;		(XFSTOREf64 (EXTRACT_SUBREG $A, sub_64), xaddrX4:$src)>;
def : Pat<(store (f64 (extractelt v2f64:$A, 0)), xaddr:$src),		def : Pat<(store (f64 (extractelt v2f64:$A, 0)), xaddrX4:$src),
(XFSTOREf64 (EXTRACT_SUBREG $A, sub_64), xaddr:$src)>;		(XFSTOREf64 (EXTRACT_SUBREG $A, sub_64), xaddrX4:$src)>;
def : Pat<(store (i64 (extractelt v2i64:$A, 1)), ixaddr:$src),		def : Pat<(store (i64 (extractelt v2i64:$A, 1)), ixaddr:$src),
(DFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),		(DFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),
sub_64), ixaddr:$src)>;		sub_64), ixaddr:$src)>;
def : Pat<(store (f64 (extractelt v2f64:$A, 1)), ixaddr:$src),		def : Pat<(store (f64 (extractelt v2f64:$A, 1)), ixaddr:$src),
(DFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),		(DFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),
sub_64), ixaddr:$src)>;		sub_64), ixaddr:$src)>;
def : Pat<(store (i64 (extractelt v2i64:$A, 0)), ixaddr:$src),		def : Pat<(store (i64 (extractelt v2i64:$A, 0)), ixaddr:$src),
(DFSTOREf64 (EXTRACT_SUBREG $A, sub_64), ixaddr:$src)>;		(DFSTOREf64 (EXTRACT_SUBREG $A, sub_64), ixaddr:$src)>;
▲ Show 20 Lines • Show All 130 Lines • ▼ Show 20 Lines	let Predicates = [IsLittleEndian, HasP9Vector] in {

// Unsigned int in vsx register -> QP		// Unsigned int in vsx register -> QP
def : Pat<(f128 (uint_to_fp (i32 (PPCmfvsr f64:$src)))),		def : Pat<(f128 (uint_to_fp (i32 (PPCmfvsr f64:$src)))),
(f128 (XSCVUDQP		(f128 (XSCVUDQP
(XXEXTRACTUW (SUBREG_TO_REG (i64 1), $src, sub_64), 8)))>;		(XXEXTRACTUW (SUBREG_TO_REG (i64 1), $src, sub_64), 8)))>;
} // IsLittleEndian, HasP9Vector		} // IsLittleEndian, HasP9Vector

// Convert (Un)Signed DWord in memory -> QP		// Convert (Un)Signed DWord in memory -> QP
def : Pat<(f128 (sint_to_fp (i64 (load xaddr:$src)))),		def : Pat<(f128 (sint_to_fp (i64 (load xaddrX4:$src)))),
(f128 (XSCVSDQP (LXSDX xaddr:$src)))>;		(f128 (XSCVSDQP (LXSDX xaddrX4:$src)))>;
def : Pat<(f128 (sint_to_fp (i64 (load ixaddr:$src)))),		def : Pat<(f128 (sint_to_fp (i64 (load ixaddr:$src)))),
(f128 (XSCVSDQP (LXSD ixaddr:$src)))>;		(f128 (XSCVSDQP (LXSD ixaddr:$src)))>;
def : Pat<(f128 (uint_to_fp (i64 (load xaddr:$src)))),		def : Pat<(f128 (uint_to_fp (i64 (load xaddrX4:$src)))),
(f128 (XSCVUDQP (LXSDX xaddr:$src)))>;		(f128 (XSCVUDQP (LXSDX xaddrX4:$src)))>;
def : Pat<(f128 (uint_to_fp (i64 (load ixaddr:$src)))),		def : Pat<(f128 (uint_to_fp (i64 (load ixaddr:$src)))),
(f128 (XSCVUDQP (LXSD ixaddr:$src)))>;		(f128 (XSCVUDQP (LXSD ixaddr:$src)))>;

// Convert Unsigned HWord in memory -> QP		// Convert Unsigned HWord in memory -> QP
def : Pat<(f128 (uint_to_fp ScalarLoads.ZELi16)),		def : Pat<(f128 (uint_to_fp ScalarLoads.ZELi16)),
(f128 (XSCVUDQP (LXSIHZX xaddr:$src)))>;		(f128 (XSCVUDQP (LXSIHZX xaddr:$src)))>;

// Convert Unsigned Byte in memory -> QP		// Convert Unsigned Byte in memory -> QP
def : Pat<(f128 (uint_to_fp ScalarLoads.ZELi8)),		def : Pat<(f128 (uint_to_fp ScalarLoads.ZELi8)),
(f128 (XSCVUDQP (LXSIBZX xoaddr:$src)))>;		(f128 (XSCVUDQP (LXSIBZX xoaddr:$src)))>;

// Truncate & Convert QP -> (Un)Signed (D)Word.		// Truncate & Convert QP -> (Un)Signed (D)Word.
def : Pat<(i64 (fp_to_sint f128:$src)), (i64 (MFVRD (XSCVQPSDZ $src)))>;		def : Pat<(i64 (fp_to_sint f128:$src)), (i64 (MFVRD (XSCVQPSDZ $src)))>;
def : Pat<(i64 (fp_to_uint f128:$src)), (i64 (MFVRD (XSCVQPUDZ $src)))>;		def : Pat<(i64 (fp_to_uint f128:$src)), (i64 (MFVRD (XSCVQPUDZ $src)))>;
def : Pat<(i32 (fp_to_sint f128:$src)),		def : Pat<(i32 (fp_to_sint f128:$src)),
(i32 (MFVSRWZ (COPY_TO_REGCLASS (XSCVQPSWZ $src), VFRC)))>;		(i32 (MFVSRWZ (COPY_TO_REGCLASS (XSCVQPSWZ $src), VFRC)))>;
def : Pat<(i32 (fp_to_uint f128:$src)),		def : Pat<(i32 (fp_to_uint f128:$src)),
(i32 (MFVSRWZ (COPY_TO_REGCLASS (XSCVQPUWZ $src), VFRC)))>;		(i32 (MFVSRWZ (COPY_TO_REGCLASS (XSCVQPUWZ $src), VFRC)))>;

// Instructions for store(fptosi).		// Instructions for store(fptosi).
// The 8-byte version is repeated here due to availability of D-Form STXSD.		// The 8-byte version is repeated here due to availability of D-Form STXSD.
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_sint_in_vsr f128:$src)), xaddr:$dst, 8),		(f64 (PPCcv_fp_to_sint_in_vsr f128:$src)), xaddrX4:$dst, 8),
(STXSDX (COPY_TO_REGCLASS (XSCVQPSDZ f128:$src), VFRC),		(STXSDX (COPY_TO_REGCLASS (XSCVQPSDZ f128:$src), VFRC),
xaddr:$dst)>;		xaddrX4:$dst)>;
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_sint_in_vsr f128:$src)), ixaddr:$dst, 8),		(f64 (PPCcv_fp_to_sint_in_vsr f128:$src)), ixaddr:$dst, 8),
(STXSD (COPY_TO_REGCLASS (XSCVQPSDZ f128:$src), VFRC),		(STXSD (COPY_TO_REGCLASS (XSCVQPSDZ f128:$src), VFRC),
ixaddr:$dst)>;		ixaddr:$dst)>;
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_sint_in_vsr f128:$src)), xoaddr:$dst, 4),		(f64 (PPCcv_fp_to_sint_in_vsr f128:$src)), xoaddr:$dst, 4),
(STXSIWX (COPY_TO_REGCLASS (XSCVQPSWZ $src), VFRC), xoaddr:$dst)>;		(STXSIWX (COPY_TO_REGCLASS (XSCVQPSWZ $src), VFRC), xoaddr:$dst)>;
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_sint_in_vsr f128:$src)), xoaddr:$dst, 2),		(f64 (PPCcv_fp_to_sint_in_vsr f128:$src)), xoaddr:$dst, 2),
(STXSIHX (COPY_TO_REGCLASS (XSCVQPSWZ $src), VFRC), xoaddr:$dst)>;		(STXSIHX (COPY_TO_REGCLASS (XSCVQPSWZ $src), VFRC), xoaddr:$dst)>;
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_sint_in_vsr f128:$src)), xoaddr:$dst, 1),		(f64 (PPCcv_fp_to_sint_in_vsr f128:$src)), xoaddr:$dst, 1),
(STXSIBX (COPY_TO_REGCLASS (XSCVQPSWZ $src), VFRC), xoaddr:$dst)>;		(STXSIBX (COPY_TO_REGCLASS (XSCVQPSWZ $src), VFRC), xoaddr:$dst)>;
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_sint_in_vsr f64:$src)), xaddr:$dst, 8),		(f64 (PPCcv_fp_to_sint_in_vsr f64:$src)), xaddrX4:$dst, 8),
(STXSDX (XSCVDPSXDS f64:$src), xaddr:$dst)>;		(STXSDX (XSCVDPSXDS f64:$src), xaddrX4:$dst)>;
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_sint_in_vsr f64:$src)), ixaddr:$dst, 8),		(f64 (PPCcv_fp_to_sint_in_vsr f64:$src)), ixaddr:$dst, 8),
(STXSD (XSCVDPSXDS f64:$src), ixaddr:$dst)>;		(STXSD (XSCVDPSXDS f64:$src), ixaddr:$dst)>;
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_sint_in_vsr f64:$src)), xoaddr:$dst, 2),		(f64 (PPCcv_fp_to_sint_in_vsr f64:$src)), xoaddr:$dst, 2),
(STXSIHX (XSCVDPSXWS f64:$src), xoaddr:$dst)>;		(STXSIHX (XSCVDPSXWS f64:$src), xoaddr:$dst)>;
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_sint_in_vsr f64:$src)), xoaddr:$dst, 1),		(f64 (PPCcv_fp_to_sint_in_vsr f64:$src)), xoaddr:$dst, 1),
(STXSIBX (XSCVDPSXWS f64:$src), xoaddr:$dst)>;		(STXSIBX (XSCVDPSXWS f64:$src), xoaddr:$dst)>;

// Instructions for store(fptoui).		// Instructions for store(fptoui).
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_uint_in_vsr f128:$src)), xaddr:$dst, 8),		(f64 (PPCcv_fp_to_uint_in_vsr f128:$src)), xaddrX4:$dst, 8),
(STXSDX (COPY_TO_REGCLASS (XSCVQPUDZ f128:$src), VFRC),		(STXSDX (COPY_TO_REGCLASS (XSCVQPUDZ f128:$src), VFRC),
xaddr:$dst)>;		xaddrX4:$dst)>;
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_uint_in_vsr f128:$src)), ixaddr:$dst, 8),		(f64 (PPCcv_fp_to_uint_in_vsr f128:$src)), ixaddr:$dst, 8),
(STXSD (COPY_TO_REGCLASS (XSCVQPUDZ f128:$src), VFRC),		(STXSD (COPY_TO_REGCLASS (XSCVQPUDZ f128:$src), VFRC),
ixaddr:$dst)>;		ixaddr:$dst)>;
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_uint_in_vsr f128:$src)), xoaddr:$dst, 4),		(f64 (PPCcv_fp_to_uint_in_vsr f128:$src)), xoaddr:$dst, 4),
(STXSIWX (COPY_TO_REGCLASS (XSCVQPUWZ $src), VFRC), xoaddr:$dst)>;		(STXSIWX (COPY_TO_REGCLASS (XSCVQPUWZ $src), VFRC), xoaddr:$dst)>;
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_uint_in_vsr f128:$src)), xoaddr:$dst, 2),		(f64 (PPCcv_fp_to_uint_in_vsr f128:$src)), xoaddr:$dst, 2),
(STXSIHX (COPY_TO_REGCLASS (XSCVQPUWZ $src), VFRC), xoaddr:$dst)>;		(STXSIHX (COPY_TO_REGCLASS (XSCVQPUWZ $src), VFRC), xoaddr:$dst)>;
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_uint_in_vsr f128:$src)), xoaddr:$dst, 1),		(f64 (PPCcv_fp_to_uint_in_vsr f128:$src)), xoaddr:$dst, 1),
(STXSIBX (COPY_TO_REGCLASS (XSCVQPUWZ $src), VFRC), xoaddr:$dst)>;		(STXSIBX (COPY_TO_REGCLASS (XSCVQPUWZ $src), VFRC), xoaddr:$dst)>;
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_uint_in_vsr f64:$src)), xaddr:$dst, 8),		(f64 (PPCcv_fp_to_uint_in_vsr f64:$src)), xaddrX4:$dst, 8),
(STXSDX (XSCVDPUXDS f64:$src), xaddr:$dst)>;		(STXSDX (XSCVDPUXDS f64:$src), xaddrX4:$dst)>;
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_uint_in_vsr f64:$src)), ixaddr:$dst, 8),		(f64 (PPCcv_fp_to_uint_in_vsr f64:$src)), ixaddr:$dst, 8),
(STXSD (XSCVDPUXDS f64:$src), ixaddr:$dst)>;		(STXSD (XSCVDPUXDS f64:$src), ixaddr:$dst)>;
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_uint_in_vsr f64:$src)), xoaddr:$dst, 2),		(f64 (PPCcv_fp_to_uint_in_vsr f64:$src)), xoaddr:$dst, 2),
(STXSIHX (XSCVDPUXWS f64:$src), xoaddr:$dst)>;		(STXSIHX (XSCVDPUXWS f64:$src), xoaddr:$dst)>;
def : Pat<(PPCstore_scal_int_from_vsr		def : Pat<(PPCstore_scal_int_from_vsr
(f64 (PPCcv_fp_to_uint_in_vsr f64:$src)), xoaddr:$dst, 1),		(f64 (PPCcv_fp_to_uint_in_vsr f64:$src)), xoaddr:$dst, 1),
▲ Show 20 Lines • Show All 590 Lines • Show Last 20 Lines

llvm/trunk/test/CodeGen/PowerPC/build-vector-tests.ll

	Show First 20 Lines • Show All 4,220 Lines • ▼ Show 20 Lines
	}			}

	; Function Attrs: norecurse nounwind readonly			; Function Attrs: norecurse nounwind readonly
	define <2 x i64> @fromDiffMemVarDll(i64* nocapture readonly %arr, i32 signext %elem) {			define <2 x i64> @fromDiffMemVarDll(i64* nocapture readonly %arr, i32 signext %elem) {
	; P9BE-LABEL: fromDiffMemVarDll:			; P9BE-LABEL: fromDiffMemVarDll:
	; P9BE: # %bb.0: # %entry			; P9BE: # %bb.0: # %entry
	; P9BE-NEXT: sldi r4, r4, 3			; P9BE-NEXT: sldi r4, r4, 3
	; P9BE-NEXT: add r3, r3, r4			; P9BE-NEXT: add r3, r3, r4
	; P9BE-NEXT: addi r3, r3, -8			; P9BE-NEXT: li r4, -8
	; P9BE-NEXT: lxvx v2, 0, r3			; P9BE-NEXT: lxvx v2, r3, r4
	; P9BE-NEXT: xxswapd v2, v2			; P9BE-NEXT: xxswapd v2, v2
	; P9BE-NEXT: blr			; P9BE-NEXT: blr
	;			;
	; P9LE-LABEL: fromDiffMemVarDll:			; P9LE-LABEL: fromDiffMemVarDll:
	; P9LE: # %bb.0: # %entry			; P9LE: # %bb.0: # %entry
	; P9LE-NEXT: sldi r4, r4, 3			; P9LE-NEXT: sldi r4, r4, 3
	; P9LE-NEXT: add r3, r3, r4			; P9LE-NEXT: add r3, r3, r4
	; P9LE-NEXT: addi r3, r3, -8			; P9LE-NEXT: li r4, -8
	; P9LE-NEXT: lxvx v2, 0, r3			; P9LE-NEXT: lxvx v2, r3, r4
	; P9LE-NEXT: xxswapd v2, v2			; P9LE-NEXT: xxswapd v2, v2
	; P9LE-NEXT: blr			; P9LE-NEXT: blr
	;			;
	; P8BE-LABEL: fromDiffMemVarDll:			; P8BE-LABEL: fromDiffMemVarDll:
	; P8BE: # %bb.0: # %entry			; P8BE: # %bb.0: # %entry
	; P8BE-NEXT: sldi r4, r4, 3			; P8BE-NEXT: sldi r4, r4, 3
	; P8BE-NEXT: add r3, r3, r4			; P8BE-NEXT: add r3, r3, r4
	; P8BE-NEXT: addi r3, r3, -8			; P8BE-NEXT: addi r3, r3, -8
	▲ Show 20 Lines • Show All 777 Lines • ▼ Show 20 Lines
	}			}

	; Function Attrs: norecurse nounwind readonly			; Function Attrs: norecurse nounwind readonly
	define <2 x i64> @fromDiffMemVarDConvdtoll(double* nocapture readonly %arr, i32 signext %elem) {			define <2 x i64> @fromDiffMemVarDConvdtoll(double* nocapture readonly %arr, i32 signext %elem) {
	; P9BE-LABEL: fromDiffMemVarDConvdtoll:			; P9BE-LABEL: fromDiffMemVarDConvdtoll:
	; P9BE: # %bb.0: # %entry			; P9BE: # %bb.0: # %entry
	; P9BE-NEXT: sldi r4, r4, 3			; P9BE-NEXT: sldi r4, r4, 3
	; P9BE-NEXT: add r3, r3, r4			; P9BE-NEXT: add r3, r3, r4
	; P9BE-NEXT: addi r3, r3, -8			; P9BE-NEXT: li r4, -8
	; P9BE-NEXT: lxvx vs0, 0, r3			; P9BE-NEXT: lxvx vs0, r3, r4
	; P9BE-NEXT: xxswapd vs0, vs0			; P9BE-NEXT: xxswapd vs0, vs0
	; P9BE-NEXT: xvcvdpsxds v2, vs0			; P9BE-NEXT: xvcvdpsxds v2, vs0
	; P9BE-NEXT: blr			; P9BE-NEXT: blr
	;			;
	; P9LE-LABEL: fromDiffMemVarDConvdtoll:			; P9LE-LABEL: fromDiffMemVarDConvdtoll:
	; P9LE: # %bb.0: # %entry			; P9LE: # %bb.0: # %entry
	; P9LE-NEXT: sldi r4, r4, 3			; P9LE-NEXT: sldi r4, r4, 3
	; P9LE-NEXT: add r3, r3, r4			; P9LE-NEXT: add r3, r3, r4
	; P9LE-NEXT: addi r3, r3, -8			; P9LE-NEXT: li r4, -8
	; P9LE-NEXT: lxvx vs0, 0, r3			; P9LE-NEXT: lxvx vs0, r3, r4
	; P9LE-NEXT: xxswapd vs0, vs0			; P9LE-NEXT: xxswapd vs0, vs0
	; P9LE-NEXT: xvcvdpsxds v2, vs0			; P9LE-NEXT: xvcvdpsxds v2, vs0
	; P9LE-NEXT: blr			; P9LE-NEXT: blr
	;			;
	; P8BE-LABEL: fromDiffMemVarDConvdtoll:			; P8BE-LABEL: fromDiffMemVarDConvdtoll:
	; P8BE: # %bb.0: # %entry			; P8BE: # %bb.0: # %entry
	; P8BE-NEXT: sldi r4, r4, 3			; P8BE-NEXT: sldi r4, r4, 3
	; P8BE-NEXT: add r3, r3, r4			; P8BE-NEXT: add r3, r3, r4
	▲ Show 20 Lines • Show All 415 Lines • ▼ Show 20 Lines
	}			}

	; Function Attrs: norecurse nounwind readonly			; Function Attrs: norecurse nounwind readonly
	define <2 x i64> @fromDiffMemVarDull(i64* nocapture readonly %arr, i32 signext %elem) {			define <2 x i64> @fromDiffMemVarDull(i64* nocapture readonly %arr, i32 signext %elem) {
	; P9BE-LABEL: fromDiffMemVarDull:			; P9BE-LABEL: fromDiffMemVarDull:
	; P9BE: # %bb.0: # %entry			; P9BE: # %bb.0: # %entry
	; P9BE-NEXT: sldi r4, r4, 3			; P9BE-NEXT: sldi r4, r4, 3
	; P9BE-NEXT: add r3, r3, r4			; P9BE-NEXT: add r3, r3, r4
	; P9BE-NEXT: addi r3, r3, -8			; P9BE-NEXT: li r4, -8
	; P9BE-NEXT: lxvx v2, 0, r3			; P9BE-NEXT: lxvx v2, r3, r4
	; P9BE-NEXT: xxswapd v2, v2			; P9BE-NEXT: xxswapd v2, v2
	; P9BE-NEXT: blr			; P9BE-NEXT: blr
	;			;
	; P9LE-LABEL: fromDiffMemVarDull:			; P9LE-LABEL: fromDiffMemVarDull:
	; P9LE: # %bb.0: # %entry			; P9LE: # %bb.0: # %entry
	; P9LE-NEXT: sldi r4, r4, 3			; P9LE-NEXT: sldi r4, r4, 3
	; P9LE-NEXT: add r3, r3, r4			; P9LE-NEXT: add r3, r3, r4
	; P9LE-NEXT: addi r3, r3, -8			; P9LE-NEXT: li r4, -8
	; P9LE-NEXT: lxvx v2, 0, r3			; P9LE-NEXT: lxvx v2, r3, r4
	; P9LE-NEXT: xxswapd v2, v2			; P9LE-NEXT: xxswapd v2, v2
	; P9LE-NEXT: blr			; P9LE-NEXT: blr
	;			;
	; P8BE-LABEL: fromDiffMemVarDull:			; P8BE-LABEL: fromDiffMemVarDull:
	; P8BE: # %bb.0: # %entry			; P8BE: # %bb.0: # %entry
	; P8BE-NEXT: sldi r4, r4, 3			; P8BE-NEXT: sldi r4, r4, 3
	; P8BE-NEXT: add r3, r3, r4			; P8BE-NEXT: add r3, r3, r4
	; P8BE-NEXT: addi r3, r3, -8			; P8BE-NEXT: addi r3, r3, -8
	▲ Show 20 Lines • Show All 777 Lines • ▼ Show 20 Lines
	}			}

	; Function Attrs: norecurse nounwind readonly			; Function Attrs: norecurse nounwind readonly
	define <2 x i64> @fromDiffMemVarDConvdtoull(double* nocapture readonly %arr, i32 signext %elem) {			define <2 x i64> @fromDiffMemVarDConvdtoull(double* nocapture readonly %arr, i32 signext %elem) {
	; P9BE-LABEL: fromDiffMemVarDConvdtoull:			; P9BE-LABEL: fromDiffMemVarDConvdtoull:
	; P9BE: # %bb.0: # %entry			; P9BE: # %bb.0: # %entry
	; P9BE-NEXT: sldi r4, r4, 3			; P9BE-NEXT: sldi r4, r4, 3
	; P9BE-NEXT: add r3, r3, r4			; P9BE-NEXT: add r3, r3, r4
	; P9BE-NEXT: addi r3, r3, -8			; P9BE-NEXT: li r4, -8
	; P9BE-NEXT: lxvx vs0, 0, r3			; P9BE-NEXT: lxvx vs0, r3, r4
	; P9BE-NEXT: xxswapd vs0, vs0			; P9BE-NEXT: xxswapd vs0, vs0
	; P9BE-NEXT: xvcvdpuxds v2, vs0			; P9BE-NEXT: xvcvdpuxds v2, vs0
	; P9BE-NEXT: blr			; P9BE-NEXT: blr
	;			;
	; P9LE-LABEL: fromDiffMemVarDConvdtoull:			; P9LE-LABEL: fromDiffMemVarDConvdtoull:
	; P9LE: # %bb.0: # %entry			; P9LE: # %bb.0: # %entry
	; P9LE-NEXT: sldi r4, r4, 3			; P9LE-NEXT: sldi r4, r4, 3
	; P9LE-NEXT: add r3, r3, r4			; P9LE-NEXT: add r3, r3, r4
	; P9LE-NEXT: addi r3, r3, -8			; P9LE-NEXT: li r4, -8
	; P9LE-NEXT: lxvx vs0, 0, r3			; P9LE-NEXT: lxvx vs0, r3, r4
	; P9LE-NEXT: xxswapd vs0, vs0			; P9LE-NEXT: xxswapd vs0, vs0
	; P9LE-NEXT: xvcvdpuxds v2, vs0			; P9LE-NEXT: xvcvdpuxds v2, vs0
	; P9LE-NEXT: blr			; P9LE-NEXT: blr
	;			;
	; P8BE-LABEL: fromDiffMemVarDConvdtoull:			; P8BE-LABEL: fromDiffMemVarDConvdtoull:
	; P8BE: # %bb.0: # %entry			; P8BE: # %bb.0: # %entry
	; P8BE-NEXT: sldi r4, r4, 3			; P8BE-NEXT: sldi r4, r4, 3
	; P8BE-NEXT: add r3, r3, r4			; P8BE-NEXT: add r3, r3, r4
	▲ Show 20 Lines • Show All 93 Lines • Show Last 20 Lines

llvm/trunk/test/CodeGen/PowerPC/unaligned-addressing-mode.ll

Show All 17 Lines	entry:
%1 = load i8, i8* %add.ptr, align 1		%1 = load i8, i8* %add.ptr, align 1
ret i8 %1		ret i8 %1
}		}

; ISEL matches address mode xaddrX4.		; ISEL matches address mode xaddrX4.
define i64 @test_xaddrX4(i8* %p) {		define i64 @test_xaddrX4(i8* %p) {
; CHECK-LABEL: test_xaddrX4:		; CHECK-LABEL: test_xaddrX4:
; CHECK: # %bb.0: # %entry		; CHECK: # %bb.0: # %entry
		; CHECK-NEXT: li r4, 3
; CHECK-NEXT: std r3, -8(r1)		; CHECK-NEXT: std r3, -8(r1)
; CHECK-NEXT: addi r3, r3, 3		; CHECK-NEXT: ldx r3, r3, r4
; CHECK-NEXT: ld r3, 0(r3)
; CHECK-NEXT: blr		; CHECK-NEXT: blr
entry:		entry:
%p.addr = alloca i8*, align 8		%p.addr = alloca i8*, align 8
store i8* %p, i8** %p.addr, align 8		store i8* %p, i8** %p.addr, align 8
%0 = load i8*, i8** %p.addr, align 8		%0 = load i8*, i8** %p.addr, align 8
%add.ptr = getelementptr inbounds i8, i8* %0, i64 3		%add.ptr = getelementptr inbounds i8, i8* %0, i64 3
%1 = bitcast i8* %add.ptr to i64*		%1 = bitcast i8* %add.ptr to i64*
%2 = load i64, i64* %1, align 8		%2 = load i64, i64* %1, align 8
ret i64 %2		ret i64 %2
}		}

; ISEL matches address mode xaddrX16.		; ISEL matches address mode xaddrX16.
define <2 x double> @test_xaddrX16(double* %arr) {		define <2 x double> @test_xaddrX16(double* %arr) {
; CHECK-LABEL: test_xaddrX16:		; CHECK-LABEL: test_xaddrX16:
; CHECK: # %bb.0: # %entry		; CHECK: # %bb.0: # %entry
; CHECK-NEXT: addi r3, r3, 40		; CHECK-NEXT: li r4, 40
; CHECK-NEXT: lxvx vs34, 0, r3		; CHECK-NEXT: lxvx vs34, r3, r4
; CHECK-NEXT: blr		; CHECK-NEXT: blr
entry:		entry:
%arrayidx1 = getelementptr inbounds double, double* %arr, i64 5		%arrayidx1 = getelementptr inbounds double, double* %arr, i64 5
%0 = bitcast double* %arrayidx1 to <2 x double>*		%0 = bitcast double* %arrayidx1 to <2 x double>*
%1 = load <2 x double>, <2 x double>* %0, align 16		%1 = load <2 x double>, <2 x double>* %0, align 16
ret <2 x double> %1		ret <2 x double> %1
}		}

Show All 20 Lines
; loop.		; loop.
define i64 @test_xaddrX4_loop(i8* %p) {		define i64 @test_xaddrX4_loop(i8* %p) {
; CHECK-LABEL: test_xaddrX4_loop:		; CHECK-LABEL: test_xaddrX4_loop:
; CHECK: # %bb.0: # %entry		; CHECK: # %bb.0: # %entry
; CHECK-NEXT: addi r4, r3, -8		; CHECK-NEXT: addi r4, r3, -8
; CHECK-NEXT: li r3, 8		; CHECK-NEXT: li r3, 8
; CHECK-NEXT: mtctr r3		; CHECK-NEXT: mtctr r3
; CHECK-NEXT: li r3, 0		; CHECK-NEXT: li r3, 0
; CHECK-NEXT: .p2align 5		; CHECK-NEXT: li r5, 3
		; The loop body shrinks from 5 instructions to 4, so its alignment changes from .p2align 5 to .p2align 4.
		; CHECK-NEXT: .p2align 4
; CHECK-NEXT: .LBB4_1: # %for.body		; CHECK-NEXT: .LBB4_1: # %for.body
; CHECK: ldu r5, 8(r4)		; CHECK: ldu r6, 8(r4)
; CHECK-NEXT: addi r6, r4, 3		; CHECK-NEXT: ldx r7, r4, r5
; CHECK-NEXT: ld r6, 0(r6)		; CHECK-NEXT: maddld r3, r7, r6, r3
; CHECK-NEXT: maddld r3, r6, r5, r3
; CHECK-NEXT: bdnz .LBB4_1		; CHECK-NEXT: bdnz .LBB4_1
; CHECK-NEXT: # %bb.2: # %for.end		; CHECK-NEXT: # %bb.2: # %for.end
; CHECK-NEXT: blr		; CHECK-NEXT: blr
entry:		entry:
br label %for.body		br label %for.body

for.body: ; preds = %for.body, %entry		for.body: ; preds = %for.body, %entry
%i.015 = phi i64 [ 0, %entry ], [ %inc, %for.body ]		%i.015 = phi i64 [ 0, %entry ], [ %inc, %for.body ]
Show All 18 Lines