diff --git a/llvm/lib/Target/PowerPC/PPCISelDAGToDAG.cpp b/llvm/lib/Target/PowerPC/PPCISelDAGToDAG.cpp --- a/llvm/lib/Target/PowerPC/PPCISelDAGToDAG.cpp +++ b/llvm/lib/Target/PowerPC/PPCISelDAGToDAG.cpp @@ -5066,37 +5066,53 @@ return; } case PPCISD::TOC_ENTRY: { - assert ((PPCSubTarget->isPPC64() || PPCSubTarget->isSVR4ABI()) && - "Only supported for 64-bit ABI and 32-bit SVR4"); - if (PPCSubTarget->isSVR4ABI() && !PPCSubTarget->isPPC64()) { - SDValue GA = N->getOperand(0); - SDNode *MN = CurDAG->getMachineNode(PPC::LWZtoc, dl, MVT::i32, GA, - N->getOperand(1)); - transferMemOperands(N, MN); - ReplaceNode(N, MN); - return; + bool isPPC64 = PPCSubTarget->isPPC64(); + bool isSVR4ABI = PPCSubTarget->isSVR4ABI(); + bool isAIXABI = PPCSubTarget->isAIXABI(); + + assert ((isPPC64 || isSVR4ABI || isAIXABI) && + "Only supported for 64-bit ABI, 32-bit SVR4 and AIX ABI"); + + CodeModel::Model CModel = TM.getCodeModel(); + if (!isPPC64 && ((isAIXABI && CModel == CodeModel::Small) || isSVR4ABI)) { + SDValue GA = N->getOperand(0); + SDNode *MN = CurDAG->getMachineNode(PPC::LWZtoc, dl, MVT::i32, GA, + N->getOperand(1)); + transferMemOperands(N, MN); + ReplaceNode(N, MN); + return; } // For medium and large code model, we generate two instructions as // described below. Otherwise we allow SelectCodeCommon to handle this, // selecting one of LDtoc, LDtocJTI, LDtocCPT, and LDtocBA. - CodeModel::Model CModel = TM.getCodeModel(); if (CModel != CodeModel::Medium && CModel != CodeModel::Large) break; + if (isAIXABI && CModel == CodeModel::Medium) + report_fatal_error("Medium code model is not supported on AIX."); + // The first source operand is a TargetGlobalAddress or a TargetJumpTable. // If it must be toc-referenced according to PPCSubTarget, we generate: + // [32 bit] + // LWZtocL(@sym, ADDIStocHA32(%r2, @sym)) + // [64 bit] // LDtocL(@sym, ADDIStocHA(%x2, @sym)) // Otherwise we generate: // ADDItocL(ADDIStocHA(%x2, @sym), @sym) SDValue GA = N->getOperand(0); SDValue TOCbase = N->getOperand(1); - SDNode *Tmp = CurDAG->getMachineNode(PPC::ADDIStocHA, dl, MVT::i64, - TOCbase, GA); + + EVT VT = isPPC64 ? MVT::i64 : MVT::i32; + SDNode *Tmp = CurDAG->getMachineNode((isPPC64) ? PPC::ADDIStocHA : + PPC::ADDIStocHA32, dl, VT, TOCbase, + GA); + if (PPCLowering->isAccessedAsGotIndirect(GA)) { - // If it is access as got-indirect, we need an extra LD to load - // the address. - SDNode *MN = CurDAG->getMachineNode(PPC::LDtocL, dl, MVT::i64, GA, + // If it is accessed as got-indirect, we need an extra LWZ/LD to load + // the address. + SDNode *MN = CurDAG->getMachineNode((isPPC64) ? PPC::LDtocL : + PPC::LWZtocL, dl, VT, GA, SDValue(Tmp, 0)); transferMemOperands(N, MN); ReplaceNode(N, MN); diff --git a/llvm/lib/Target/PowerPC/PPCISelLowering.cpp b/llvm/lib/Target/PowerPC/PPCISelLowering.cpp --- a/llvm/lib/Target/PowerPC/PPCISelLowering.cpp +++ b/llvm/lib/Target/PowerPC/PPCISelLowering.cpp @@ -2638,12 +2638,14 @@ setUsesTOCBasePtr(DAG.getMachineFunction()); } -static SDValue getTOCEntry(SelectionDAG &DAG, const SDLoc &dl, bool Is64Bit, - SDValue GA) { +static SDValue getTOCEntry(SelectionDAG &DAG, const SDLoc &dl, + const PPCSubtarget &Subtarget, SDValue GA) { + bool Is64Bit = Subtarget.isPPC64(); EVT VT = Is64Bit ? MVT::i64 : MVT::i32; - SDValue Reg = Is64Bit ? DAG.getRegister(PPC::X2, VT) : - DAG.getNode(PPCISD::GlobalBaseReg, dl, VT); - + SDValue Reg = Is64Bit ? DAG.getRegister(PPC::X2, VT) + : Subtarget.isAIXABI() + ? DAG.getRegister(PPC::R2, VT) + : DAG.getNode(PPCISD::GlobalBaseReg, dl, VT); SDValue Ops[] = { GA, Reg }; return DAG.getMemIntrinsicNode( PPCISD::TOC_ENTRY, dl, DAG.getVTList(VT, MVT::Other), Ops, VT, @@ -2662,7 +2664,7 @@ if (Subtarget.isSVR4ABI() && Subtarget.isPPC64()) { setUsesTOCBasePtr(DAG); SDValue GA = DAG.getTargetConstantPool(C, PtrVT, CP->getAlignment(), 0); - return getTOCEntry(DAG, SDLoc(CP), true, GA); + return getTOCEntry(DAG, SDLoc(CP), Subtarget, GA); } unsigned MOHiFlag, MOLoFlag; @@ -2672,7 +2674,7 @@ if (IsPIC && Subtarget.isSVR4ABI()) { SDValue GA = DAG.getTargetConstantPool(C, PtrVT, CP->getAlignment(), PPCII::MO_PIC_FLAG); - return getTOCEntry(DAG, SDLoc(CP), false, GA); + return getTOCEntry(DAG, SDLoc(CP), Subtarget, GA); } SDValue CPIHi = @@ -2738,7 +2740,7 @@ if (Subtarget.isSVR4ABI() && Subtarget.isPPC64()) { setUsesTOCBasePtr(DAG); SDValue GA = DAG.getTargetJumpTable(JT->getIndex(), PtrVT); - return getTOCEntry(DAG, SDLoc(JT), true, GA); + return getTOCEntry(DAG, SDLoc(JT), Subtarget, GA); } unsigned MOHiFlag, MOLoFlag; @@ -2748,7 +2750,7 @@ if (IsPIC && Subtarget.isSVR4ABI()) { SDValue GA = DAG.getTargetJumpTable(JT->getIndex(), PtrVT, PPCII::MO_PIC_FLAG); - return getTOCEntry(DAG, SDLoc(GA), false, GA); + return getTOCEntry(DAG, SDLoc(GA), Subtarget, GA); } SDValue JTIHi = DAG.getTargetJumpTable(JT->getIndex(), PtrVT, MOHiFlag); @@ -2769,7 +2771,7 @@ if (Subtarget.isPPC64()) setUsesTOCBasePtr(DAG); SDValue GA = DAG.getTargetBlockAddress(BA, PtrVT, BASDN->getOffset()); - return getTOCEntry(DAG, SDLoc(BASDN), Subtarget.isPPC64(), GA); + return getTOCEntry(DAG, SDLoc(BASDN), Subtarget, GA); } unsigned MOHiFlag, MOLoFlag; @@ -2884,12 +2886,12 @@ SDLoc DL(GSDN); const GlobalValue *GV = GSDN->getGlobal(); - // 64-bit SVR4 ABI code is always position-independent. + // 64-bit SVR4 ABI & AIX ABI code is always position-independent. // The actual address of the GlobalValue is stored in the TOC. - if (Subtarget.isSVR4ABI() && Subtarget.isPPC64()) { + if ((Subtarget.isSVR4ABI() && Subtarget.isPPC64()) || Subtarget.isAIXABI()) { setUsesTOCBasePtr(DAG); SDValue GA = DAG.getTargetGlobalAddress(GV, DL, PtrVT, GSDN->getOffset()); - return getTOCEntry(DAG, DL, true, GA); + return getTOCEntry(DAG, DL, Subtarget, GA); } unsigned MOHiFlag, MOLoFlag; @@ -2900,7 +2902,7 @@ SDValue GA = DAG.getTargetGlobalAddress(GV, DL, PtrVT, GSDN->getOffset(), PPCII::MO_PIC_FLAG); - return getTOCEntry(DAG, DL, false, GA); + return getTOCEntry(DAG, DL, Subtarget, GA); } SDValue GAHi = @@ -14302,11 +14304,17 @@ if (Subtarget.isSVR4ABI() && !Subtarget.isPPC64()) return true; + // AIX accesses everything indirectly through the TOC, which is similar to + // the GOT. + if (Subtarget.isAIXABI()) + return true; + CodeModel::Model CModel = getTargetMachine().getCodeModel(); // If it is small or large code model, module locals are accessed // indirectly by loading their address from .toc/.got. The difference - // is that for large code model we have ADDISTocHa + LDtocL and for - // small code model we simply have LDtoc. + // is that for large code model we have ADDISTocHa + LDtocL(64-bit)/ + // LWZtocL(32-bit) and for small code model we simply have LDtoc(64-bit)/ + // LWZtoc(32-bit). if (CModel == CodeModel::Small || CModel == CodeModel::Large) return true; diff --git a/llvm/lib/Target/PowerPC/PPCInstrInfo.td b/llvm/lib/Target/PowerPC/PPCInstrInfo.td --- a/llvm/lib/Target/PowerPC/PPCInstrInfo.td +++ b/llvm/lib/Target/PowerPC/PPCInstrInfo.td @@ -3166,6 +3166,15 @@ "#LWZtoc", [(set i32:$rD, (PPCtoc_entry tglobaladdr:$disp, i32:$reg))]>; +def LWZtocL : PPCEmitTimePseudo<(outs gprc:$rD), (ins tocentry32:$disp, gprc_nor0:$reg), + "#LWZtocL", + [(set i32:$rD, + (PPCtoc_entry tglobaladdr:$disp, i32:$reg))]>; +def ADDIStocHA32: PPCEmitTimePseudo<(outs gprc:$rD), (ins gprc:$reg, tocentry32:$disp), + "#ADDIStocHA32", + [(set i32:$rD, + (PPCtoc_entry i32:$reg, tglobaladdr:$disp))]>; + // Get Global (GOT) Base Register offset, from the word immediately preceding // the function label. def UpdateGBR : PPCEmitTimePseudo<(outs gprc:$rD, gprc:$rT), (ins gprc:$rI), "#UpdateGBR", []>; diff --git a/llvm/lib/Target/PowerPC/PPCTOCRegDeps.cpp b/llvm/lib/Target/PowerPC/PPCTOCRegDeps.cpp --- a/llvm/lib/Target/PowerPC/PPCTOCRegDeps.cpp +++ b/llvm/lib/Target/PowerPC/PPCTOCRegDeps.cpp @@ -95,7 +95,8 @@ protected: bool hasTOCLoReloc(const MachineInstr &MI) { if (MI.getOpcode() == PPC::LDtocL || - MI.getOpcode() == PPC::ADDItocL) + MI.getOpcode() == PPC::ADDItocL || + MI.getOpcode() == PPC::LWZtocL) return true; for (const MachineOperand &MO : MI.operands()) { @@ -106,14 +107,14 @@ return false; } - bool processBlock(MachineBasicBlock &MBB) { + bool processBlock(MachineBasicBlock &MBB, unsigned TOCReg) { bool Changed = false; for (auto &MI : MBB) { if (!hasTOCLoReloc(MI)) continue; - MI.addOperand(MachineOperand::CreateReg(PPC::X2, + MI.addOperand(MachineOperand::CreateReg(TOCReg, false /*IsDef*/, true /*IsImp*/)); Changed = true; @@ -128,7 +129,10 @@ for (MachineFunction::iterator I = MF.begin(); I != MF.end();) { MachineBasicBlock &B = *I++; - if (processBlock(B)) + // Only AIX might use R2. + bool Is64Bit = MF.getSubtarget().isPPC64(); + unsigned TOCReg = Is64Bit ? PPC::X2 : PPC::R2; + if (processBlock(B, TOCReg)) Changed = true; } diff --git a/llvm/lib/Target/PowerPC/PPCTargetMachine.cpp b/llvm/lib/Target/PowerPC/PPCTargetMachine.cpp --- a/llvm/lib/Target/PowerPC/PPCTargetMachine.cpp +++ b/llvm/lib/Target/PowerPC/PPCTargetMachine.cpp @@ -248,7 +248,7 @@ report_fatal_error("Target does not support the kernel CodeModel", false); return *CM; } - if (!TT.isOSDarwin() && !JIT && + if (!TT.isOSAIX() && !TT.isOSDarwin() && !JIT && (TT.getArch() == Triple::ppc64 || TT.getArch() == Triple::ppc64le)) return CodeModel::Medium; return CodeModel::Small; diff --git a/llvm/test/CodeGen/PowerPC/lower-globaladdr32-aix.ll b/llvm/test/CodeGen/PowerPC/lower-globaladdr32-aix.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/PowerPC/lower-globaladdr32-aix.ll @@ -0,0 +1,38 @@ +; RUN: llc -mtriple powerpc-ibm-aix-xcoff -code-model=small \ +; RUN: -stop-after=machine-cp -print-before=simple-register-coalescing 2>&1 < \ +; RUN: %s | FileCheck --check-prefix=SMALL %s + +; RUN: not llc -mtriple powerpc-ibm-aix-xcoff -code-model=medium \ +; RUN: -stop-after=machine-cp 2>&1 < %s | FileCheck --check-prefix=MEDIUM %s + +; RUN: llc -mtriple powerpc-ibm-aix-xcoff -code-model=large \ +; RUN: -stop-after=machine-cp -print-before=simple-register-coalescing 2>&1 < \ +; RUN: %s | FileCheck --check-prefix=LARGE %s + +; RUN: llc -mtriple powerpc-ibm-aix-xcoff -stop-after=machine-cp \ +; RUN: -print-before=simple-register-coalescing 2>&1 < %s | FileCheck \ +; RUN: --check-prefix=SMALL %s + +@msg = common global i8* null, align 4 +@ptr = common global i8* null, align 4 + +define void @foo() { +entry: +; SMALL: %0:gprc_and_gprc_nor0 = LWZtoc @msg, $r2 :: (load 4 from got) +; SMALL: %1:gprc = LWZ 0, %0:gprc_and_gprc_nor0 :: (dereferenceable load 4 from @msg) +; SMALL: %2:gprc_and_gprc_nor0 = LWZtoc @ptr, $r2 :: (load 4 from got) +; SMALL: STW %1:gprc, 0, %2:gprc_and_gprc_nor0 :: (store 4 into @ptr) + +; MEDIUM: Medium code model is not supported on AIX. + +; LARGE: %0:gprc_and_gprc_nor0 = ADDIStocHA32 $r2, @msg +; LARGE: %1:gprc_and_gprc_nor0 = LWZtocL @msg, %0:gprc_and_gprc_nor0, implicit $r2 :: (load 4 from got) +; LARGE: %2:gprc = LWZ 0, %1:gprc_and_gprc_nor0 :: (dereferenceable load 4 from @msg) +; LARGE: %3:gprc_and_gprc_nor0 = ADDIStocHA32 $r2, @ptr +; LARGE: %4:gprc_and_gprc_nor0 = LWZtocL @ptr, %3:gprc_and_gprc_nor0, implicit $r2 :: (load 4 from got) +; LARGE: STW %2:gprc, 0, %4:gprc_and_gprc_nor0 :: (store 4 into @ptr) + + %0 = load i8*, i8** @msg, align 4 + store i8* %0, i8** @ptr, align 4 + ret void +} diff --git a/llvm/test/CodeGen/PowerPC/lower-globaladdr64-aix.ll b/llvm/test/CodeGen/PowerPC/lower-globaladdr64-aix.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/PowerPC/lower-globaladdr64-aix.ll @@ -0,0 +1,38 @@ +; RUN: llc -mtriple powerpc64-ibm-aix-xcoff -code-model=small \ +; RUN: -stop-after=machine-cp -print-before=simple-register-coalescing 2>&1 < \ +; RUN: %s | FileCheck --check-prefix=SMALL %s + +; RUN: not llc -mtriple powerpc64-ibm-aix-xcoff -code-model=medium \ +; RUN: -stop-after=machine-cp 2>&1 < %s | FileCheck --check-prefix=MEDIUM %s + +; RUN: llc -mtriple powerpc64-ibm-aix-xcoff -code-model=large \ +; RUN: -stop-after=machine-cp -print-before=simple-register-coalescing 2>&1 < \ +; RUN: %s | FileCheck --check-prefix=LARGE %s + +; RUN: llc -mtriple powerpc64-ibm-aix-xcoff -stop-after=machine-cp \ +; RUN: -print-before=simple-register-coalescing 2>&1 < %s | FileCheck \ +; RUN: --check-prefix=SMALL %s + +@msg = common global i8* null, align 8 +@ptr = common global i8* null, align 8 + +define void @foo() { +entry: +; SMALL: %0:g8rc_and_g8rc_nox0 = LDtoc @msg, $x2 :: (load 8 from got) +; SMALL: %1:g8rc = LD 0, %0:g8rc_and_g8rc_nox0 :: (dereferenceable load 8 from @msg) +; SMALL: %2:g8rc_and_g8rc_nox0 = LDtoc @ptr, $x2 :: (load 8 from got) +; SMALL: STD %1:g8rc, 0, %2:g8rc_and_g8rc_nox0 :: (store 8 into @ptr) + +; MEDIUM: Medium code model is not supported on AIX. + +; LARGE: %0:g8rc_and_g8rc_nox0 = ADDIStocHA $x2, @msg +; LARGE: %1:g8rc_and_g8rc_nox0 = LDtocL @msg, %0:g8rc_and_g8rc_nox0, implicit $x2 :: (load 8 from got) +; LARGE: %2:g8rc = LD 0, %1:g8rc_and_g8rc_nox0 :: (dereferenceable load 8 from @msg) +; LARGE: %3:g8rc_and_g8rc_nox0 = ADDIStocHA $x2, @ptr +; LARGE: %4:g8rc_and_g8rc_nox0 = LDtocL @ptr, %3:g8rc_and_g8rc_nox0, implicit $x2 :: (load 8 from got) +; LARGE: STD %2:g8rc, 0, %4:g8rc_and_g8rc_nox0 :: (store 8 into @ptr) + + %0 = load i8*, i8** @msg, align 8 + store i8* %0, i8** @ptr, align 8 + ret void +}