diff --git a/llvm/lib/Target/AVR/AVRExpandPseudoInsts.cpp b/llvm/lib/Target/AVR/AVRExpandPseudoInsts.cpp --- a/llvm/lib/Target/AVR/AVRExpandPseudoInsts.cpp +++ b/llvm/lib/Target/AVR/AVRExpandPseudoInsts.cpp @@ -14,9 +14,11 @@ #include "AVR.h" #include "AVRInstrInfo.h" +#include "AVRMachineFunctionInfo.h" #include "AVRTargetMachine.h" #include "MCTargetDesc/AVRMCTargetDesc.h" +#include "llvm/CodeGen/MachineFunction.h" #include "llvm/CodeGen/MachineFunctionPass.h" #include "llvm/CodeGen/MachineInstrBuilder.h" #include "llvm/CodeGen/MachineRegisterInfo.h" @@ -57,8 +59,8 @@ /// The IO address of the status register. const unsigned SREG_ADDR = 0x3f; - bool expandMBB(Block &MBB); - bool expandMI(Block &MBB, BlockIt MBBI); + bool expandMBB(MachineFunction &MF, Block &MBB); + bool expandMI(MachineFunction &MF, Block &MBB, BlockIt MBBI); template bool expand(Block &MBB, BlockIt MBBI); MachineInstrBuilder buildMI(Block &MBB, BlockIt MBBI, unsigned Opcode) { @@ -108,13 +110,13 @@ char AVRExpandPseudo::ID = 0; -bool AVRExpandPseudo::expandMBB(MachineBasicBlock &MBB) { +bool AVRExpandPseudo::expandMBB(MachineFunction &MF, MachineBasicBlock &MBB) { bool Modified = false; BlockIt MBBI = MBB.begin(), E = MBB.end(); while (MBBI != E) { BlockIt NMBBI = std::next(MBBI); - Modified |= expandMI(MBB, MBBI); + Modified |= expandMI(MF, MBB, MBBI); MBBI = NMBBI; } @@ -139,7 +141,7 @@ do { assert(ExpandCount < 10 && "pseudo expand limit reached"); - bool BlockModified = expandMBB(MBB); + bool BlockModified = expandMBB(MF, MBB); Modified |= BlockModified; ExpandCount++; @@ -2103,10 +2105,21 @@ return true; } -bool AVRExpandPseudo::expandMI(Block &MBB, BlockIt MBBI) { +bool AVRExpandPseudo::expandMI(MachineFunction &MF, Block &MBB, BlockIt MBBI) { MachineInstr &MI = *MBBI; int Opcode = MBBI->getOpcode(); + if (Opcode == AVR::STDWSPQRr || Opcode == AVR::STDSPQRr) { + const AVRMachineFunctionInfo *AFI = MF.getInfo(); + Register FP = AFI->hasReservedCallFrame(MF) ? AVR::R29R28 : AVR::R31R30; + + Opcode = + (Opcode == AVR::STDWSPQRr) ? AVR::STDWPtrQRr : AVR::STDPtrQRr; + + MI.setDesc(TII->get(Opcode)); + MI.getOperand(0).setReg(FP); + } + #define EXPAND(Op) \ case Op: \ return expand(MBB, MI) diff --git a/llvm/lib/Target/AVR/AVRFrameLowering.cpp b/llvm/lib/Target/AVR/AVRFrameLowering.cpp --- a/llvm/lib/Target/AVR/AVRFrameLowering.cpp +++ b/llvm/lib/Target/AVR/AVRFrameLowering.cpp @@ -40,13 +40,7 @@ } bool AVRFrameLowering::hasReservedCallFrame(const MachineFunction &MF) const { - // Reserve call frame memory in function prologue under the following - // conditions: - // - Y pointer is reserved to be the frame pointer. - // - The function does not contain variable sized objects. - - const MachineFrameInfo &MFI = MF.getFrameInfo(); - return hasFP(MF) && !MFI.hasVarSizedObjects(); + return MF.getInfo()->hasReservedCallFrame(MF); } void AVRFrameLowering::emitPrologue(MachineFunction &MF, @@ -228,10 +222,7 @@ // Notice that strictly this is not a frame pointer because it contains SP after // frame allocation instead of having the original SP in function entry. bool AVRFrameLowering::hasFP(const MachineFunction &MF) const { - const AVRMachineFunctionInfo *FuncInfo = MF.getInfo(); - - return (FuncInfo->getHasSpills() || FuncInfo->getHasAllocas() || - FuncInfo->getHasStackArgs()); + return MF.getInfo()->hasFP(); } bool AVRFrameLowering::spillCalleeSavedRegisters( @@ -298,38 +289,6 @@ return true; } -/// Replace pseudo store instructions that pass arguments through the stack with -/// real instructions. -static void fixStackStores(MachineBasicBlock &MBB, - MachineBasicBlock::iterator MI, - const TargetInstrInfo &TII, Register FP) { - // Iterate through the BB until we hit a call instruction or we reach the end. - for (auto I = MI, E = MBB.end(); I != E && !I->isCall();) { - MachineBasicBlock::iterator NextMI = std::next(I); - MachineInstr &MI = *I; - unsigned Opcode = I->getOpcode(); - - // Only care of pseudo store instructions where SP is the base pointer. - if (Opcode != AVR::STDSPQRr && Opcode != AVR::STDWSPQRr) { - I = NextMI; - continue; - } - - assert(MI.getOperand(0).getReg() == AVR::SP && - "Invalid register, should be SP!"); - - // Replace this instruction with a regular store. Use Y as the base - // pointer since it is guaranteed to contain a copy of SP. - unsigned STOpc = - (Opcode == AVR::STDWSPQRr) ? AVR::STDWPtrQRr : AVR::STDPtrQRr; - - MI.setDesc(TII.get(STOpc)); - MI.getOperand(0).setReg(FP); - - I = NextMI; - } -} - MachineBasicBlock::iterator AVRFrameLowering::eliminateCallFramePseudoInstr( MachineFunction &MF, MachineBasicBlock &MBB, MachineBasicBlock::iterator MI) const { @@ -340,7 +299,6 @@ // function entry. Delete the call frame pseudo and replace all pseudo stores // with real store instructions. if (hasReservedCallFrame(MF)) { - fixStackStores(MBB, MI, TII, AVR::R29R28); return MBB.erase(MI); } @@ -368,10 +326,6 @@ BuildMI(MBB, MI, DL, TII.get(AVR::SPWRITE), AVR::SP) .addReg(AVR::R31R30); - - // Make sure the remaining stack stores are converted to real store - // instructions. - fixStackStores(MBB, MI, TII, AVR::R31R30); } else { assert(Opcode == TII.getCallFrameDestroyOpcode()); diff --git a/llvm/lib/Target/AVR/AVRMachineFunctionInfo.h b/llvm/lib/Target/AVR/AVRMachineFunctionInfo.h --- a/llvm/lib/Target/AVR/AVRMachineFunctionInfo.h +++ b/llvm/lib/Target/AVR/AVRMachineFunctionInfo.h @@ -13,6 +13,7 @@ #ifndef LLVM_AVR_MACHINE_FUNCTION_INFO_H #define LLVM_AVR_MACHINE_FUNCTION_INFO_H +#include "llvm/CodeGen/MachineFrameInfo.h" #include "llvm/CodeGen/MachineFunction.h" namespace llvm { @@ -79,6 +80,14 @@ int getVarArgsFrameIndex() const { return VarArgsFrameIndex; } void setVarArgsFrameIndex(int Idx) { VarArgsFrameIndex = Idx; } + + bool hasReservedCallFrame(const MachineFunction &MF) const { + return hasFP() && !MF.getFrameInfo().hasVarSizedObjects(); + } + + bool hasFP() const { + return (getHasSpills() || getHasAllocas() || getHasStackArgs()); + } }; } // end llvm namespace diff --git a/llvm/test/CodeGen/AVR/bug-2021-01-29-complex-frame-pointer-usage.ll b/llvm/test/CodeGen/AVR/bug-2021-01-29-complex-frame-pointer-usage.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/AVR/bug-2021-01-29-complex-frame-pointer-usage.ll @@ -0,0 +1,38 @@ +; RUN: llc < %s -march=avr -mcpu=atmega328 -filetype=obj -o /dev/null --print-options 2>&1 | FileCheck %s --check-prefix=CHECK-ERROR +; RUN: llc < %s -march=avr -mcpu=atmega328 -filetype=obj | llvm-objdump -S - | FileCheck %s --check-prefix=CHECK-OBJDUMP + +; This test verifies that the AVR backend can successfully lower code +; which is very register heavy, containing many references to the frame +; pointer. +; +; Before this bug was fixed, this testcase would fail with the message: +; +; LLVM ERROR: Not supported instr: > +; +; where XXX is the OpCode of either the STDWSPQRr instruction or the STDSPQRr instruction. +; +; The issue was that the ISel lowering pass would lower many stack slot stores to these +; instructions, but the frame pointer elimination code (that is designed to rewrite these two +; instructions to real instructions) was only designed to run for STDWSPQRr/STDSPQRr instructions +; that appeared in the basic blocks that contained the FrameSetup/FrameDestroy instructions. +; +; The bug was fixed by modifying the code so that it unconditionally runs on STDWSPQRr/STDSPQRr +; instructions and always expands them with the relevant STDWPtrQRr or STDPtrQRr instructions. +; +; This bug was originally discovered due to the Rust compiler_builtins library. Its 0.1.37 release +; contained a 128-bit software division/remainder routine that exercised this buggy branch in the code. + +; CHECK-ERROR-NOT: LLVM ERROR: Not supported instr + +declare { i128, i128 } @div_rem_u128(i128, i128) addrspace(1) + +; CHECK-OBJDUMP-LABEL: main +define i128 @main(i128 %a, i128 %b) addrspace(1) { +start: + %b_neg = icmp slt i128 %b, 0 + %divisor = select i1 %b_neg, i128 0, i128 %b + %result = tail call fastcc addrspace(1) { i128, i128 } @div_rem_u128(i128 undef, i128 %divisor) + + ; CHECK-OBJDUMP: ret + ret i128 0 +}