Index: clang/include/clang/Driver/Options.td =================================================================== --- clang/include/clang/Driver/Options.td +++ clang/include/clang/Driver/Options.td @@ -3617,6 +3617,7 @@ Group; def mno_check_zero_division : Flag<["-"], "mno-check-zero-division">, Group; +def mfix4300 : Flag<["-"], "mfix4300">, Group; def mcompact_branches_EQ : Joined<["-"], "mcompact-branches=">, Group; def mbranch_likely : Flag<["-"], "mbranch-likely">, Group, Index: clang/lib/Driver/ToolChains/Clang.cpp =================================================================== --- clang/lib/Driver/ToolChains/Clang.cpp +++ clang/lib/Driver/ToolChains/Clang.cpp @@ -1929,6 +1929,11 @@ } } + if (Arg *A = Args.getLastArg(options::OPT_mfix4300)) { + CmdArgs.push_back("-mllvm"); + CmdArgs.push_back("-mfix4300"); + } + if (Arg *A = Args.getLastArg(options::OPT_G)) { StringRef v = A->getValue(); CmdArgs.push_back("-mllvm"); Index: llvm/lib/Target/Mips/CMakeLists.txt =================================================================== --- llvm/lib/Target/Mips/CMakeLists.txt +++ llvm/lib/Target/Mips/CMakeLists.txt @@ -59,6 +59,7 @@ MipsTargetMachine.cpp MipsTargetObjectFile.cpp MicroMipsSizeReduction.cpp + MipsMulMulBugPass.cpp LINK_COMPONENTS Analysis Index: llvm/lib/Target/Mips/Mips.h =================================================================== --- llvm/lib/Target/Mips/Mips.h +++ llvm/lib/Target/Mips/Mips.h @@ -38,6 +38,7 @@ FunctionPass *createMicroMipsSizeReducePass(); FunctionPass *createMipsExpandPseudoPass(); FunctionPass *createMipsPreLegalizeCombiner(); + FunctionPass *createMipsMulMulBugPass(); InstructionSelector *createMipsInstructionSelector(const MipsTargetMachine &, MipsSubtarget &, Index: llvm/lib/Target/Mips/MipsMulMulBugPass.cpp =================================================================== --- /dev/null +++ llvm/lib/Target/Mips/MipsMulMulBugPass.cpp @@ -0,0 +1,121 @@ +#include "Mips.h" +#include "MipsInstrInfo.h" +#include "MipsSubtarget.h" +#include "llvm/CodeGen/MachineBasicBlock.h" +#include "llvm/CodeGen/MachineFunction.h" +#include "llvm/CodeGen/MachineFunctionPass.h" +#include "llvm/Support/CommandLine.h" +#include "llvm/Support/Debug.h" +#include "llvm/Target/TargetMachine.h" + +#define DEBUG_TYPE "mips-r4300-mulmul-fix" + +using namespace llvm; + +static cl::opt + EnableMulMulFix("mfix4300", cl::init(false), + cl::desc("Enable the VR4300 mulmul bug fix."), cl::Hidden); + +class MipsMulMulBugFix : public MachineFunctionPass { +public: + MipsMulMulBugFix() : MachineFunctionPass(ID) {} + + StringRef getPassName() const override { return "Mips mulmul bugfix"; } + + MachineFunctionProperties getRequiredProperties() const override { + return MachineFunctionProperties().set( + MachineFunctionProperties::Property::NoVRegs); + } + + bool runOnMachineFunction(MachineFunction &MF) override; + bool FixMulMulBB(MachineBasicBlock &MBB); + + static char ID; + +private: + static const MipsInstrInfo *MipsII; + const MipsSubtarget *Subtarget; +}; + +char MipsMulMulBugFix::ID = 0; +const MipsInstrInfo *MipsMulMulBugFix::MipsII; + +bool MipsMulMulBugFix::runOnMachineFunction(MachineFunction &MF) { + + if (!EnableMulMulFix) + return false; + + Subtarget = &static_cast(MF.getSubtarget()); + MipsII = static_cast(Subtarget->getInstrInfo()); + + bool Modified = false; + MachineFunction::iterator I = MF.begin(), E = MF.end(); + + for (; I != E; ++I) + Modified |= FixMulMulBB(*I); + + return Modified; +} + +static bool isFirstMul(const MachineInstr *MI) { + switch (MI->getOpcode()) { + case Mips::MUL: + case Mips::FMUL_S: + case Mips::FMUL_D: + case Mips::FMUL_D32: + case Mips::FMUL_D64: + return true; + default: + return false; + } +} + +static bool isSecondMulOrBranch(const MachineInstr *MI) { + if (MI->isBranch() || MI->isIndirectBranch() || MI->isCall()) + return true; + + switch (MI->getOpcode()) { + case Mips::MUL: + case Mips::FMUL_S: + case Mips::FMUL_D: + case Mips::FMUL_D32: + case Mips::FMUL_D64: + case Mips::MULT: + case Mips::MULTu: + case Mips::DMULT: + case Mips::DMULTu: + return true; + default: + return false; + } +} + +bool MipsMulMulBugFix::FixMulMulBB(MachineBasicBlock &MBB) { + bool Modified = false; + MachineBasicBlock::instr_iterator MII = MBB.instr_begin(), + E = MBB.instr_end(); + MachineBasicBlock::instr_iterator NextMII; + + // Iterate through the instructions in the basic block + for (; MII != E; MII = NextMII) { + + NextMII = std::next(MII); + MachineInstr *MI = &*MII; + + // Trigger when the current instruction is a mul and the next instruction + // is either a mul or a branch in case the branch target start with a mul + if (NextMII != E && isFirstMul(MI) && isSecondMulOrBranch(&*NextMII)) { + LLVM_DEBUG(dbgs() << "Found mulmul!"); + + MachineBasicBlock &MBB = *MI->getParent(); + const MCInstrDesc &NewMCID = MipsII->get(Mips::NOP); + BuildMI(MBB, NextMII, DebugLoc(), NewMCID); + Modified = true; + } + } + + return Modified; +} + +/// createMipsMulMulBugPass - Returns a pass that fixes the mulmul bug +FunctionPass *llvm::createMipsMulMulBugPass() { return new MipsMulMulBugFix(); } Index: llvm/lib/Target/Mips/MipsTargetMachine.cpp =================================================================== --- llvm/lib/Target/Mips/MipsTargetMachine.cpp +++ llvm/lib/Target/Mips/MipsTargetMachine.cpp @@ -292,6 +292,10 @@ // instructions which can be remapped to a 16 bit instruction. addPass(createMicroMipsSizeReducePass()); + // This pass inserts a nop instruction between two back-to-back multiplication + // instructions when the "mfix4300" flag is passed. + addPass(createMipsMulMulBugPass()); + // The delay slot filler pass can potientially create forbidden slot hazards // for MIPSR6 and therefore it should go before MipsBranchExpansion pass. addPass(createMipsDelaySlotFillerPass()); Index: llvm/test/CodeGen/Mips/vr4300mulmul/mulbranch.ll =================================================================== --- /dev/null +++ llvm/test/CodeGen/Mips/vr4300mulmul/mulbranch.ll @@ -0,0 +1,12 @@ +; RUN: llc -march=mips -mfix4300 -verify-machineinstrs < %s | FileCheck %s + +; Function Attrs: nounwind +define dso_local i32 @my_func(i32 signext %a) local_unnamed_addr #0 { +; CHECK: mul +; CHECK-NEXT: nop + %mul = mul nsw i32 %a, %a + %call = tail call i32 @foo(i32 signext %mul) #2 + ret i32 %call +} + +declare dso_local i32 @foo(i32 signext) local_unnamed_addr #1 Index: llvm/test/CodeGen/Mips/vr4300mulmul/mulmul.ll =================================================================== --- /dev/null +++ llvm/test/CodeGen/Mips/vr4300mulmul/mulmul.ll @@ -0,0 +1,12 @@ +; RUN: llc -march=mips -mfix4300 -verify-machineinstrs < %s | FileCheck %s + +; Function Attrs: mustprogress nofree norecurse nosync nounwind readnone willreturn +define dso_local i32 @fun(i32 signext %x, i32 signext %y) local_unnamed_addr #0 { +; CHECK: mul +; CHECK-NEXT: nop +; CHECK-NEXT: mul + %mul = mul nsw i32 %x, %x + %mul1 = mul nsw i32 %y, %y + %add = add nuw nsw i32 %mul1, %mul + ret i32 %add +}