Index: llvm/lib/Target/ARM/ARMBaseInstrInfo.cpp =================================================================== --- llvm/lib/Target/ARM/ARMBaseInstrInfo.cpp +++ llvm/lib/Target/ARM/ARMBaseInstrInfo.cpp @@ -3270,7 +3270,7 @@ } unsigned UseOpc = UseMI.getOpcode(); - unsigned NewUseOpc = 0; + unsigned NewUseOpc1 = 0, NewUseOpc2 = 0; uint32_t ImmVal = (uint32_t)DefMI.getOperand(1).getImm(); uint32_t SOImmValV1 = 0, SOImmValV2 = 0; bool Commute = false; @@ -3288,22 +3288,40 @@ switch (UseOpc) { default: break; case ARM::ADDrr: - case ARM::SUBrr: + case ARM::SUBrr: { if (UseOpc == ARM::SUBrr && Commute) return false; + bool IsSub = false; // ADD/SUB are special because they're essentially the same operation, so // we can handle a larger range of immediates. - if (ARM_AM::isSOImmTwoPartVal(ImmVal)) - NewUseOpc = UseOpc == ARM::ADDrr ? ARM::ADDri : ARM::SUBri; - else if (ARM_AM::isSOImmTwoPartVal(-ImmVal)) { + if (ARM_AM::isSOImmTwoPartVal(ImmVal)) { + NewUseOpc1 = UseOpc == ARM::ADDrr ? ARM::ADDri : ARM::SUBri; + NewUseOpc2 = UseOpc == ARM::ADDrr ? ARM::ADDri : ARM::SUBri; + } else if (ARM_AM::isSOImmTwoPartVal(-ImmVal)) { ImmVal = -ImmVal; - NewUseOpc = UseOpc == ARM::ADDrr ? ARM::SUBri : ARM::ADDri; - } else + NewUseOpc1 = UseOpc == ARM::ADDrr ? ARM::SUBri : ARM::ADDri; + NewUseOpc2 = UseOpc == ARM::ADDrr ? ARM::SUBri : ARM::ADDri; + } else if (ARM_AM::isSOImmTwoPartValSub(ImmVal, &SOImmValV2, + &SOImmValV1)) { + IsSub = true; + NewUseOpc1 = UseOpc == ARM::ADDrr ? ARM::ADDri : ARM::SUBri; + NewUseOpc2 = UseOpc == ARM::ADDrr ? ARM::SUBri : ARM::ADDri; + } else if (ARM_AM::isSOImmTwoPartValSub(-ImmVal, &SOImmValV2, + &SOImmValV1)) { + IsSub = true; + NewUseOpc1 = UseOpc == ARM::ADDrr ? ARM::SUBri : ARM::ADDri; + NewUseOpc2 = UseOpc == ARM::ADDrr ? ARM::ADDri : ARM::SUBri; + } else { return false; - SOImmValV1 = (uint32_t)ARM_AM::getSOImmTwoPartFirst(ImmVal); - SOImmValV2 = (uint32_t)ARM_AM::getSOImmTwoPartSecond(ImmVal); + } + + if (!IsSub) { + SOImmValV1 = (uint32_t)ARM_AM::getSOImmTwoPartFirst(ImmVal); + SOImmValV2 = (uint32_t)ARM_AM::getSOImmTwoPartSecond(ImmVal); + } break; + } case ARM::ORRrr: case ARM::EORrr: if (!ARM_AM::isSOImmTwoPartVal(ImmVal)) @@ -3312,8 +3330,8 @@ SOImmValV2 = (uint32_t)ARM_AM::getSOImmTwoPartSecond(ImmVal); switch (UseOpc) { default: break; - case ARM::ORRrr: NewUseOpc = ARM::ORRri; break; - case ARM::EORrr: NewUseOpc = ARM::EORri; break; + case ARM::ORRrr: NewUseOpc1 = NewUseOpc2 = ARM::ORRri; break; + case ARM::EORrr: NewUseOpc1 = NewUseOpc2 = ARM::EORri; break; } break; case ARM::t2ADDrr: @@ -3326,11 +3344,13 @@ const bool ToSP = DefMI.getOperand(0).getReg() == ARM::SP; const unsigned t2ADD = ToSP ? ARM::t2ADDspImm : ARM::t2ADDri; const unsigned t2SUB = ToSP ? ARM::t2SUBspImm : ARM::t2SUBri; - if (ARM_AM::isT2SOImmTwoPartVal(ImmVal)) - NewUseOpc = UseOpc == ARM::t2ADDrr ? t2ADD : t2SUB; - else if (ARM_AM::isT2SOImmTwoPartVal(-ImmVal)) { + if (ARM_AM::isT2SOImmTwoPartVal(ImmVal)) { + NewUseOpc1 = UseOpc == ARM::t2ADDrr ? t2ADD : t2SUB; + NewUseOpc2 = UseOpc == ARM::t2ADDrr ? t2ADD : t2SUB; + } else if (ARM_AM::isT2SOImmTwoPartVal(-ImmVal)) { ImmVal = -ImmVal; - NewUseOpc = UseOpc == ARM::t2ADDrr ? t2SUB : t2ADD; + NewUseOpc1 = UseOpc == ARM::t2ADDrr ? t2SUB : t2ADD; + NewUseOpc2 = UseOpc == ARM::t2ADDrr ? t2SUB : t2ADD; } else return false; SOImmValV1 = (uint32_t)ARM_AM::getT2SOImmTwoPartFirst(ImmVal); @@ -3345,8 +3365,8 @@ SOImmValV2 = (uint32_t)ARM_AM::getT2SOImmTwoPartSecond(ImmVal); switch (UseOpc) { default: break; - case ARM::t2ORRrr: NewUseOpc = ARM::t2ORRri; break; - case ARM::t2EORrr: NewUseOpc = ARM::t2EORri; break; + case ARM::t2ORRrr: NewUseOpc1 = NewUseOpc2 = ARM::t2ORRri; break; + case ARM::t2EORrr: NewUseOpc1 = NewUseOpc2 = ARM::t2EORri; break; } break; } @@ -3358,13 +3378,13 @@ bool isKill = UseMI.getOperand(OpIdx).isKill(); const TargetRegisterClass *TRC = MRI->getRegClass(Reg); Register NewReg = MRI->createVirtualRegister(TRC); - BuildMI(*UseMI.getParent(), UseMI, UseMI.getDebugLoc(), get(NewUseOpc), + BuildMI(*UseMI.getParent(), UseMI, UseMI.getDebugLoc(), get(NewUseOpc1), NewReg) .addReg(Reg1, getKillRegState(isKill)) .addImm(SOImmValV1) .add(predOps(ARMCC::AL)) .add(condCodeOp()); - UseMI.setDesc(get(NewUseOpc)); + UseMI.setDesc(get(NewUseOpc2)); UseMI.getOperand(1).setReg(NewReg); UseMI.getOperand(1).setIsKill(); UseMI.getOperand(2).ChangeToImmediate(SOImmValV2); @@ -3374,11 +3394,12 @@ // Then the below code will not be needed, as the input/output register // classes will be rgpr or gprSP. // For now, we fix the UseMI operand explicitly here: - switch(NewUseOpc){ + switch(NewUseOpc1){ case ARM::t2ADDspImm: case ARM::t2SUBspImm: case ARM::t2ADDri: case ARM::t2SUBri: + assert(NewUseOpc1 == NewUseOpc2); MRI->setRegClass(UseMI.getOperand(0).getReg(), TRC); } return true; @@ -5501,6 +5522,8 @@ return ForCodesize ? 4 : 1; if (ARM_AM::isSOImmTwoPartVal(Val)) // two instrs return ForCodesize ? 8 : 2; + if (ARM_AM::isSOImmTwoPartValSub(Val)) // two instrs + return ForCodesize ? 8 : 2; } if (Subtarget->useMovt()) // MOVW + MOVT return ForCodesize ? 8 : 2; Index: llvm/lib/Target/ARM/ARMExpandPseudoInsts.cpp =================================================================== --- llvm/lib/Target/ARM/ARMExpandPseudoInsts.cpp +++ llvm/lib/Target/ARM/ARMExpandPseudoInsts.cpp @@ -873,16 +873,28 @@ // FIXME Windows CE supports older ARM CPUs assert(!STI->isTargetWindows() && "Windows on ARM requires ARMv7+"); - // Expand into a movi + orr. - LO16 = BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::MOVi), DstReg); - HI16 = BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::ORRri)) - .addReg(DstReg, RegState::Define | getDeadRegState(DstIsDead)) - .addReg(DstReg); - assert (MO.isImm() && "MOVi32imm w/ non-immediate source operand!"); unsigned ImmVal = (unsigned)MO.getImm(); - unsigned SOImmValV1 = ARM_AM::getSOImmTwoPartFirst(ImmVal); - unsigned SOImmValV2 = ARM_AM::getSOImmTwoPartSecond(ImmVal); + unsigned SOImmValV1 = 0, SOImmValV2 = 0; + + if (ARM_AM::isSOImmTwoPartVal(ImmVal)) { + // Expand into a movi + orr. + LO16 = BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::MOVi), DstReg); + HI16 = BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::ORRri)) + .addReg(DstReg, RegState::Define | getDeadRegState(DstIsDead)) + .addReg(DstReg); + SOImmValV1 = ARM_AM::getSOImmTwoPartFirst(ImmVal); + SOImmValV2 = ARM_AM::getSOImmTwoPartSecond(ImmVal); + } else if (ARM_AM::isSOImmTwoPartValSub(ImmVal, &SOImmValV2, &SOImmValV1)) { + // Expand into a movi + subri. + LO16 = BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::MOVi), DstReg); + HI16 = BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::SUBri)) + .addReg(DstReg, RegState::Define | getDeadRegState(DstIsDead)) + .addReg(DstReg); + } else { + llvm_unreachable("unknown immediate type"); + } + unsigned MIFlags = MI.getFlags(); LO16 = LO16.addImm(SOImmValV1); HI16 = HI16.addImm(SOImmValV2); Index: llvm/lib/Target/ARM/ARMInstrInfo.td =================================================================== --- llvm/lib/Target/ARM/ARMInstrInfo.td +++ llvm/lib/Target/ARM/ARMInstrInfo.td @@ -812,7 +812,9 @@ def arm_i32imm : IntImmLeafuseMovt()) return true; - return ARM_AM::isSOImmTwoPartVal(Imm.getZExtValue()); + if (ARM_AM::isSOImmTwoPartVal(Imm.getZExtValue())) + return true; + return ARM_AM::isSOImmTwoPartValSub(Imm.getZExtValue()); }]>; /// imm0_1 predicate - Immediate in the range [0,1]. Index: llvm/lib/Target/ARM/MCTargetDesc/ARMAddressingModes.h =================================================================== --- llvm/lib/Target/ARM/MCTargetDesc/ARMAddressingModes.h +++ llvm/lib/Target/ARM/MCTargetDesc/ARMAddressingModes.h @@ -175,6 +175,35 @@ return rotl32(Arg, RotAmt) | ((RotAmt>>1) << 8); } + /// isSOImmTwoPartValSub - Return true if the specified value V can be + /// obtained by two SOImmVal's subtraction: V = Y - X. + inline bool isSOImmTwoPartValSub(unsigned V, unsigned *PX = nullptr, + unsigned *PY = nullptr) { + // If this can be handled with a single shifter_op, bail out. + if ((rotr32(~255U, getSOImmValRotate(V)) & V) == 0) + return false; + // Check if V can be obtained by Y-X, both Y and X are SOImmVal. + // Suppose V in the form of + // {leading 00, upper effective bits, lower 8 effective bits, trailing 00} + // The first step is calculating the top bit position of the lower 8 + // effective bits. + unsigned Bits = countTrailingZeros(V); + Bits += Bits & 1 ? 7 : 8; + // The second step is calculating X. + unsigned XMask = (1 << Bits) - 1; + unsigned X = (1 << Bits) - (V & XMask); + // The third step is calculating Y. + unsigned Y = V + X; + // Check if Y is SOImmVal. + if ((rotr32(~255U, getSOImmValRotate(Y)) & Y) != 0) + return false; + if (PX) + *PX = X; + if (PY) + *PY = Y; + return true; + } + /// isSOImmTwoPartVal - Return true if the specified value can be obtained by /// or'ing together two SOImmVal's. inline bool isSOImmTwoPartVal(unsigned V) { Index: llvm/test/CodeGen/ARM/sadd_sat.ll =================================================================== --- llvm/test/CodeGen/ARM/sadd_sat.ll +++ llvm/test/CodeGen/ARM/sadd_sat.ll @@ -276,14 +276,11 @@ ; CHECK-ARMNODPS-NEXT: orr r1, r1, #32512 ; CHECK-ARMNODPS-NEXT: cmp r0, r1 ; CHECK-ARMNODPS-NEXT: movlt r1, r0 -; CHECK-ARMNODPS-NEXT: ldr r0, .LCPI2_0 +; CHECK-ARMNODPS-NEXT: mov r0, #0 +; CHECK-ARMNODPS-NEXT: sub r0, r0, #32768 ; CHECK-ARMNODPS-NEXT: cmn r1, #32768 ; CHECK-ARMNODPS-NEXT: movgt r0, r1 ; CHECK-ARMNODPS-NEXT: bx lr -; CHECK-ARMNODPS-NEXT: .p2align 2 -; CHECK-ARMNODPS-NEXT: @ %bb.1: -; CHECK-ARMNODPS-NEXT: .LCPI2_0: -; CHECK-ARMNODPS-NEXT: .long 4294934528 @ 0xffff8000 ; ; CHECK-ARMBASEDSP-LABEL: func16: ; CHECK-ARMBASEDSP: @ %bb.0: Index: llvm/test/CodeGen/ARM/ssub_sat.ll =================================================================== --- llvm/test/CodeGen/ARM/ssub_sat.ll +++ llvm/test/CodeGen/ARM/ssub_sat.ll @@ -277,14 +277,11 @@ ; CHECK-ARMNODPS-NEXT: orr r1, r1, #32512 ; CHECK-ARMNODPS-NEXT: cmp r0, r1 ; CHECK-ARMNODPS-NEXT: movlt r1, r0 -; CHECK-ARMNODPS-NEXT: ldr r0, .LCPI2_0 +; CHECK-ARMNODPS-NEXT: mov r0, #0 +; CHECK-ARMNODPS-NEXT: sub r0, r0, #32768 ; CHECK-ARMNODPS-NEXT: cmn r1, #32768 ; CHECK-ARMNODPS-NEXT: movgt r0, r1 ; CHECK-ARMNODPS-NEXT: bx lr -; CHECK-ARMNODPS-NEXT: .p2align 2 -; CHECK-ARMNODPS-NEXT: @ %bb.1: -; CHECK-ARMNODPS-NEXT: .LCPI2_0: -; CHECK-ARMNODPS-NEXT: .long 4294934528 @ 0xffff8000 ; ; CHECK-ARMBASEDSP-LABEL: func16: ; CHECK-ARMBASEDSP: @ %bb.0: