diff --git a/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp b/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp --- a/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp +++ b/llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp @@ -1533,8 +1533,8 @@ APInt Ones = APInt::getAllOnes(BitWidth); Ones = Op0Opcode == ISD::SHL ? Ones.shl(ShiftAmt) : Ones.lshr(ShiftAmt); - if (C->getAPIntValue() == Ones) { - // If the xor constant is a shifted -1, do a 'not' before the + if ((DemandedBits & C->getAPIntValue()) == (DemandedBits & Ones)) { + // If the xor constant is a demanded mask, do a 'not' before the // shift: // xor (X << ShiftC), XorC --> (not X) << ShiftC // xor (X >> ShiftC), XorC --> (not X) >> ShiftC diff --git a/llvm/test/CodeGen/AArch64/optimize-imm.ll b/llvm/test/CodeGen/AArch64/optimize-imm.ll --- a/llvm/test/CodeGen/AArch64/optimize-imm.ll +++ b/llvm/test/CodeGen/AArch64/optimize-imm.ll @@ -56,13 +56,12 @@ } ; Make sure we don't shrink or optimize an XOR's immediate operand if the -; immediate is -1. Instruction selection turns (and ((xor $mask, -1), $v0)) into -; a BIC. +; immediate is -1. define i32 @xor1(i32 %a) { ; CHECK-LABEL: xor1: ; CHECK: // %bb.0: // %entry -; CHECK-NEXT: mov w8, #56 -; CHECK-NEXT: bic w0, w8, w0, lsl #3 +; CHECK-NEXT: mvn w8, w0 +; CHECK-NEXT: ubfiz w0, w8, #3, #3 ; CHECK-NEXT: ret entry: %shl = shl i32 %a, 3 diff --git a/llvm/test/CodeGen/AArch64/selectcc-to-shiftand.ll b/llvm/test/CodeGen/AArch64/selectcc-to-shiftand.ll --- a/llvm/test/CodeGen/AArch64/selectcc-to-shiftand.ll +++ b/llvm/test/CodeGen/AArch64/selectcc-to-shiftand.ll @@ -71,8 +71,9 @@ define i32 @pos_sel_special_constant(i32 %a) { ; CHECK-LABEL: pos_sel_special_constant: ; CHECK: // %bb.0: -; CHECK-NEXT: mov w8, #512 -; CHECK-NEXT: bic w0, w8, w0, lsr #22 +; CHECK-NEXT: mvn w8, w0 +; CHECK-NEXT: lsr w8, w8, #22 +; CHECK-NEXT: and w0, w8, #0x200 ; CHECK-NEXT: ret %tmp.1 = icmp sgt i32 %a, -1 %retval = select i1 %tmp.1, i32 512, i32 0 diff --git a/llvm/test/CodeGen/ARM/pr36577.ll b/llvm/test/CodeGen/ARM/pr36577.ll --- a/llvm/test/CodeGen/ARM/pr36577.ll +++ b/llvm/test/CodeGen/ARM/pr36577.ll @@ -15,8 +15,9 @@ ; CHECK-NEXT: mvn r1, #7 ; CHECK-NEXT: movt r0, :upper16:a ; CHECK-NEXT: ldrh r0, [r0] -; CHECK-NEXT: mvn r0, r0, lsr #7 -; CHECK-NEXT: orr r0, r1, r0, lsl #2 +; CHECK-NEXT: mvn r0, r0 +; CHECK-NEXT: orr r0, r1, r0, lsr #5 +; CHECK-NEXT: bic r0, r0, #3 ; CHECK-NEXT: bx lr ; ; CHECK-T2-LABEL: pr36577: @@ -25,8 +26,9 @@ ; CHECK-T2-NEXT: mvn r1, #7 ; CHECK-T2-NEXT: movt r0, :upper16:a ; CHECK-T2-NEXT: ldrh r0, [r0] -; CHECK-T2-NEXT: mvn.w r0, r0, lsr #7 -; CHECK-T2-NEXT: orr.w r0, r1, r0, lsl #2 +; CHECK-T2-NEXT: mvns r0, r0 +; CHECK-T2-NEXT: orr.w r0, r1, r0, lsr #5 +; CHECK-T2-NEXT: bic r0, r0, #3 ; CHECK-T2-NEXT: bx lr entry: %0 = load i16, i16* @a, align 2 diff --git a/llvm/test/CodeGen/Mips/bittest.ll b/llvm/test/CodeGen/Mips/bittest.ll --- a/llvm/test/CodeGen/Mips/bittest.ll +++ b/llvm/test/CodeGen/Mips/bittest.ll @@ -149,29 +149,27 @@ define signext i32 @bittest_16_i32(i32 signext %a) nounwind { ; MIPS-LABEL: bittest_16_i32: ; MIPS: # %bb.0: -; MIPS-NEXT: srl $1, $4, 16 -; MIPS-NEXT: not $1, $1 +; MIPS-NEXT: not $1, $4 +; MIPS-NEXT: srl $1, $1, 16 ; MIPS-NEXT: jr $ra ; MIPS-NEXT: andi $2, $1, 1 ; ; MIPS32R2-LABEL: bittest_16_i32: ; MIPS32R2: # %bb.0: -; MIPS32R2-NEXT: srl $1, $4, 16 -; MIPS32R2-NEXT: not $1, $1 +; MIPS32R2-NEXT: not $1, $4 ; MIPS32R2-NEXT: jr $ra -; MIPS32R2-NEXT: andi $2, $1, 1 +; MIPS32R2-NEXT: ext $2, $1, 16, 1 ; ; MIPS32R6-LABEL: bittest_16_i32: ; MIPS32R6: # %bb.0: -; MIPS32R6-NEXT: srl $1, $4, 16 -; MIPS32R6-NEXT: not $1, $1 +; MIPS32R6-NEXT: not $1, $4 ; MIPS32R6-NEXT: jr $ra -; MIPS32R6-NEXT: andi $2, $1, 1 +; MIPS32R6-NEXT: ext $2, $1, 16, 1 ; ; MIPS64-LABEL: bittest_16_i32: ; MIPS64: # %bb.0: -; MIPS64-NEXT: srl $1, $4, 16 -; MIPS64-NEXT: not $1, $1 +; MIPS64-NEXT: not $1, $4 +; MIPS64-NEXT: srl $1, $1, 16 ; MIPS64-NEXT: andi $1, $1, 1 ; MIPS64-NEXT: dsll $1, $1, 32 ; MIPS64-NEXT: jr $ra @@ -179,32 +177,28 @@ ; ; MIPS64R2-LABEL: bittest_16_i32: ; MIPS64R2: # %bb.0: -; MIPS64R2-NEXT: srl $1, $4, 16 -; MIPS64R2-NEXT: not $1, $1 -; MIPS64R2-NEXT: andi $1, $1, 1 +; MIPS64R2-NEXT: not $1, $4 +; MIPS64R2-NEXT: ext $1, $1, 16, 1 ; MIPS64R2-NEXT: jr $ra ; MIPS64R2-NEXT: dext $2, $1, 0, 32 ; ; MIPS64R6-LABEL: bittest_16_i32: ; MIPS64R6: # %bb.0: -; MIPS64R6-NEXT: srl $1, $4, 16 -; MIPS64R6-NEXT: not $1, $1 -; MIPS64R6-NEXT: andi $1, $1, 1 +; MIPS64R6-NEXT: not $1, $4 +; MIPS64R6-NEXT: ext $1, $1, 16, 1 ; MIPS64R6-NEXT: jr $ra ; MIPS64R6-NEXT: dext $2, $1, 0, 32 ; ; MM32R3-LABEL: bittest_16_i32: ; MM32R3: # %bb.0: -; MM32R3-NEXT: srl $2, $4, 16 -; MM32R3-NEXT: not16 $2, $2 -; MM32R3-NEXT: andi16 $2, $2, 1 -; MM32R3-NEXT: jrc $ra +; MM32R3-NEXT: not16 $2, $4 +; MM32R3-NEXT: jr $ra +; MM32R3-NEXT: ext $2, $2, 16, 1 ; ; MM32R6-LABEL: bittest_16_i32: ; MM32R6: # %bb.0: -; MM32R6-NEXT: srl $2, $4, 16 -; MM32R6-NEXT: not16 $2, $2 -; MM32R6-NEXT: andi16 $2, $2, 1 +; MM32R6-NEXT: not16 $2, $4 +; MM32R6-NEXT: ext $2, $2, 16, 1 ; MM32R6-NEXT: jrc $ra %shr = lshr i32 %a, 16 %not = xor i32 %shr, -1 @@ -399,65 +393,59 @@ define i64 @bittest_16_i64(i64 %a) nounwind { ; MIPS-LABEL: bittest_16_i64: ; MIPS: # %bb.0: -; MIPS-NEXT: srl $1, $5, 16 -; MIPS-NEXT: not $1, $1 +; MIPS-NEXT: not $1, $5 +; MIPS-NEXT: srl $1, $1, 16 ; MIPS-NEXT: andi $3, $1, 1 ; MIPS-NEXT: jr $ra ; MIPS-NEXT: addiu $2, $zero, 0 ; ; MIPS32R2-LABEL: bittest_16_i64: ; MIPS32R2: # %bb.0: -; MIPS32R2-NEXT: srl $1, $5, 16 -; MIPS32R2-NEXT: not $1, $1 -; MIPS32R2-NEXT: andi $3, $1, 1 +; MIPS32R2-NEXT: not $1, $5 +; MIPS32R2-NEXT: ext $3, $1, 16, 1 ; MIPS32R2-NEXT: jr $ra ; MIPS32R2-NEXT: addiu $2, $zero, 0 ; ; MIPS32R6-LABEL: bittest_16_i64: ; MIPS32R6: # %bb.0: -; MIPS32R6-NEXT: srl $1, $5, 16 -; MIPS32R6-NEXT: not $1, $1 -; MIPS32R6-NEXT: andi $3, $1, 1 +; MIPS32R6-NEXT: not $1, $5 +; MIPS32R6-NEXT: ext $3, $1, 16, 1 ; MIPS32R6-NEXT: jr $ra ; MIPS32R6-NEXT: addiu $2, $zero, 0 ; ; MIPS64-LABEL: bittest_16_i64: ; MIPS64: # %bb.0: -; MIPS64-NEXT: dsrl $1, $4, 16 -; MIPS64-NEXT: daddiu $2, $zero, -1 -; MIPS64-NEXT: xor $1, $1, $2 +; MIPS64-NEXT: daddiu $1, $zero, -1 +; MIPS64-NEXT: xor $1, $4, $1 +; MIPS64-NEXT: dsrl $1, $1, 16 ; MIPS64-NEXT: jr $ra ; MIPS64-NEXT: andi $2, $1, 1 ; ; MIPS64R2-LABEL: bittest_16_i64: ; MIPS64R2: # %bb.0: -; MIPS64R2-NEXT: dsrl $1, $4, 16 -; MIPS64R2-NEXT: daddiu $2, $zero, -1 -; MIPS64R2-NEXT: xor $1, $1, $2 +; MIPS64R2-NEXT: daddiu $1, $zero, -1 +; MIPS64R2-NEXT: xor $1, $4, $1 ; MIPS64R2-NEXT: jr $ra -; MIPS64R2-NEXT: andi $2, $1, 1 +; MIPS64R2-NEXT: dext $2, $1, 16, 1 ; ; MIPS64R6-LABEL: bittest_16_i64: ; MIPS64R6: # %bb.0: -; MIPS64R6-NEXT: dsrl $1, $4, 16 -; MIPS64R6-NEXT: daddiu $2, $zero, -1 -; MIPS64R6-NEXT: xor $1, $1, $2 +; MIPS64R6-NEXT: daddiu $1, $zero, -1 +; MIPS64R6-NEXT: xor $1, $4, $1 ; MIPS64R6-NEXT: jr $ra -; MIPS64R6-NEXT: andi $2, $1, 1 +; MIPS64R6-NEXT: dext $2, $1, 16, 1 ; ; MM32R3-LABEL: bittest_16_i64: ; MM32R3: # %bb.0: -; MM32R3-NEXT: srl $2, $5, 16 -; MM32R3-NEXT: not16 $2, $2 -; MM32R3-NEXT: andi16 $3, $2, 1 +; MM32R3-NEXT: not16 $2, $5 +; MM32R3-NEXT: ext $3, $2, 16, 1 ; MM32R3-NEXT: li16 $2, 0 ; MM32R3-NEXT: jrc $ra ; ; MM32R6-LABEL: bittest_16_i64: ; MM32R6: # %bb.0: -; MM32R6-NEXT: srl $2, $5, 16 -; MM32R6-NEXT: not16 $2, $2 -; MM32R6-NEXT: andi16 $3, $2, 1 +; MM32R6-NEXT: not16 $2, $5 +; MM32R6-NEXT: ext $3, $2, 16, 1 ; MM32R6-NEXT: li16 $2, 0 ; MM32R6-NEXT: jrc $ra %shr = lshr i64 %a, 16 @@ -490,27 +478,25 @@ ; ; MIPS64-LABEL: bittest_31_i64: ; MIPS64: # %bb.0: -; MIPS64-NEXT: dsrl $1, $4, 31 -; MIPS64-NEXT: daddiu $2, $zero, -1 -; MIPS64-NEXT: xor $1, $1, $2 +; MIPS64-NEXT: daddiu $1, $zero, -1 +; MIPS64-NEXT: xor $1, $4, $1 +; MIPS64-NEXT: dsrl $1, $1, 31 ; MIPS64-NEXT: jr $ra ; MIPS64-NEXT: andi $2, $1, 1 ; ; MIPS64R2-LABEL: bittest_31_i64: ; MIPS64R2: # %bb.0: -; MIPS64R2-NEXT: dsrl $1, $4, 31 -; MIPS64R2-NEXT: daddiu $2, $zero, -1 -; MIPS64R2-NEXT: xor $1, $1, $2 +; MIPS64R2-NEXT: daddiu $1, $zero, -1 +; MIPS64R2-NEXT: xor $1, $4, $1 ; MIPS64R2-NEXT: jr $ra -; MIPS64R2-NEXT: andi $2, $1, 1 +; MIPS64R2-NEXT: dext $2, $1, 31, 1 ; ; MIPS64R6-LABEL: bittest_31_i64: ; MIPS64R6: # %bb.0: -; MIPS64R6-NEXT: dsrl $1, $4, 31 -; MIPS64R6-NEXT: daddiu $2, $zero, -1 -; MIPS64R6-NEXT: xor $1, $1, $2 +; MIPS64R6-NEXT: daddiu $1, $zero, -1 +; MIPS64R6-NEXT: xor $1, $4, $1 ; MIPS64R6-NEXT: jr $ra -; MIPS64R6-NEXT: andi $2, $1, 1 +; MIPS64R6-NEXT: dext $2, $1, 31, 1 ; ; MM32R3-LABEL: bittest_31_i64: ; MM32R3: # %bb.0: @@ -555,27 +541,25 @@ ; ; MIPS64-LABEL: bittest_32_i64: ; MIPS64: # %bb.0: -; MIPS64-NEXT: dsrl $1, $4, 32 -; MIPS64-NEXT: daddiu $2, $zero, -1 -; MIPS64-NEXT: xor $1, $1, $2 +; MIPS64-NEXT: daddiu $1, $zero, -1 +; MIPS64-NEXT: xor $1, $4, $1 +; MIPS64-NEXT: dsrl $1, $1, 32 ; MIPS64-NEXT: jr $ra ; MIPS64-NEXT: andi $2, $1, 1 ; ; MIPS64R2-LABEL: bittest_32_i64: ; MIPS64R2: # %bb.0: -; MIPS64R2-NEXT: dsrl $1, $4, 32 -; MIPS64R2-NEXT: daddiu $2, $zero, -1 -; MIPS64R2-NEXT: xor $1, $1, $2 +; MIPS64R2-NEXT: daddiu $1, $zero, -1 +; MIPS64R2-NEXT: xor $1, $4, $1 ; MIPS64R2-NEXT: jr $ra -; MIPS64R2-NEXT: andi $2, $1, 1 +; MIPS64R2-NEXT: dextu $2, $1, 32, 1 ; ; MIPS64R6-LABEL: bittest_32_i64: ; MIPS64R6: # %bb.0: -; MIPS64R6-NEXT: dsrl $1, $4, 32 -; MIPS64R6-NEXT: daddiu $2, $zero, -1 -; MIPS64R6-NEXT: xor $1, $1, $2 +; MIPS64R6-NEXT: daddiu $1, $zero, -1 +; MIPS64R6-NEXT: xor $1, $4, $1 ; MIPS64R6-NEXT: jr $ra -; MIPS64R6-NEXT: andi $2, $1, 1 +; MIPS64R6-NEXT: dextu $2, $1, 32, 1 ; ; MM32R3-LABEL: bittest_32_i64: ; MM32R3: # %bb.0: diff --git a/llvm/test/CodeGen/RISCV/bittest.ll b/llvm/test/CodeGen/RISCV/bittest.ll --- a/llvm/test/CodeGen/RISCV/bittest.ll +++ b/llvm/test/CodeGen/RISCV/bittest.ll @@ -1,8 +1,8 @@ ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py ; RUN: llc -mtriple=riscv32 -verify-machineinstrs < %s \ -; RUN: | FileCheck %s -check-prefixes=CHECK,NOZBS,RV32,RV32I +; RUN: | FileCheck %s -check-prefixes=CHECK,RV32,RV32I ; RUN: llc -mtriple=riscv64 -verify-machineinstrs < %s \ -; RUN: | FileCheck %s -check-prefixes=CHECK,NOZBS,RV64,RV64I +; RUN: | FileCheck %s -check-prefixes=CHECK,RV64,RV64I ; RUN: llc -mtriple=riscv32 -mattr=+zbs -verify-machineinstrs < %s \ ; RUN: | FileCheck %s -check-prefixes=CHECK,ZBS,RV32,RV32ZBS ; RUN: llc -mtriple=riscv64 -mattr=+zbs -verify-machineinstrs < %s \ @@ -33,17 +33,24 @@ } define signext i32 @bittest_11_i32(i32 signext %a) nounwind { -; NOZBS-LABEL: bittest_11_i32: -; NOZBS: # %bb.0: -; NOZBS-NEXT: srli a0, a0, 11 -; NOZBS-NEXT: not a0, a0 -; NOZBS-NEXT: andi a0, a0, 1 -; NOZBS-NEXT: ret +; RV32I-LABEL: bittest_11_i32: +; RV32I: # %bb.0: +; RV32I-NEXT: not a0, a0 +; RV32I-NEXT: slli a0, a0, 20 +; RV32I-NEXT: srli a0, a0, 31 +; RV32I-NEXT: ret +; +; RV64I-LABEL: bittest_11_i32: +; RV64I: # %bb.0: +; RV64I-NEXT: not a0, a0 +; RV64I-NEXT: slli a0, a0, 52 +; RV64I-NEXT: srli a0, a0, 63 +; RV64I-NEXT: ret ; ; ZBS-LABEL: bittest_11_i32: ; ZBS: # %bb.0: +; ZBS-NEXT: not a0, a0 ; ZBS-NEXT: bexti a0, a0, 11 -; ZBS-NEXT: xori a0, a0, 1 ; ZBS-NEXT: ret %shr = lshr i32 %a, 11 %not = xor i32 %shr, -1 @@ -110,30 +117,30 @@ define i64 @bittest_11_i64(i64 %a) nounwind { ; RV32I-LABEL: bittest_11_i64: ; RV32I: # %bb.0: -; RV32I-NEXT: srli a0, a0, 11 ; RV32I-NEXT: not a0, a0 -; RV32I-NEXT: andi a0, a0, 1 +; RV32I-NEXT: slli a0, a0, 20 +; RV32I-NEXT: srli a0, a0, 31 ; RV32I-NEXT: li a1, 0 ; RV32I-NEXT: ret ; ; RV64I-LABEL: bittest_11_i64: ; RV64I: # %bb.0: -; RV64I-NEXT: srli a0, a0, 11 ; RV64I-NEXT: not a0, a0 -; RV64I-NEXT: andi a0, a0, 1 +; RV64I-NEXT: slli a0, a0, 52 +; RV64I-NEXT: srli a0, a0, 63 ; RV64I-NEXT: ret ; ; RV32ZBS-LABEL: bittest_11_i64: ; RV32ZBS: # %bb.0: +; RV32ZBS-NEXT: not a0, a0 ; RV32ZBS-NEXT: bexti a0, a0, 11 -; RV32ZBS-NEXT: xori a0, a0, 1 ; RV32ZBS-NEXT: li a1, 0 ; RV32ZBS-NEXT: ret ; ; RV64ZBS-LABEL: bittest_11_i64: ; RV64ZBS: # %bb.0: +; RV64ZBS-NEXT: not a0, a0 ; RV64ZBS-NEXT: bexti a0, a0, 11 -; RV64ZBS-NEXT: xori a0, a0, 1 ; RV64ZBS-NEXT: ret %shr = lshr i64 %a, 11 %not = xor i64 %shr, -1 @@ -149,18 +156,11 @@ ; RV32-NEXT: li a1, 0 ; RV32-NEXT: ret ; -; RV64I-LABEL: bittest_31_i64: -; RV64I: # %bb.0: -; RV64I-NEXT: srli a0, a0, 31 -; RV64I-NEXT: not a0, a0 -; RV64I-NEXT: andi a0, a0, 1 -; RV64I-NEXT: ret -; -; RV64ZBS-LABEL: bittest_31_i64: -; RV64ZBS: # %bb.0: -; RV64ZBS-NEXT: bexti a0, a0, 31 -; RV64ZBS-NEXT: xori a0, a0, 1 -; RV64ZBS-NEXT: ret +; RV64-LABEL: bittest_31_i64: +; RV64: # %bb.0: +; RV64-NEXT: not a0, a0 +; RV64-NEXT: srliw a0, a0, 31 +; RV64-NEXT: ret %shr = lshr i64 %a, 31 %not = xor i64 %shr, -1 %and = and i64 %not, 1 @@ -177,15 +177,15 @@ ; ; RV64I-LABEL: bittest_32_i64: ; RV64I: # %bb.0: -; RV64I-NEXT: srli a0, a0, 32 ; RV64I-NEXT: not a0, a0 -; RV64I-NEXT: andi a0, a0, 1 +; RV64I-NEXT: slli a0, a0, 31 +; RV64I-NEXT: srli a0, a0, 63 ; RV64I-NEXT: ret ; ; RV64ZBS-LABEL: bittest_32_i64: ; RV64ZBS: # %bb.0: +; RV64ZBS-NEXT: not a0, a0 ; RV64ZBS-NEXT: bexti a0, a0, 32 -; RV64ZBS-NEXT: xori a0, a0, 1 ; RV64ZBS-NEXT: ret %shr = lshr i64 %a, 32 %not = xor i64 %shr, -1 diff --git a/llvm/test/CodeGen/X86/speculative-load-hardening.ll b/llvm/test/CodeGen/X86/speculative-load-hardening.ll --- a/llvm/test/CodeGen/X86/speculative-load-hardening.ll +++ b/llvm/test/CodeGen/X86/speculative-load-hardening.ll @@ -911,8 +911,8 @@ ; X64-NEXT: cmpq $.Lslh_ret_addr23, %rcx ; X64-NEXT: cmovneq %r15, %rax ; X64-NEXT: movswl (%rbx), %edi -; X64-NEXT: shrl $7, %edi ; X64-NEXT: notl %edi +; X64-NEXT: shrl $7, %edi ; X64-NEXT: orl $-65536, %edi # imm = 0xFFFF0000 ; X64-NEXT: orl %eax, %edi ; X64-NEXT: shlq $47, %rax @@ -964,8 +964,8 @@ ; X64-LFENCE-NEXT: shll $7, %edi ; X64-LFENCE-NEXT: callq sink@PLT ; X64-LFENCE-NEXT: movswl (%rbx), %edi -; X64-LFENCE-NEXT: shrl $7, %edi ; X64-LFENCE-NEXT: notl %edi +; X64-LFENCE-NEXT: shrl $7, %edi ; X64-LFENCE-NEXT: orl $-65536, %edi # imm = 0xFFFF0000 ; X64-LFENCE-NEXT: callq sink@PLT ; X64-LFENCE-NEXT: movzwl (%rbx), %eax