Skip to content

Commit aab65b1

Browse files
committedNov 30, 2016
[AArch64] Fix useful bits detection for BFM instructions
Summary: When computing useful bits for a BFM instruction, we need to take into consideration the case where both operands of the BFM are equal and provide data that we need to track. Not doing this can cause us to miss useful bits. Fixes PR31138 (https://llvm.org/bugs/show_bug.cgi?id=31138) Reviewers: t.p.northover, jmolloy Subscribers: evandro, gberry, srhines, pirama, mcrosier, aemerson, llvm-commits, rengolin Differential Revision: https://reviews.llvm.org/D27130 llvm-svn: 288253
1 parent 2c6f75d commit aab65b1

File tree

2 files changed

+68
-9
lines changed

2 files changed

+68
-9
lines changed
 

‎llvm/lib/Target/AArch64/AArch64ISelDAGToDAG.cpp

+38-9
Original file line numberDiff line numberDiff line change
@@ -1875,23 +1875,52 @@ static void getUsefulBitsFromBFM(SDValue Op, SDValue Orig, APInt &UsefulBits,
18751875
uint64_t MSB =
18761876
cast<const ConstantSDNode>(Op.getOperand(3).getNode())->getZExtValue();
18771877

1878-
if (Op.getOperand(1) == Orig)
1879-
return getUsefulBitsFromBitfieldMoveOpd(Op, UsefulBits, Imm, MSB, Depth);
1880-
18811878
APInt OpUsefulBits(UsefulBits);
18821879
OpUsefulBits = 1;
18831880

1881+
APInt ResultUsefulBits(UsefulBits.getBitWidth(), 0);
1882+
ResultUsefulBits.flipAllBits();
1883+
APInt Mask(UsefulBits.getBitWidth(), 0);
1884+
1885+
getUsefulBits(Op, ResultUsefulBits, Depth + 1);
1886+
18841887
if (MSB >= Imm) {
1885-
OpUsefulBits = OpUsefulBits.shl(MSB - Imm + 1);
1888+
// The instruction is a BFXIL.
1889+
uint64_t Width = MSB - Imm + 1;
1890+
uint64_t LSB = Imm;
1891+
1892+
OpUsefulBits = OpUsefulBits.shl(Width);
18861893
--OpUsefulBits;
1887-
UsefulBits &= ~OpUsefulBits;
1888-
getUsefulBits(Op, UsefulBits, Depth + 1);
1894+
1895+
if (Op.getOperand(1) == Orig) {
1896+
// Copy the low bits from the result to bits starting from LSB.
1897+
Mask = ResultUsefulBits & OpUsefulBits;
1898+
Mask = Mask.shl(LSB);
1899+
}
1900+
1901+
if (Op.getOperand(0) == Orig)
1902+
// Bits starting from LSB in the input contribute to the result.
1903+
Mask |= (ResultUsefulBits & ~OpUsefulBits);
18891904
} else {
1890-
OpUsefulBits = OpUsefulBits.shl(MSB + 1);
1905+
// The instruction is a BFI.
1906+
uint64_t Width = MSB + 1;
1907+
uint64_t LSB = UsefulBits.getBitWidth() - Imm;
1908+
1909+
OpUsefulBits = OpUsefulBits.shl(Width);
18911910
--OpUsefulBits;
1892-
UsefulBits = ~(OpUsefulBits.shl(OpUsefulBits.getBitWidth() - Imm));
1893-
getUsefulBits(Op, UsefulBits, Depth + 1);
1911+
OpUsefulBits = OpUsefulBits.shl(LSB);
1912+
1913+
if (Op.getOperand(1) == Orig) {
1914+
// Copy the bits from the result to the zero bits.
1915+
Mask = ResultUsefulBits & OpUsefulBits;
1916+
Mask = Mask.lshr(LSB);
1917+
}
1918+
1919+
if (Op.getOperand(0) == Orig)
1920+
Mask |= (ResultUsefulBits & ~OpUsefulBits);
18941921
}
1922+
1923+
UsefulBits &= Mask;
18951924
}
18961925

18971926
static void getUsefulBitsForUse(SDNode *UserNode, APInt &UsefulBits,

‎llvm/test/CodeGen/AArch64/arm64-bitfield-extract.ll

+30
Original file line numberDiff line numberDiff line change
@@ -530,3 +530,33 @@ define i16 @test_ignored_rightbits(i32 %dst, i32 %in) {
530530

531531
ret i16 %conv19
532532
}
533+
534+
; The following test excercises the case where we have a BFI
535+
; instruction with the same input in both operands. We need to
536+
; track the useful bits through both operands.
537+
; CHECK-LABEL: sameOperandBFI
538+
; CHECK: lsr
539+
; CHECK: and
540+
; CHECK: bfi
541+
; CHECK: bfi
542+
define void @sameOperandBFI(i64 %src, i64 %src2, i16 *%ptr) {
543+
entry:
544+
%shr47 = lshr i64 %src, 47
545+
%src2.trunc = trunc i64 %src2 to i32
546+
br i1 undef, label %end, label %if.else
547+
548+
if.else:
549+
%and3 = and i32 %src2.trunc, 3
550+
%shl2 = shl nuw nsw i64 %shr47, 2
551+
%shl2.trunc = trunc i64 %shl2 to i32
552+
%and12 = and i32 %shl2.trunc, 12
553+
%BFISource = or i32 %and3, %and12 ; ...00000ABCD
554+
%BFIRHS = shl nuw nsw i32 %BFISource, 4 ; ...0ABCD0000
555+
%BFI = or i32 %BFIRHS, %BFISource ; ...0ABCDABCD
556+
%BFItrunc = trunc i32 %BFI to i16
557+
store i16 %BFItrunc, i16* %ptr, align 4
558+
br label %end
559+
560+
end:
561+
ret void
562+
}

0 commit comments

Comments
 (0)
Please sign in to comment.