If the upper bits of the SHL result aren't used, we might be able to use a narrower shift. For example, on X86 this can turn a 64-bit shift into a 32-bit shift, enabling a smaller encoding.
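As a hedged illustration (not taken from the patch's tests; names are made up), this is the kind of pattern the combine targets: only the low 32 bits of the 64-bit shift survive the mask, so the shift only needs 32-bit arithmetic, which on x86 avoids the REX.W prefix:

define i64 @narrow_shl(i64 %x) {
  %shl = shl i64 %x, 3
  %low = and i64 %shl, 4294967295   ; upper 32 bits of the shift are unused
  ret i64 %low
}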
Event Timeline
llvm/test/CodeGen/X86/zext-logicop-shift-load.ll, line 25:
Are you looking at this as a followup?
llvm/lib/Target/AArch64/AArch64ISelLowering.cpp, lines 11041–11045:
It would be better to split this change off on its own while adding a test specifically for this pattern. IIUC, we can modify the existing test slightly and show the missing fold:

declare void @t()

define void @tbz_zext(i32 %in) {
  %shl = shl i32 %in, 3
  %t = zext i32 %shl to i64
  %and = and i64 %t, 32
  %cond = icmp eq i64 %and, 0
  br i1 %cond, label %then, label %end
then:
  call void @t()
  br label %end
end:
  ret void
}
Remove the AArch64 code change. Show the regression instead. I'll work on the separate patch and rebase accordingly depending on what order they get committed.
I think D60482 should go in 1st, so we avoid that known regression. There's still an open question about the x86 LEA matching. I've seen that or similar matching failures in other tests, so it would be nice to catch it first too.
I wonder if losing the wrapping flags is hurting, although we should be able to use known bits to restore that knowledge. Something like this?
define i64 @lea(i64 %t0, i32 %t1) {
  %t4 = add nuw nsw i32 %t1, 8
  %sh = shl nsw i32 %t4, 2
  %t5 = zext i32 %sh to i64
  %t6 = add i64 %t5, %t0
  ret i64 %t6
}
Produces:
leal 32(,%rsi,4), %eax
addq %rdi, %rax
Instead of:
leaq 32(%rdi,%rsi,4), %rax
For the LEA regression here, we need to teach foldMaskedShiftToScaledMask to look through the any_extend to find the shift and reinsert the any_extend in the new ordering.
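As a hedged illustration (not from the existing test file; function and value names are made up), the shape foldMaskedShiftToScaledMask has to handle after the narrowing roughly corresponds to IR where the extend sits between the mask and the shift, so the existing (and (shl X, C1), C2) -> (shl (and X, C2 >> C1), C1) reassociation no longer sees the shift directly:

define i64 @masked_scaled_index(i64 %base, i32 %i) {
  %shl = shl i32 %i, 2
  %ext = zext i32 %shl to i64           ; extend now separates the and from the shl
  %masked = and i64 %ext, 1020
  %addr = add i64 %base, %masked        ; shl 2 should become the *4 LEA scale
  ret i64 %addr
}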