
[x86] use more shift or LEA for select-of-constants
ClosedPublic

Authored by spatel on Jul 12 2017, 5:10 PM.

Details

Summary

We can convert any select-of-constants to math ops:
http://rise4fun.com/Alive/d7d

For this patch, I'm proposing to enhance an existing x86 transform that uses fake multiplies (they always become shl/lea) to avoid cmov or branching. The current code misses cases where we have a negative constant and a positive constant, so this is just trying to plug that hole.

The DAGCombiner diff prevents us from hitting a terrible inefficiency: we can start with a select in IR, create a select DAG node, convert it into a sext, convert it back into a select, and then lower it to sext machine code.

Some notes about the test diffs:

  1. 2010-08-04-MaskedSignedCompare.ll - We were creating control flow that didn't exist in the IR.
  2. memcmp.ll - Choosing -1 or 1 is the case that got me looking at this again. I think we could avoid the push/pop in some cases if we used 'movzbl %al' instead of an xor on a different reg? That's a post-DAG problem, though.
  3. mul-constant-result.ll - The trade-off between sbb+not vs. setne+neg could be addressed if that's a regression, but I think those would always be nearly equivalent.
  4. pr22338.ll and sext-i1.ll - These tests have undef operands, so I don't think we actually care about these diffs.
  5. sbb.ll - This shows a win for what I think is a common case: choose -1 or 0.
  6. select.ll - There's another borderline case here: cmp+sbb+or vs. test+set+lea? Also, sbb+not vs. setae+neg shows up again.
  7. select_const.ll - These are motivating cases for the enhancement; replace cmov with cheaper ops.

Diff Detail

Repository
rL LLVM

Event Timeline

spatel created this revision on Jul 12 2017, 5:10 PM.
zvi added inline comments on Jul 13 2017, 7:45 AM.
test/CodeGen/X86/memcmp.ll
Line 31 (on Diff #106343)

A write to AL followed by a read from EAX may cause a partial-register stall, or a lesser penalty if the processor supports special 'merge register parts' micro-ops (which is also undesirable).
This seems to be a recurring pattern as the tests show.

zvi added a subscriber (aaboud) on Jul 13 2017, 7:46 AM.
spatel added inline comments on Jul 13 2017, 8:29 AM.
test/CodeGen/X86/memcmp.ll
Line 31 (on Diff #106343)

Good point. FWIW, I think the memcmp diffs will disappear if D34904 is accepted. But given that this is a general problem, the answer might be in adjusting the x86-fixup-setcc pass? That's where the 'movzwl' is replaced by 'xorl' IIUC.

spatel added inline comments on Jul 13 2017, 8:45 AM.
test/CodeGen/X86/memcmp.ll
Line 31 (on Diff #106343)

On second thought, the whole point of that pass is to avoid partial-register stalls, so if there's still a problem for a CPU even with the leading xor to clear the reg, then we should just avoid this transform completely?

craig.topper added inline comments.
test/CodeGen/X86/memcmp.ll
Line 31 (on Diff #106343)

There shouldn't be a merge penalty after a zeroing idiom. So the one at line 23 should protect it. It looks like the zeroing in BB#2 should be unnecessary.

zvi added inline comments on Jul 13 2017, 2:49 PM.
test/CodeGen/X86/memcmp.ll
Line 31 (on Diff #106343)

I missed the xor on line 23 - sorry, my bad.

spatel updated this revision to Diff 108960 on Jul 31 2017, 12:01 PM.

Ping.

Patch rebased after rL309597:
Note that the memcmp code with the potentially questionable partial-reg codegen has changed. We're producing setcc+movzbl more consistently now, but I'm not sure why x86-fixup-setcc doesn't transform those.

> Note that the memcmp code with the potentially questionable partial-reg codegen has changed. We're producing setcc+movzbl more consistently now, but I'm not sure why x86-fixup-setcc doesn't transform those.

Disregard that - I didn't scroll down far enough. Sometimes we use movzbl and other times we use xor, and I don't know what causes the difference. IMO the improvements stand independent of that question/problem, but I plan to look at that next.

spatel added a comment on Aug 1 2017, 8:30 AM.

> Sometimes we use movzbl and other times we use xor, and I don't know what causes the difference. IMO the improvements stand independent of that question/problem, but I plan to look at that next.

I stepped through a couple of the memcmp examples in 'X86 Fixup SetCC'. The difference is that we only transform to xor if we can find the instruction that def'd the flags in the same BB. In the memcmp examples, if there's a 'cmp' in the res_block, we'll get the xor transform, but if the flags are defined by a sub in a preceding block, we'll see movzbl instead. I think either way avoids partial-reg problems in these examples. I'm still looking at memcmp expansion improvements, so these differences may disappear for memcmp.

zvi accepted this revision on Aug 6 2017, 5:51 AM.

LGTM

This revision is now accepted and ready to land (Aug 6 2017, 5:51 AM).
This revision was automatically updated to reflect the committed changes.
spatel reopened this revision on Aug 7 2017, 8:59 AM.

Reopening - the patch was reverted at rL310264 because it caused/exposed failures in test-suite jpeg tests:
https://bugs.llvm.org/show_bug.cgi?id=34097
https://bugs.llvm.org/show_bug.cgi?id=34105

This revision is now accepted and ready to land (Aug 7 2017, 8:59 AM).
spatel updated this revision to Diff 110421 on Aug 9 2017, 10:08 AM.

Patch updated:
As shown in PR34097 ( https://bugs.llvm.org/show_bug.cgi?id=34097 ), I failed to account for the subtract overflow case, so this update adds a check for that.

Ideally, we'll update this all to use xor/and+add for all constants and avoid that issue (mul+add is really only here because that matches to LEA). For now, this is still the smallest code and codegen diff, so I think it's best to go with that and make sure I haven't introduced any other bugs.

This revision was automatically updated to reflect the committed changes.
aivchenk removed a subscriber: aivchenk.