This is an archive of the discontinued LLVM Phabricator instance.

[InstCombine] allow more than one use for vector cast folding with selects
ClosedPublic

Authored by spatel on Jun 9 2016, 10:50 AM.

Details

Summary

The motivating example for this transform is similar to D20774, where bitcasts interfere with a single cmp/select sequence, but in this case we have two uses of each bitcast to produce min and max ops:

define void @minmax_bc_store(<4 x float> %a, <4 x float> %b, <4 x float>* %ptr1, <4 x float>* %ptr2) {
  %cmp = fcmp olt <4 x float> %a, %b
  %bc1 = bitcast <4 x float> %a to <4 x i32>
  %bc2 = bitcast <4 x float> %b to <4 x i32>
  %sel1 = select <4 x i1> %cmp, <4 x i32> %bc1, <4 x i32> %bc2
  %sel2 = select <4 x i1> %cmp, <4 x i32> %bc2, <4 x i32> %bc1
  %bc3 = bitcast <4 x float>* %ptr1 to <4 x i32>*
  store <4 x i32> %sel1, <4 x i32>* %bc3
  %bc4 = bitcast <4 x float>* %ptr2 to <4 x i32>*
  store <4 x i32> %sel2, <4 x i32>* %bc4
  ret void
}

With this patch, we move the selects up to use the input arguments, which allows getting rid of all of the bitcasts:

define void @minmax_bc_store(<4 x float> %a, <4 x float> %b, <4 x float>* %ptr1, <4 x float>* %ptr2) {
  %cmp = fcmp olt <4 x float> %a, %b
  %sel1.v = select <4 x i1> %cmp, <4 x float> %a, <4 x float> %b
  %sel2.v = select <4 x i1> %cmp, <4 x float> %b, <4 x float> %a
  store <4 x float> %sel1.v, <4 x float>* %ptr1, align 16
  store <4 x float> %sel2.v, <4 x float>* %ptr2, align 16
  ret void
}

The asm for x86 SSE then improves from:

movaps	%xmm0, %xmm2
cmpltps	%xmm1, %xmm2
movaps	%xmm2, %xmm3
andnps	%xmm1, %xmm3
movaps	%xmm2, %xmm4
andnps	%xmm0, %xmm4
andps	%xmm2, %xmm0
orps	%xmm3, %xmm0
andps	%xmm1, %xmm2
orps	%xmm4, %xmm2
movaps	%xmm0, (%rdi)
movaps	%xmm2, (%rsi)

To:

movaps	%xmm0, %xmm2
minps	%xmm1, %xmm2
maxps	%xmm0, %xmm1
movaps	%xmm2, (%rdi)
movaps	%xmm1, (%rsi)
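In InstCombine terms, the transform hoists the select above the bitcasts. The following is a minimal C++ sketch of that shape using LLVM's PatternMatch and IRBuilder APIs; the function name and structure are illustrative only, not the actual code in InstCombineSelect.cpp:

#include "llvm/IR/DerivedTypes.h"
#include "llvm/IR/IRBuilder.h"
#include "llvm/IR/Instructions.h"
#include "llvm/IR/PatternMatch.h"
using namespace llvm;
using namespace PatternMatch;

// Illustrative only: fold select(C, bitcast A, bitcast B) into
// bitcast(select(C, A, B)) when A and B share a type.
static Value *foldSelectOfBitcasts(SelectInst &Sel, IRBuilder<> &Builder) {
  Value *Cond = Sel.getCondition();
  Value *A, *B;
  if (!match(Sel.getTrueValue(), m_BitCast(m_Value(A))) ||
      !match(Sel.getFalseValue(), m_BitCast(m_Value(B))) ||
      A->getType() != B->getType())
    return nullptr;

  // A vector condition selects per element, so the source type must keep
  // the same element count (a bitcast may change it, e.g. <4 x i32> to
  // <2 x i64>).
  if (auto *CondVTy = dyn_cast<VectorType>(Cond->getType())) {
    auto *SrcVTy = dyn_cast<VectorType>(A->getType());
    if (!SrcVTy || SrcVTy->getNumElements() != CondVTy->getNumElements())
      return nullptr;
  }

  // Deliberately no one-use check on the bitcasts: they are free at
  // codegen time, so they may stay alive for other users.
  Value *NewSel = Builder.CreateSelect(Cond, A, B, Sel.getName() + ".v");
  return Builder.CreateBitCast(NewSel, Sel.getType());
}

Because a bitcast is a no-op at codegen time, leaving the original bitcasts alive for their other users (here, the twin select that forms the max) costs nothing, which is what justifies relaxing the one-use restriction for bitcasts.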

Diff Detail

Repository
rL LLVM

Event Timeline

spatel updated this revision to Diff 60197. Jun 9 2016, 10:50 AM
spatel retitled this revision from to [InstCombine] allow more than one use for vector cast folding with selects.
spatel updated this object.
spatel added reviewers: majnemer, eli.friedman, RKSimon.
spatel added a subscriber: llvm-commits.
eli.friedman edited edge metadata. Jun 9 2016, 11:52 AM

Is it possible that this could cause an infinite loop in instcombine? Previously, this transform always reduced the total number of bitcasts in the function, but this doesn't. (Consider the case where the select uses its own result.)

lib/Transforms/InstCombine/InstCombineSelect.cpp
151 ↗(On Diff #60197)

Need to fix comment here?

spatel added a comment.

> Is it possible that this could cause an infinite loop in instcombine? Previously, this transform always reduced the total number of bitcasts in the function, but this doesn't. (Consider the case where the select uses its own result.)

Sorry for not seeing it - the select uses its own result via a phi? Can you show the construct that you have in mind?

eli.friedman added a comment.

Something like this?

loop:
  %sel = select <4 x i1> %cmp, <4 x i32> %selx, <4 x i32> %selx
  %selx = bitcast <4 x i32> %sel to <4 x float>
  br label %loop

Your optimization flips the types of the select and the bitcast, I think. Obviously not an actual testcase because it's missing PHI nodes, but that's the basic idea.

spatel added a comment. Jun 9 2016, 1:45 PM

> Something like this?
>
> loop:
>   %sel = select <4 x i1> %cmp, <4 x i32> %selx, <4 x i32> %selx
>   %selx = bitcast <4 x i32> %sel to <4 x float>
>   br label %loop
>
> Your optimization flips the types of the select and the bitcast, I think. Obviously not an actual testcase because it's missing PHI nodes, but that's the basic idea.

Interesting... I'm trying to be more diabolical, but I can't get it yet. :)
In order for the bitcasted output to feed back into the original instruction, it would have to be bitcasted back to the original type somewhere along the way? In that case, I think we'd eliminate the bitcasts as they get paired up:

define void @infloop(<4 x i1> %cmp, <4 x i32> %a, <4 x i32> %b) {
entry:
  br label %loop

loop:
  %phi1 = phi <4 x i32> [ %a, %entry ], [ %self1, %loop ]
  %phi2 = phi <4 x i32> [ %b, %entry ], [ %self2, %loop ]
  %selx1 = bitcast <4 x i32> %phi1 to <4 x float>
  %selx2 = bitcast <4 x i32> %phi2 to <4 x float>
  %sel1 = select <4 x i1> %cmp, <4 x float> %selx1, <4 x float> %selx2
  %sel2 = select <4 x i1> %cmp, <4 x float> %selx2, <4 x float> %selx1
  %self1 = bitcast <4 x float> %sel1 to <4 x i32>
  %self2 = bitcast <4 x float> %sel2 to <4 x i32>
  br label %loop

  ret void
}

$ ./opt -instcombine infloop.ll -S

define void @infloop(<4 x i1> %cmp, <4 x i32> %a, <4 x i32> %b) {
entry:
  br label %loop

loop:                                             ; preds = %loop, %entry
  %phi1 = phi <4 x i32> [ %a, %entry ], [ %sel1.v, %loop ]
  %phi2 = phi <4 x i32> [ %b, %entry ], [ %sel2.v, %loop ]
  %sel1.v = select <4 x i1> %cmp, <4 x i32> %phi1, <4 x i32> %phi2
  %sel2.v = select <4 x i1> %cmp, <4 x i32> %phi2, <4 x i32> %phi1
  br label %loop
                                                  ; No predecessors!
  ret void
}

eli.friedman added a comment.

Looking a bit more, I think the infinite loop isn't possible because of the way instcombine works with PHI nodes and the reachable code restriction. Sorry about the false alarm.

spatel added a comment. Jun 9 2016, 3:01 PM

> Looking a bit more, I think the infinite loop isn't possible because of the way instcombine works with PHI nodes and the reachable code restriction. Sorry about the false alarm.

No problem - thanks for making me look harder at the possibilities. I'll upload a new draft with a code comment change.

spatel updated this revision to Diff 60246. Jun 9 2016, 3:04 PM
spatel edited edge metadata.

Patch updated:
Add comment to better explain the one-use restriction.
Also, add a TODO comment for cleanup because there's a strange combo of isa/dyn_cast/llvm_unreachable below here.
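To make the one-use distinction concrete, here is a hypothetical sketch (not the committed diff) of the shape such a check can take: a bitcast is free at codegen time and so may keep other users, while any other cast must be one-use so the fold cannot duplicate real work.

#include "llvm/IR/Instructions.h"
using namespace llvm;

// Hypothetical helper, not the committed code: may a select be hoisted
// above this cast?
static bool canHoistSelectAboveCast(CastInst *CI) {
  // A bitcast lowers to nothing, so keeping it alive for other users
  // (e.g. the twin select that forms the max) costs nothing.
  if (isa<BitCastInst>(CI))
    return true;
  // Any other cast (trunc, zext, sitofp, ...) does real work, so it must
  // have exactly one use or the fold would duplicate that work.
  return CI->hasOneUse();
}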

eli.friedman accepted this revision. Jun 16 2016, 10:48 AM
eli.friedman edited edge metadata.

This patch doesn't only apply to bitcasts, which can lead to gigantic codegen changes in some cases. That isn't a new problem, though; consider:

define void @min_max_trunc(<4 x float> %a, <4 x float> %b, <4 x i64> %c, <4 x i64> %d, <4 x i32>* %ptr1, <4 x i32>* %ptr2) {
  %cmp = fcmp olt <4 x float> %a, %b
  %bc1 = trunc <4 x i64> %c to <4 x i32>
  %bc2 = trunc <4 x i64> %d to <4 x i32>
  %sel1 = select <4 x i1> %cmp, <4 x i32> %bc1, <4 x i32> %bc2
  store <4 x i32> %sel1, <4 x i32>* %ptr1
  ret void
}

instcombine makes this generate much worse code for SSE2, although I'm pretty sure we can blame SelectionDAG for some part of that because it's generating absolutely terrible code. Feel free to just file a bug for this, but I'm pretty sure we need some sort of target-hook for this.
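No such hook exists in TargetTransformInfo at the time of this review; purely as an illustration, a heuristic of that flavor might look like the sketch below, where the function name, its parameters, and the MaxLegalVectorBits threshold are all invented for this example.

#include "llvm/IR/Type.h"
using namespace llvm;

// Invented for illustration; no such hook exists in TargetTransformInfo.
// Idea: only hoist a select above a cast if the select in the wider
// source type still fits the target's vector registers.
static bool shouldHoistSelectAboveCast(Type *SrcTy, Type *DstTy,
                                       unsigned MaxLegalVectorBits) {
  // Bitcasts never change the total bit width, so they are always fine.
  if (SrcTy->getPrimitiveSizeInBits() == DstTy->getPrimitiveSizeInBits())
    return true;
  // For a widening hoist (the select moves from DstTy up to SrcTy),
  // require the source type to fit in a legal vector register.
  return SrcTy->getPrimitiveSizeInBits() <= MaxLegalVectorBits;
}

With a 128-bit limit for SSE2, the <4 x i64> operands in the trunc example above would be rejected, keeping the select in the narrow type.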

It would be nice to throw together a few testcases for zext/sext/trunc/sitofp/fptoui just to make sure we have coverage.

Otherwise LGTM.

This revision is now accepted and ready to land. Jun 16 2016, 10:48 AM

spatel added a comment.

> This patch doesn't only apply to bitcasts, which can lead to gigantic codegen changes in some cases.
>
> ...
>
> Feel free to just file a bug for this, but I'm pretty sure we need some sort of target-hook for this.

Thanks:
https://llvm.org/bugs/show_bug.cgi?id=28160

I think I should limit this patch to only bitcasts to make it safer?

eli.friedman added a comment.

> I think I should limit this patch to only bitcasts to make it safer?

If you like. Probably not a big deal either way, given the transforms we already perform.

This revision was automatically updated to reflect the committed changes.