Diff 547726

llvm/include/llvm/Transforms/InstCombine/InstCombiner.h

Show First 20 Lines • Show All 46 Lines • ▼ Show 20 Lines	class LLVM_LIBRARY_VISIBILITY InstCombiner {
/// Only used to call target specific intrinsic combining.		/// Only used to call target specific intrinsic combining.
/// It must NOT be used for any other purpose, as InstCombine is a		/// It must NOT be used for any other purpose, as InstCombine is a
/// target-independent canonicalization transform.		/// target-independent canonicalization transform.
TargetTransformInfo &TTI;		TargetTransformInfo &TTI;

public:		public:
/// Maximum size of array considered when transforming.		/// Maximum size of array considered when transforming.
uint64_t MaxArraySizeForCombine = 0;		uint64_t MaxArraySizeForCombine = 0;
		/// Maximum bytes of data considered when transforming.
		uint64_t MaxDataSizeForCombine = 0;

/// An IRBuilder that automatically inserts new instructions into the		/// An IRBuilder that automatically inserts new instructions into the
/// worklist.		/// worklist.
using BuilderTy = IRBuilder<TargetFolder, IRBuilderCallbackInserter>;		using BuilderTy = IRBuilder<TargetFolder, IRBuilderCallbackInserter>;
BuilderTy &Builder;		BuilderTy &Builder;

protected:		protected:
/// A worklist of the instructions that need to be simplified.		/// A worklist of the instructions that need to be simplified.
▲ Show 20 Lines • Show All 484 Lines • Show Last 20 Lines

llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

//===- InstCombineCompares.cpp --------------------------------------------===//		//===- InstCombineCompares.cpp --------------------------------------------===//
//		//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.		// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.		// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception		// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//		//
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//
//		//
// This file implements the visitICmp and visitFCmp functions.		// This file implements the visitICmp and visitFCmp functions.
//		//
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//

#include "InstCombineInternal.h"		#include "InstCombineInternal.h"
#include "llvm/ADT/APSInt.h"		#include "llvm/ADT/APSInt.h"
		#include "llvm/ADT/MapVector.h"
#include "llvm/ADT/SetVector.h"		#include "llvm/ADT/SetVector.h"
#include "llvm/ADT/Statistic.h"		#include "llvm/ADT/Statistic.h"
#include "llvm/Analysis/CaptureTracking.h"		#include "llvm/Analysis/CaptureTracking.h"
#include "llvm/Analysis/CmpInstAnalysis.h"		#include "llvm/Analysis/CmpInstAnalysis.h"
#include "llvm/Analysis/ConstantFolding.h"		#include "llvm/Analysis/ConstantFolding.h"
#include "llvm/Analysis/InstructionSimplify.h"		#include "llvm/Analysis/InstructionSimplify.h"
#include "llvm/Analysis/VectorUtils.h"		#include "llvm/Analysis/VectorUtils.h"
#include "llvm/IR/ConstantRange.h"		#include "llvm/IR/ConstantRange.h"
		#include "llvm/IR/Constants.h"
#include "llvm/IR/DataLayout.h"		#include "llvm/IR/DataLayout.h"
#include "llvm/IR/GetElementPtrTypeIterator.h"		#include "llvm/IR/GetElementPtrTypeIterator.h"
#include "llvm/IR/IntrinsicInst.h"		#include "llvm/IR/IntrinsicInst.h"
#include "llvm/IR/PatternMatch.h"		#include "llvm/IR/PatternMatch.h"
		#include "llvm/Support/Casting.h"
#include "llvm/Support/KnownBits.h"		#include "llvm/Support/KnownBits.h"
#include "llvm/Transforms/InstCombine/InstCombiner.h"		#include "llvm/Transforms/InstCombine/InstCombiner.h"

using namespace llvm;		using namespace llvm;
using namespace PatternMatch;		using namespace PatternMatch;

#define DEBUG_TYPE "instcombine"		#define DEBUG_TYPE "instcombine"

▲ Show 20 Lines • Show All 68 Lines • ▼ Show 20 Lines
/// this into some simple computation that does not need the load. For example		/// this into some simple computation that does not need the load. For example
/// we can optimize "icmp eq (load (gep "foo", 0, i)), 0" into "icmp eq i, 3".		/// we can optimize "icmp eq (load (gep "foo", 0, i)), 0" into "icmp eq i, 3".
///		///
/// If AndCst is non-null, then the loaded value is masked with that constant		/// If AndCst is non-null, then the loaded value is masked with that constant
/// before doing the comparison. This handles cases like "A[i]&4 == 0".		/// before doing the comparison. This handles cases like "A[i]&4 == 0".
Instruction *InstCombinerImpl::foldCmpLoadFromIndexedGlobal(		Instruction *InstCombinerImpl::foldCmpLoadFromIndexedGlobal(
LoadInst LI, GetElementPtrInst GEP, GlobalVariable *GV, CmpInst &ICI,		LoadInst LI, GetElementPtrInst GEP, GlobalVariable *GV, CmpInst &ICI,
ConstantInt *AndCst) {		ConstantInt *AndCst) {
if (LI->isVolatile() \|\| LI->getType() != GEP->getResultElementType() \|\|		if (LI->isVolatile() \|\| !GV->isConstant() \|\| !GV->hasDefinitiveInitializer())
GV->getValueType() != GEP->getSourceElementType() \|\|
!GV->isConstant() \|\| !GV->hasDefinitiveInitializer())
return nullptr;		return nullptr;

Constant *Init = GV->getInitializer();		Constant *Init = GV->getInitializer();
if (!isa<ConstantArray>(Init) && !isa<ConstantDataArray>(Init))		uint64_t DataSize = DL.getTypeAllocSize(Init->getType());
return nullptr;

uint64_t ArrayElementCount = Init->getType()->getArrayNumElements();
// Don't blow up on huge arrays.		// Don't blow up on huge arrays.
if (ArrayElementCount > MaxArraySizeForCombine)		if (DataSize > MaxDataSizeForCombine)
return nullptr;		return nullptr;

// There are many forms of this optimization we can handle, for now, just do		Type *LoadedTy = LI->getType();
// the simple index into a single-dimensional array.		uint64_t LoadedTySize = DL.getTypeAllocSize(LoadedTy);
//		uint64_t PtrBitwidth = DL.getIndexSizeInBits(GEP->getPointerAddressSpace());
// Require: GEP GV, 0, i {{, constant indices}}		Type *PtrIdxTy = DL.getIndexType(GEP->getType());
if (GEP->getNumOperands() < 3 \|\|
!isa<ConstantInt>(GEP->getOperand(1)) \|\|
!cast<ConstantInt>(GEP->getOperand(1))->isZero() \|\|
isa<Constant>(GEP->getOperand(2)))
return nullptr;

// Check that indices after the variable are constants and in-range for the
// type they index. Collect the indices. This is typically for arrays of
// structs.
SmallVector<unsigned, 4> LaterIndices;

Type *EltTy = Init->getType()->getArrayElementType();
for (unsigned i = 3, e = GEP->getNumOperands(); i != e; ++i) {
ConstantInt *Idx = dyn_cast<ConstantInt>(GEP->getOperand(i));
if (!Idx) return nullptr; // Variable index.

uint64_t IdxVal = Idx->getZExtValue();
if ((unsigned)IdxVal != IdxVal) return nullptr; // Too large array index.

if (StructType *STy = dyn_cast<StructType>(EltTy))
EltTy = STy->getElementType(IdxVal);
else if (ArrayType *ATy = dyn_cast<ArrayType>(EltTy)) {
if (IdxVal >= ATy->getNumElements()) return nullptr;
EltTy = ATy->getElementType();
} else {
return nullptr; // Unknown type.
}

LaterIndices.push_back(IdxVal);		MapVector<Value *, APInt> VariableOffsets;
}		APInt ConstantOffset(PtrBitwidth, 0);
		GEP->collectOffset(GEP->getModule()->getDataLayout(), PtrBitwidth,
		VariableOffsets, ConstantOffset);

		// Restrict to one variable currently.
		if (VariableOffsets.size() != 1)
		return nullptr;

		// There are many forms of this optimization we can handle.
		// Limit to one variable currently.
		// Possible TODO: Fold: cmp(A[ax + by + ... + C], Rhs) <=> cmp(ax + by + ....
		// + C, IndexRhs)
enum { Overdefined = -3, Undefined = -2 };		enum { Overdefined = -3, Undefined = -2 };

// Variables for our state machines.		// Variables for our state machines.

// FirstTrueElement/SecondTrueElement - Used to emit a comparison of the form		// FirstTrueElement/SecondTrueElement - Used to emit a comparison of the form
// "i == 47 \| i == 87", where 47 is the first index the condition is true for,		// "i == 47 \| i == 87", where 47 is the first index the condition is true for,
// and 87 is the second (and last) index. FirstTrueElement is -2 when		// and 87 is the second (and last) index. FirstTrueElement is -2 when
// undefined, otherwise set to the first true element. SecondTrueElement is		// undefined, otherwise set to the first true element. SecondTrueElement is
Show All 12 Lines	Instruction *InstCombinerImpl::foldCmpLoadFromIndexedGlobal(
/// use relative comparisons and don't want 0-1 to match -1.		/// use relative comparisons and don't want 0-1 to match -1.
int TrueRangeEnd = Undefined, FalseRangeEnd = Undefined;		int TrueRangeEnd = Undefined, FalseRangeEnd = Undefined;

// MagicBitvector - This is a magic bitvector where we set a bit if the		// MagicBitvector - This is a magic bitvector where we set a bit if the
// comparison is true for element 'i'. If there are 64 elements or less in		// comparison is true for element 'i'. If there are 64 elements or less in
// the array, this will fully represent all the comparison results.		// the array, this will fully represent all the comparison results.
uint64_t MagicBitvector = 0;		uint64_t MagicBitvector = 0;

		Value *Idx = nullptr;

// Scan the array and see if one of our patterns matches.		// Scan the array and see if one of our patterns matches.
Constant *CompareRHS = cast<Constant>(ICI.getOperand(1));		Constant *ComparedRHS = cast<Constant>(ICI.getOperand(1));
for (unsigned i = 0, e = ArrayElementCount; i != e; ++i) {		APInt LongestStep = VariableOffsets.front().second;
Constant *Elt = Init->getAggregateElement(i);		uint64_t LongestStepZExt = LongestStep.getZExtValue();
if (!Elt) return nullptr;		int64_t BeginOffset = ConstantOffset.getSExtValue();

// If this is indexing an array of structures, get the structure element.		// Make BeginOffset the smallest offset >= 0
if (!LaterIndices.empty()) {		if (BeginOffset % LongestStepZExt == 0)
Elt = ConstantFoldExtractValueInstruction(Elt, LaterIndices);		BeginOffset = 0;
		else if (BeginOffset < 0)
		BeginOffset += (-BeginOffset / LongestStepZExt + 1) * LongestStepZExt;
		else if (BeginOffset > 0)
		BeginOffset -= (BeginOffset / LongestStepZExt) * LongestStepZExt;

		uint64_t ElementCountToTraverse = (DataSize - BeginOffset) / LongestStepZExt;

		// Don't traverse too many times.
		if (ElementCountToTraverse > MaxArraySizeForCombine)
		return nullptr;

		for (uint64_t i = 0; i < ElementCountToTraverse; ++i) {
		APInt CurrentOffset(i * LongestStep + BeginOffset);
		Constant *Elt =
		ConstantFoldLoadFromConstPtr(GV, LoadedTy, CurrentOffset, DL);

if (!Elt)		if (!Elt)
return nullptr;		return nullptr;
}

// If the element is masked, handle it.		// If the element is masked, handle it.
if (AndCst) {		if (AndCst) {
Elt = ConstantFoldBinaryOpOperands(Instruction::And, Elt, AndCst, DL);		Elt = ConstantFoldBinaryOpOperands(Instruction::And, Elt, AndCst, DL);
if (!Elt)		if (!Elt)
return nullptr;		return nullptr;
}		}

// Find out if the comparison would be true or false for the i'th element.		// Find out if the comparison would be true or false for the i'th element.
Constant *C = ConstantFoldCompareInstOperands(ICI.getPredicate(), Elt,		Constant *C = ConstantFoldCompareInstOperands(ICI.getPredicate(), Elt,
CompareRHS, DL, &TLI);		ComparedRHS, DL, &TLI);
// If the result is undef for this element, ignore it.		// If the result is undef for this element, ignore it.
if (isa<UndefValue>(C)) {		if (isa<UndefValue>(C)) {
// Extend range state machines to cover this element in case there is an		// Extend range state machines to cover this element in case there is an
// undef in the middle of the range.		// undef in the middle of the range.
if (TrueRangeEnd == (int)i-1)		if (TrueRangeEnd == (int)i - 1)
TrueRangeEnd = i;		TrueRangeEnd = i;
if (FalseRangeEnd == (int)i-1)		if (FalseRangeEnd == (int)i - 1)
FalseRangeEnd = i;		FalseRangeEnd = i;
continue;		continue;
}		}

// If we can't compute the result for any of the elements, we have to give		// If we can't compute the result for any of the elements, we have to give
// up evaluating the entire conditional.		// up evaluating the entire conditional.
if (!isa<ConstantInt>(C)) return nullptr;		if (!isa<ConstantInt>(C))
		return nullptr;

// Otherwise, we know if the comparison is true or false for this element,		// Otherwise, we know if the comparison is true or false for this element,
// update our state machines.		// update our state machines.
bool IsTrueForElt = !cast<ConstantInt>(C)->isZero();		bool IsTrueForElt = !cast<ConstantInt>(C)->isZero();

// State machine for single/double/range index comparison.		// State machine for single/double/range index comparison.
if (IsTrueForElt) {		if (IsTrueForElt) {
// Update the TrueElement state machine.		// Update the TrueElement state machine.
if (FirstTrueElement == Undefined)		if (FirstTrueElement == Undefined)
FirstTrueElement = TrueRangeEnd = i; // First true element.		FirstTrueElement = TrueRangeEnd = i; // First true element.
else {		else {
// Update double-compare state machine.		// Update double-compare state machine.
if (SecondTrueElement == Undefined)		if (SecondTrueElement == Undefined)
SecondTrueElement = i;		SecondTrueElement = i;
else		else
SecondTrueElement = Overdefined;		SecondTrueElement = Overdefined;

// Update range state machine.		// Update range state machine.
if (TrueRangeEnd == (int)i-1)		if (TrueRangeEnd == (int)i - 1)
TrueRangeEnd = i;		TrueRangeEnd = i;
else		else
TrueRangeEnd = Overdefined;		TrueRangeEnd = Overdefined;
}		}
} else {		} else {
// Update the FalseElement state machine.		// Update the FalseElement state machine.
if (FirstFalseElement == Undefined)		if (FirstFalseElement == Undefined)
FirstFalseElement = FalseRangeEnd = i; // First false element.		FirstFalseElement = FalseRangeEnd = i; // First false element.
else {		else {
// Update double-compare state machine.		// Update double-compare state machine.
if (SecondFalseElement == Undefined)		if (SecondFalseElement == Undefined)
SecondFalseElement = i;		SecondFalseElement = i;
else		else
SecondFalseElement = Overdefined;		SecondFalseElement = Overdefined;

// Update range state machine.		// Update range state machine.
if (FalseRangeEnd == (int)i-1)		if (FalseRangeEnd == (int)i - 1)
FalseRangeEnd = i;		FalseRangeEnd = i;
else		else
FalseRangeEnd = Overdefined;		FalseRangeEnd = Overdefined;
}		}
}		}

// If this element is in range, update our magic bitvector.		// If this element is in range, update our magic bitvector.
if (i < 64 && IsTrueForElt)		if (i < 64 && IsTrueForElt)
MagicBitvector \|= 1ULL << i;		MagicBitvector \|= 1ULL << i;

// If all of our states become overdefined, bail out early. Since the		// If all of our states become overdefined, bail out early. Since the
// predicate is expensive, only check it every 8 elements. This is only		// predicate is expensive, only check it every 8 elements. This is only
// really useful for really huge arrays.		// really useful for really huge arrays.
if ((i & 8) == 0 && i >= 64 && SecondTrueElement == Overdefined &&		if ((i & 8) == 0 && i >= 64 && SecondTrueElement == Overdefined &&
SecondFalseElement == Overdefined && TrueRangeEnd == Overdefined &&		SecondFalseElement == Overdefined && TrueRangeEnd == Overdefined &&
FalseRangeEnd == Overdefined)		FalseRangeEnd == Overdefined)
return nullptr;		return nullptr;
}		}

// Now that we've scanned the entire array, emit our new comparison(s). We		// Now that we've scanned the entire array, emit our new comparison(s). We
// order the state machines in complexity of the generated code.		// order the state machines in complexity of the generated code.
Value *Idx = GEP->getOperand(2);

// If the index is larger than the pointer offset size of the target, truncate
// the index down like the GEP would do implicitly. We don't have to do this
// for an inbounds GEP because the index can't be out of range.
if (!GEP->isInBounds()) {
Type *PtrIdxTy = DL.getIndexType(GEP->getType());
unsigned OffsetSize = PtrIdxTy->getIntegerBitWidth();
if (Idx->getType()->getPrimitiveSizeInBits().getFixedValue() > OffsetSize)
Idx = Builder.CreateTrunc(Idx, PtrIdxTy);
}

// If inbounds keyword is not present, Idx * ElementSize can overflow.		// If inbounds keyword is not present, Idx * LongestStep can overflow.
// Let's assume that ElementSize is 2 and the wanted value is at offset 0.		// Let's assume that LongestStep is 2 and the wanted value is at offset 0.
// Then, there are two possible values for Idx to match offset 0:		// Then, there are two possible values for Idx to match offset 0:
// 0x00..00, 0x80..00.		// 0x00..00, 0x80..00.
// Emitting 'icmp eq Idx, 0' isn't correct in this case because the		// Emitting 'icmp eq Idx, 0' isn't correct in this case because the
// comparison is false if Idx was 0x80..00.		// comparison is false if Idx was 0x80..00.
// We need to erase the highest countTrailingZeros(ElementSize) bits of Idx.		// We need to erase the highest countTrailingZeros(ElementSize) bits of Idx.
unsigned ElementSize =
DL.getTypeAllocSize(Init->getType()->getArrayElementType());
auto MaskIdx = [&](Value *Idx) {		auto MaskIdx = [&](Value *Idx) {
if (!GEP->isInBounds() && llvm::countr_zero(ElementSize) != 0) {		if (!GEP->isInBounds() && llvm::countr_zero(LongestStepZExt) != 0) {
Value *Mask = ConstantInt::get(Idx->getType(), -1);		Value *Mask = ConstantInt::get(Idx->getType(), -1);
Mask = Builder.CreateLShr(Mask, llvm::countr_zero(ElementSize));		Mask = Builder.CreateLShr(Mask, llvm::countr_zero(LongestStepZExt));
Idx = Builder.CreateAnd(Idx, Mask);		Idx = Builder.CreateAnd(Idx, Mask);
}		}
return Idx;		return Idx;
};		};

		// Build the index expression lazily.
		auto GenerateIndexIfNull = [&](Value *CurIdx) {
		if (CurIdx)
		return CurIdx;

		// Initial bias for index. For example, when we fold C[x + 3] into
		// x < 2, we actually regard it as x < 5 - 3
		Value *Idx =
		ConstantInt::get(PtrIdxTy->getContext(),
		(BeginOffset - ConstantOffset).sdiv(LongestStepZExt));
		for (auto [Var, Coefficient] : VariableOffsets) {
		uint64_t VarBitWidth = Var->getType()->getScalarSizeInBits();
		uint64_t IdxBitWidth = Idx->getType()->getScalarSizeInBits();
		Type *WiderType =
		VarBitWidth > IdxBitWidth ? Var->getType() : Idx->getType();

		Var = Builder.CreateSExtOrTrunc(Var, WiderType);
		Idx = Builder.CreateSExtOrTrunc(Idx, WiderType);
		APInt MinCoeffi = Coefficient.sdiv(LongestStep)
		.sextOrTrunc(WiderType->getScalarSizeInBits());
		Value *Mul =
		Builder.CreateMul(Var, ConstantInt::get(WiderType, MinCoeffi));
		Idx = Builder.CreateAdd(Idx, Mul);
		}

		// If the index is larger than the pointer offset size of the target,
		// truncate the index down like the GEP would do implicitly. We don't have
		// to do this for an inbounds GEP because the index can't be out of range.
		if (!GEP->isInBounds() &&
		Idx->getType()->getScalarSizeInBits() > PtrBitwidth)
		Idx = Builder.CreateTrunc(Idx, PtrIdxTy);

		return Idx;
		};

// If the comparison is only true for one or two elements, emit direct		// If the comparison is only true for one or two elements, emit direct
// comparisons.		// comparisons.
if (SecondTrueElement != Overdefined) {		if (SecondTrueElement != Overdefined) {
Idx = MaskIdx(Idx);		Idx = MaskIdx(GenerateIndexIfNull(Idx));
// None true -> false.		// None true -> false.
if (FirstTrueElement == Undefined)		if (FirstTrueElement == Undefined)
return replaceInstUsesWith(ICI, Builder.getFalse());		return replaceInstUsesWith(ICI, Builder.getFalse());

Value *FirstTrueIdx = ConstantInt::get(Idx->getType(), FirstTrueElement);		Value *FirstTrueIdx = ConstantInt::get(Idx->getType(), FirstTrueElement);

// True for one element -> 'i == 47'.		// True for one element -> 'i == 47'.
if (SecondTrueElement == Undefined)		if (SecondTrueElement == Undefined)
return new ICmpInst(ICmpInst::ICMP_EQ, Idx, FirstTrueIdx);		return new ICmpInst(ICmpInst::ICMP_EQ, Idx, FirstTrueIdx);

// True for two elements -> 'i == 47 \| i == 72'.		// True for two elements -> 'i == 47 \| i == 72'.
Value *C1 = Builder.CreateICmpEQ(Idx, FirstTrueIdx);		Value *C1 = Builder.CreateICmpEQ(Idx, FirstTrueIdx);
Value *SecondTrueIdx = ConstantInt::get(Idx->getType(), SecondTrueElement);		Value *SecondTrueIdx = ConstantInt::get(Idx->getType(), SecondTrueElement);
Value *C2 = Builder.CreateICmpEQ(Idx, SecondTrueIdx);		Value *C2 = Builder.CreateICmpEQ(Idx, SecondTrueIdx);
return BinaryOperator::CreateOr(C1, C2);		return BinaryOperator::CreateOr(C1, C2);
}		}

// If the comparison is only false for one or two elements, emit direct		// If the comparison is only false for one or two elements, emit direct
// comparisons.		// comparisons.
if (SecondFalseElement != Overdefined) {		if (SecondFalseElement != Overdefined) {
Idx = MaskIdx(Idx);		Idx = MaskIdx(GenerateIndexIfNull(Idx));
// None false -> true.		// None false -> true.
if (FirstFalseElement == Undefined)		if (FirstFalseElement == Undefined)
return replaceInstUsesWith(ICI, Builder.getTrue());		return replaceInstUsesWith(ICI, Builder.getTrue());

Value *FirstFalseIdx = ConstantInt::get(Idx->getType(), FirstFalseElement);		Value *FirstFalseIdx = ConstantInt::get(Idx->getType(), FirstFalseElement);

// False for one element -> 'i != 47'.		// False for one element -> 'i != 47'.
if (SecondFalseElement == Undefined)		if (SecondFalseElement == Undefined)
return new ICmpInst(ICmpInst::ICMP_NE, Idx, FirstFalseIdx);		return new ICmpInst(ICmpInst::ICMP_NE, Idx, FirstFalseIdx);

// False for two elements -> 'i != 47 & i != 72'.		// False for two elements -> 'i != 47 & i != 72'.
Value *C1 = Builder.CreateICmpNE(Idx, FirstFalseIdx);		Value *C1 = Builder.CreateICmpNE(Idx, FirstFalseIdx);
Value *SecondFalseIdx = ConstantInt::get(Idx->getType(),SecondFalseElement);		Value *SecondFalseIdx =
		ConstantInt::get(Idx->getType(), SecondFalseElement);
Value *C2 = Builder.CreateICmpNE(Idx, SecondFalseIdx);		Value *C2 = Builder.CreateICmpNE(Idx, SecondFalseIdx);
return BinaryOperator::CreateAnd(C1, C2);		return BinaryOperator::CreateAnd(C1, C2);
}		}

// If the comparison can be replaced with a range comparison for the elements		// If the comparison can be replaced with a range comparison for the elements
// where it is true, emit the range check.		// where it is true, emit the range check.
if (TrueRangeEnd != Overdefined) {		if (TrueRangeEnd != Overdefined) {
assert(TrueRangeEnd != FirstTrueElement && "Should emit single compare");		assert(TrueRangeEnd != FirstTrueElement && "Should emit single compare");
Idx = MaskIdx(Idx);		Idx = MaskIdx(GenerateIndexIfNull(Idx));

// Generate (i-FirstTrue) <u (TrueRangeEnd-FirstTrue+1).		// Generate (i-FirstTrue) <u (TrueRangeEnd-FirstTrue+1).
if (FirstTrueElement) {		if (FirstTrueElement) {
Value *Offs = ConstantInt::get(Idx->getType(), -FirstTrueElement);		Value *Offs = ConstantInt::get(Idx->getType(), -FirstTrueElement);
Idx = Builder.CreateAdd(Idx, Offs);		Idx = Builder.CreateAdd(Idx, Offs);
}		}

Value *End = ConstantInt::get(Idx->getType(),		Value *End =
TrueRangeEnd-FirstTrueElement+1);		ConstantInt::get(PtrIdxTy, TrueRangeEnd - FirstTrueElement + 1);
return new ICmpInst(ICmpInst::ICMP_ULT, Idx, End);		return new ICmpInst(ICmpInst::ICMP_ULT, Idx, End);
}		}

// False range check.		// False range check.
if (FalseRangeEnd != Overdefined) {		if (FalseRangeEnd != Overdefined) {
assert(FalseRangeEnd != FirstFalseElement && "Should emit single compare");		assert(FalseRangeEnd != FirstFalseElement && "Should emit single compare");
Idx = MaskIdx(Idx);		Idx = MaskIdx(GenerateIndexIfNull(Idx));
// Generate (i-FirstFalse) >u (FalseRangeEnd-FirstFalse).		// Generate (i-FirstFalse) >u (FalseRangeEnd-FirstFalse).
if (FirstFalseElement) {		if (FirstFalseElement) {
Value *Offs = ConstantInt::get(Idx->getType(), -FirstFalseElement);		Value *Offs = ConstantInt::get(Idx->getType(), -FirstFalseElement);
Idx = Builder.CreateAdd(Idx, Offs);		Idx = Builder.CreateAdd(Idx, Offs);
}		}

Value *End = ConstantInt::get(Idx->getType(),		Value *End =
FalseRangeEnd-FirstFalseElement);		ConstantInt::get(Idx->getType(), FalseRangeEnd - FirstFalseElement);
return new ICmpInst(ICmpInst::ICMP_UGT, Idx, End);		return new ICmpInst(ICmpInst::ICMP_UGT, Idx, End);
}		}

// If a magic bitvector captures the entire comparison state		// If a magic bitvector captures the entire comparison state
// of this load, replace it with computation that does:		// of this load, replace it with computation that does:
// ((magic_cst >> i) & 1) != 0		// ((magic_cst >> i) & 1) != 0
{		{
Type *Ty = nullptr;		Type *Ty = nullptr;

// Look for an appropriate type:		// Look for an appropriate type:
// - The type of Idx if the magic fits		// - The type of Idx if the magic fits
// - The smallest fitting legal type		// - The smallest fitting legal type
if (ArrayElementCount <= Idx->getType()->getIntegerBitWidth())
Ty = Idx->getType();		if (ElementCountToTraverse <= PtrIdxTy->getIntegerBitWidth())
		Ty = PtrIdxTy;
else		else
Ty = DL.getSmallestLegalIntType(Init->getContext(), ArrayElementCount);		Ty = DL.getSmallestLegalIntType(Init->getContext(),
		ElementCountToTraverse);

if (Ty) {		if (Ty) {
Idx = MaskIdx(Idx);		Idx = MaskIdx(GenerateIndexIfNull(Idx));
Value *V = Builder.CreateIntCast(Idx, Ty, false);		Value *V = Builder.CreateIntCast(Idx, Ty, false);
V = Builder.CreateLShr(ConstantInt::get(Ty, MagicBitvector), V);		V = Builder.CreateLShr(ConstantInt::get(Ty, MagicBitvector), V);
V = Builder.CreateAnd(ConstantInt::get(Ty, 1), V);		V = Builder.CreateAnd(ConstantInt::get(Ty, 1), V);
return new ICmpInst(ICmpInst::ICMP_NE, V, ConstantInt::get(Ty, 0));		return new ICmpInst(ICmpInst::ICMP_NE, V, ConstantInt::get(Ty, 0));
}		}
}		}

return nullptr;		return nullptr;
▲ Show 20 Lines • Show All 7,262 Lines • Show Last 20 Lines

llvm/lib/Transforms/InstCombine/InstructionCombining.cpp

Show First 20 Lines • Show All 4,326 Lines • ▼ Show 20 Lines	while (true) {

++NumWorklistIterations;		++NumWorklistIterations;
LLVM_DEBUG(dbgs() << "\n\nINSTCOMBINE ITERATION #" << Iteration << " on "		LLVM_DEBUG(dbgs() << "\n\nINSTCOMBINE ITERATION #" << Iteration << " on "
<< F.getName() << "\n");		<< F.getName() << "\n");

InstCombinerImpl IC(Worklist, Builder, F.hasMinSize(), AA, AC, TLI, TTI, DT,		InstCombinerImpl IC(Worklist, Builder, F.hasMinSize(), AA, AC, TLI, TTI, DT,
ORE, BFI, PSI, DL, LI);		ORE, BFI, PSI, DL, LI);
IC.MaxArraySizeForCombine = MaxArraySize;		IC.MaxArraySizeForCombine = MaxArraySize;
		IC.MaxDataSizeForCombine = MaxArraySize * 8;

bool MadeChangeInThisIteration = IC.prepareWorklist(F, RPOT);		bool MadeChangeInThisIteration = IC.prepareWorklist(F, RPOT);
MadeChangeInThisIteration \|= IC.run();		MadeChangeInThisIteration \|= IC.run();
if (!MadeChangeInThisIteration)		if (!MadeChangeInThisIteration)
break;		break;

MadeIRChange = true;		MadeIRChange = true;
if (Iteration > MaxIterations) {		if (Iteration > MaxIterations) {
report_fatal_error(		report_fatal_error(
▲ Show 20 Lines • Show All 135 Lines • Show Last 20 Lines

llvm/test/Transforms/InstCombine/load-cmp.ll

Show First 20 Lines • Show All 209 Lines • ▼ Show 20 Lines	;
%p = getelementptr inbounds %Foo, ptr @GS, i32 %x, i32 0		%p = getelementptr inbounds %Foo, ptr @GS, i32 %x, i32 0
%q = load i32, ptr %p		%q = load i32, ptr %p
%r = icmp eq i32 %q, 9		%r = icmp eq i32 %q, 9
ret i1 %r		ret i1 %r
}		}

define i1 @test10_struct_noinbounds(i32 %x) {		define i1 @test10_struct_noinbounds(i32 %x) {
; CHECK-LABEL: @test10_struct_noinbounds(		; CHECK-LABEL: @test10_struct_noinbounds(
; CHECK-NEXT: [[P:%.]] = getelementptr [[FOO:%.]], ptr @GS, i32 [[X:%.*]], i32 0		; CHECK-NEXT: ret i1 false
; CHECK-NEXT: [[Q:%.*]] = load i32, ptr [[P]], align 8
; CHECK-NEXT: [[R:%.*]] = icmp eq i32 [[Q]], 9
; CHECK-NEXT: ret i1 [[R]]
;		;
%p = getelementptr %Foo, ptr @GS, i32 %x, i32 0		%p = getelementptr %Foo, ptr @GS, i32 %x, i32 0
%q = load i32, ptr %p		%q = load i32, ptr %p
%r = icmp eq i32 %q, 9		%r = icmp eq i32 %q, 9
ret i1 %r		ret i1 %r
}		}

; Test that the GEP indices are converted before we ever get here		; Test that the GEP indices are converted before we ever get here
Show All 17 Lines	;
%p = getelementptr inbounds %Foo, ptr @GS, i64 %x, i32 0		%p = getelementptr inbounds %Foo, ptr @GS, i64 %x, i32 0
%q = load i32, ptr %p		%q = load i32, ptr %p
%r = icmp eq i32 %q, 0		%r = icmp eq i32 %q, 0
ret i1 %r		ret i1 %r
}		}

define i1 @test10_struct_noinbounds_i16(i16 %x) {		define i1 @test10_struct_noinbounds_i16(i16 %x) {
; CHECK-LABEL: @test10_struct_noinbounds_i16(		; CHECK-LABEL: @test10_struct_noinbounds_i16(
; CHECK-NEXT: [[TMP1:%.]] = sext i16 [[X:%.]] to i32		; CHECK-NEXT: ret i1 false
; CHECK-NEXT: [[P:%.]] = getelementptr [[FOO:%.]], ptr @GS, i32 [[TMP1]], i32 0
; CHECK-NEXT: [[Q:%.*]] = load i32, ptr [[P]], align 8
; CHECK-NEXT: [[R:%.*]] = icmp eq i32 [[Q]], 0
; CHECK-NEXT: ret i1 [[R]]
;		;
%p = getelementptr %Foo, ptr @GS, i16 %x, i32 0		%p = getelementptr %Foo, ptr @GS, i16 %x, i32 0
%q = load i32, ptr %p		%q = load i32, ptr %p
%r = icmp eq i32 %q, 0		%r = icmp eq i32 %q, 0
ret i1 %r		ret i1 %r
}		}

define i1 @test10_struct_arr(i32 %x) {		define i1 @test10_struct_arr(i32 %x) {
; CHECK-LABEL: @test10_struct_arr(		; CHECK-LABEL: @test10_struct_arr(
; CHECK-NEXT: [[R:%.]] = icmp ne i32 [[X:%.]], 1		; CHECK-NEXT: [[TMP1:%.]] = and i32 [[X:%.]], -3
		; CHECK-NEXT: [[R:%.*]] = icmp eq i32 [[TMP1]], 0
; CHECK-NEXT: ret i1 [[R]]		; CHECK-NEXT: ret i1 [[R]]
;		;
%p = getelementptr inbounds [4 x %Foo], ptr @GStructArr, i32 0, i32 %x, i32 2		%p = getelementptr inbounds [4 x %Foo], ptr @GStructArr, i32 0, i32 %x, i32 2
%q = load i32, ptr %p		%q = load i32, ptr %p
%r = icmp eq i32 %q, 9		%r = icmp eq i32 %q, 9
ret i1 %r		ret i1 %r
}		}

define i1 @test10_struct_arr_noinbounds(i32 %x) {		define i1 @test10_struct_arr_noinbounds(i32 %x) {
; CHECK-LABEL: @test10_struct_arr_noinbounds(		; CHECK-LABEL: @test10_struct_arr_noinbounds(
; CHECK-NEXT: [[TMP1:%.]] = and i32 [[X:%.]], 268435455		; CHECK-NEXT: [[TMP1:%.]] = and i32 [[X:%.]], 268435453
; CHECK-NEXT: [[R:%.*]] = icmp ne i32 [[TMP1]], 1		; CHECK-NEXT: [[R:%.*]] = icmp eq i32 [[TMP1]], 0
; CHECK-NEXT: ret i1 [[R]]		; CHECK-NEXT: ret i1 [[R]]
;		;
%p = getelementptr [4 x %Foo], ptr @GStructArr, i32 0, i32 %x, i32 2		%p = getelementptr [4 x %Foo], ptr @GStructArr, i32 0, i32 %x, i32 2
%q = load i32, ptr %p		%q = load i32, ptr %p
%r = icmp eq i32 %q, 9		%r = icmp eq i32 %q, 9
ret i1 %r		ret i1 %r
}		}

define i1 @test10_struct_arr_i16(i16 %x) {		define i1 @test10_struct_arr_i16(i16 %x) {
; CHECK-LABEL: @test10_struct_arr_i16(		; CHECK-LABEL: @test10_struct_arr_i16(
; CHECK-NEXT: [[R:%.]] = icmp ne i16 [[X:%.]], 1		; CHECK-NEXT: [[TMP1:%.]] = and i16 [[X:%.]], -3
		; CHECK-NEXT: [[R:%.*]] = icmp eq i16 [[TMP1]], 0
; CHECK-NEXT: ret i1 [[R]]		; CHECK-NEXT: ret i1 [[R]]
;		;
%p = getelementptr inbounds [4 x %Foo], ptr @GStructArr, i16 0, i16 %x, i32 2		%p = getelementptr inbounds [4 x %Foo], ptr @GStructArr, i16 0, i16 %x, i32 2
%q = load i32, ptr %p		%q = load i32, ptr %p
%r = icmp eq i32 %q, 9		%r = icmp eq i32 %q, 9
ret i1 %r		ret i1 %r
}		}

define i1 @test10_struct_arr_i64(i64 %x) {		define i1 @test10_struct_arr_i64(i64 %x) {
; CHECK-LABEL: @test10_struct_arr_i64(		; CHECK-LABEL: @test10_struct_arr_i64(
; CHECK-NEXT: [[TMP1:%.]] = and i64 [[X:%.]], 4294967295		; CHECK-NEXT: [[TMP1:%.]] = and i64 [[X:%.]], 4294967293
; CHECK-NEXT: [[R:%.*]] = icmp ne i64 [[TMP1]], 1		; CHECK-NEXT: [[R:%.*]] = icmp eq i64 [[TMP1]], 0
; CHECK-NEXT: ret i1 [[R]]		; CHECK-NEXT: ret i1 [[R]]
;		;
%p = getelementptr inbounds [4 x %Foo], ptr @GStructArr, i64 0, i64 %x, i32 2		%p = getelementptr inbounds [4 x %Foo], ptr @GStructArr, i64 0, i64 %x, i32 2
%q = load i32, ptr %p		%q = load i32, ptr %p
%r = icmp eq i32 %q, 9		%r = icmp eq i32 %q, 9
ret i1 %r		ret i1 %r
}		}

define i1 @test10_struct_arr_noinbounds_i16(i16 %x) {		define i1 @test10_struct_arr_noinbounds_i16(i16 %x) {
; CHECK-LABEL: @test10_struct_arr_noinbounds_i16(		; CHECK-LABEL: @test10_struct_arr_noinbounds_i16(
; CHECK-NEXT: [[TMP1:%.]] = sext i16 [[X:%.]] to i32		; CHECK-NEXT: [[TMP1:%.]] = sext i16 [[X:%.]] to i32
; CHECK-NEXT: [[TMP2:%.*]] = and i32 [[TMP1]], 268435455		; CHECK-NEXT: [[TMP2:%.*]] = and i32 [[TMP1]], 268435453
; CHECK-NEXT: [[R:%.*]] = icmp ne i32 [[TMP2]], 1		; CHECK-NEXT: [[R:%.*]] = icmp eq i32 [[TMP2]], 0
; CHECK-NEXT: ret i1 [[R]]		; CHECK-NEXT: ret i1 [[R]]
;		;
%p = getelementptr [4 x %Foo], ptr @GStructArr, i32 0, i16 %x, i32 2		%p = getelementptr [4 x %Foo], ptr @GStructArr, i32 0, i16 %x, i32 2
%q = load i32, ptr %p		%q = load i32, ptr %p
%r = icmp eq i32 %q, 9		%r = icmp eq i32 %q, 9
ret i1 %r		ret i1 %r
}		}

define i1 @test10_struct_arr_noinbounds_i64(i64 %x) {		define i1 @test10_struct_arr_noinbounds_i64(i64 %x) {
; CHECK-LABEL: @test10_struct_arr_noinbounds_i64(		; CHECK-LABEL: @test10_struct_arr_noinbounds_i64(
; CHECK-NEXT: [[TMP1:%.]] = and i64 [[X:%.]], 268435455		; CHECK-NEXT: [[TMP1:%.]] = and i64 [[X:%.]], 268435453
; CHECK-NEXT: [[R:%.*]] = icmp ne i64 [[TMP1]], 1		; CHECK-NEXT: [[R:%.*]] = icmp eq i64 [[TMP1]], 0
; CHECK-NEXT: ret i1 [[R]]		; CHECK-NEXT: ret i1 [[R]]
;		;
%p = getelementptr [4 x %Foo], ptr @GStructArr, i32 0, i64 %x, i32 2		%p = getelementptr [4 x %Foo], ptr @GStructArr, i32 0, i64 %x, i32 2
%q = load i32, ptr %p		%q = load i32, ptr %p
%r = icmp eq i32 %q, 9		%r = icmp eq i32 %q, 9
ret i1 %r		ret i1 %r
}		}


@CG = constant [4 x i32] [i32 1, i32 2, i32 3, i32 4]		@CG = constant [4 x i32] [i32 1, i32 2, i32 3, i32 4]

		; TODO: Fold it globally.
define i1 @cmp_load_constant_array0(i64 %x){		define i1 @cmp_load_constant_array0(i64 %x){
; CHECK-LABEL: @cmp_load_constant_array0(		; CHECK-LABEL: @cmp_load_constant_array0(
; CHECK-NEXT: entry:		; CHECK-NEXT: entry:
; CHECK-NEXT: [[COND:%.*]] = icmp ult i64 [[X:%.*]], 2		; CHECK-NEXT: [[COND:%.*]] = icmp ult i64 [[X:%.*]], 2
; CHECK-NEXT: br i1 [[COND]], label [[CASE1:%.*]], label [[CASE2:%.*]]		; CHECK-NEXT: br i1 [[COND]], label [[CASE1:%.*]], label [[CASE2:%.*]]
; CHECK: case2:		; CHECK: case2:
; CHECK-NEXT: ret i1 false		; CHECK-NEXT: ret i1 false
; CHECK: case1:		; CHECK: case1:
; CHECK-NEXT: [[TMP0:%.*]] = trunc i64 [[X]] to i32		; CHECK-NEXT: [[TMP0:%.*]] = and i64 [[X]], 4294967294
; CHECK-NEXT: [[ISOK_PTR:%.*]] = getelementptr inbounds i32, ptr @CG, i32 [[TMP0]]		; CHECK-NEXT: [[COND_INFERRED:%.*]] = icmp eq i64 [[TMP0]], 0
		[Inline comment] XChy (Author; Unsubmitted, Not Done): Optimized well locally, but not globally.
; CHECK-NEXT: [[ISOK:%.*]] = load i32, ptr [[ISOK_PTR]], align 4
; CHECK-NEXT: [[COND_INFERRED:%.*]] = icmp ult i32 [[ISOK]], 3
; CHECK-NEXT: ret i1 [[COND_INFERRED]]		; CHECK-NEXT: ret i1 [[COND_INFERRED]]
;		;
entry:		entry:
%cond = icmp ult i64 %x, 2		%cond = icmp ult i64 %x, 2
br i1 %cond, label %case1, label %case2		br i1 %cond, label %case1, label %case2

case2:		case2:
ret i1 0		ret i1 0

case1:		case1:
%isOK_ptr = getelementptr inbounds i32, ptr @CG, i64 %x		%isOK_ptr = getelementptr inbounds i32, ptr @CG, i64 %x
%isOK = load i32, ptr %isOK_ptr		%isOK = load i32, ptr %isOK_ptr
%cond_inferred = icmp ult i32 %isOK, 3		%cond_inferred = icmp ult i32 %isOK, 3
ret i1 %cond_inferred		ret i1 %cond_inferred
}		}

define i1 @cmp_load_constant_array1(i64 %x){		define i1 @cmp_load_constant_array1(i64 %x){
; CHECK-LABEL: @cmp_load_constant_array1(		; CHECK-LABEL: @cmp_load_constant_array1(
; CHECK-NEXT: entry:		; CHECK-NEXT: entry:
; CHECK-NEXT: [[COND:%.*]] = icmp ult i64 [[X:%.*]], 2		; CHECK-NEXT: [[COND:%.*]] = icmp ult i64 [[X:%.*]], 2
; CHECK-NEXT: br i1 [[COND]], label [[CASE1:%.*]], label [[CASE2:%.*]]		; CHECK-NEXT: br i1 [[COND]], label [[CASE1:%.*]], label [[CASE2:%.*]]
; CHECK: case2:		; CHECK: case2:
; CHECK-NEXT: ret i1 false		; CHECK-NEXT: ret i1 false
; CHECK: case1:		; CHECK: case1:
; CHECK-NEXT: [[TMP0:%.*]] = trunc i64 [[X]] to i32		; CHECK-NEXT: ret i1 false
; CHECK-NEXT: [[ISOK_PTR:%.*]] = getelementptr inbounds i32, ptr @CG, i32 [[TMP0]]
; CHECK-NEXT: [[ISOK:%.*]] = load i32, ptr [[ISOK_PTR]], align 4
; CHECK-NEXT: [[COND_INFERRED:%.*]] = icmp ugt i32 [[ISOK]], 10
; CHECK-NEXT: ret i1 [[COND_INFERRED]]
;		;
entry:		entry:
%cond = icmp ult i64 %x, 2		%cond = icmp ult i64 %x, 2
br i1 %cond, label %case1, label %case2		br i1 %cond, label %case1, label %case2

case2:		case2:
ret i1 0		ret i1 0

Show All 10 Lines
; CHECK-LABEL: @cmp_load_constant_array_messy(		; CHECK-LABEL: @cmp_load_constant_array_messy(
; CHECK-NEXT: entry:		; CHECK-NEXT: entry:
; CHECK-NEXT: [[COND:%.*]] = icmp slt i64 [[X:%.*]], 6		; CHECK-NEXT: [[COND:%.*]] = icmp slt i64 [[X:%.*]], 6
; CHECK-NEXT: br i1 [[COND]], label [[CASE1:%.*]], label [[CASE2:%.*]]		; CHECK-NEXT: br i1 [[COND]], label [[CASE1:%.*]], label [[CASE2:%.*]]
; CHECK: case2:		; CHECK: case2:
; CHECK-NEXT: ret i1 false		; CHECK-NEXT: ret i1 false
; CHECK: case1:		; CHECK: case1:
; CHECK-NEXT: [[TMP0:%.*]] = trunc i64 [[X]] to i32		; CHECK-NEXT: [[TMP0:%.*]] = trunc i64 [[X]] to i32
; CHECK-NEXT: [[ISOK_PTR:%.*]] = getelementptr i32, ptr @CG_MESSY, i32 [[TMP0]]		; CHECK-NEXT: [[TMP1:%.*]] = and i32 [[TMP0]], 1073741823
; CHECK-NEXT: [[ISOK:%.*]] = load i32, ptr [[ISOK_PTR]], align 4		; CHECK-NEXT: [[TMP2:%.*]] = lshr i32 373, [[TMP1]]
; CHECK-NEXT: [[COND_INFERRED:%.*]] = icmp slt i32 [[ISOK]], 5		; CHECK-NEXT: [[TMP3:%.*]] = and i32 [[TMP2]], 1
		; CHECK-NEXT: [[COND_INFERRED:%.*]] = icmp ne i32 [[TMP3]], 0
; CHECK-NEXT: ret i1 [[COND_INFERRED]]		; CHECK-NEXT: ret i1 [[COND_INFERRED]]
;		;
entry:		entry:
%cond = icmp slt i64 %x, 6		%cond = icmp slt i64 %x, 6
br i1 %cond, label %case1, label %case2		br i1 %cond, label %case1, label %case2

case2:		case2:
ret i1 0		ret i1 0

case1:		case1:
%isOK_ptr = getelementptr i32, ptr @CG_MESSY, i64 %x		%isOK_ptr = getelementptr i32, ptr @CG_MESSY, i64 %x
%isOK = load i32, ptr %isOK_ptr		%isOK = load i32, ptr %isOK_ptr
%cond_inferred = icmp slt i32 %isOK, 5		%cond_inferred = icmp slt i32 %isOK, 5
ret i1 %cond_inferred		ret i1 %cond_inferred
}		}

define i1 @cmp_diff_load_constant_array_messy0(i64 %x){		define i1 @cmp_diff_load_constant_array_messy0(i64 %x){
; CHECK-LABEL: @cmp_diff_load_constant_array_messy0(		; CHECK-LABEL: @cmp_diff_load_constant_array_messy0(
; CHECK-NEXT: [[TMP1:%.*]] = trunc i64 [[X:%.*]] to i32		; CHECK-NEXT: [[TMP1:%.*]] = trunc i64 [[X:%.*]] to i32
; CHECK-NEXT: [[ISOK_PTR:%.*]] = getelementptr i32, ptr @CG_MESSY, i32 [[TMP1]]		; CHECK-NEXT: [[TMP2:%.*]] = and i32 [[TMP1]], 1073741823
; CHECK-NEXT: [[ISOK:%.*]] = load i16, ptr [[ISOK_PTR]], align 4		; CHECK-NEXT: [[TMP3:%.*]] = lshr i32 373, [[TMP2]]
; CHECK-NEXT: [[COND_INFERRED:%.*]] = icmp slt i16 [[ISOK]], 5		; CHECK-NEXT: [[TMP4:%.*]] = and i32 [[TMP3]], 1
		; CHECK-NEXT: [[COND_INFERRED:%.*]] = icmp ne i32 [[TMP4]], 0
; CHECK-NEXT: ret i1 [[COND_INFERRED]]		; CHECK-NEXT: ret i1 [[COND_INFERRED]]
;		;
%isOK_ptr = getelementptr i32, ptr @CG_MESSY, i64 %x		%isOK_ptr = getelementptr i32, ptr @CG_MESSY, i64 %x
%isOK = load i16, ptr %isOK_ptr		%isOK = load i16, ptr %isOK_ptr
%cond_inferred = icmp slt i16 %isOK, 5		%cond_inferred = icmp slt i16 %isOK, 5
ret i1 %cond_inferred		ret i1 %cond_inferred
}		}

define i1 @cmp_diff_load_constant_array_messy1(i64 %x){		define i1 @cmp_diff_load_constant_array_messy1(i64 %x){
; CHECK-LABEL: @cmp_diff_load_constant_array_messy1(		; CHECK-LABEL: @cmp_diff_load_constant_array_messy1(
; CHECK-NEXT: [[TMP1:%.*]] = trunc i64 [[X:%.*]] to i32		; CHECK-NEXT: [[TMP1:%.*]] = and i64 [[X:%.*]], 4294967295
; CHECK-NEXT: [[ISOK_PTR:%.*]] = getelementptr i6, ptr @CG_MESSY, i32 [[TMP1]]		; CHECK-NEXT: [[TMP2:%.*]] = lshr i64 66160388071, [[TMP1]]
; CHECK-NEXT: [[ISOK:%.*]] = load i16, ptr [[ISOK_PTR]], align 2		; CHECK-NEXT: [[TMP3:%.*]] = and i64 [[TMP2]], 1
; CHECK-NEXT: [[COND_INFERRED:%.*]] = icmp slt i16 [[ISOK]], 5		; CHECK-NEXT: [[COND_INFERRED:%.*]] = icmp ne i64 [[TMP3]], 0
; CHECK-NEXT: ret i1 [[COND_INFERRED]]		; CHECK-NEXT: ret i1 [[COND_INFERRED]]
;		;
%isOK_ptr = getelementptr i6, ptr @CG_MESSY, i64 %x		%isOK_ptr = getelementptr i6, ptr @CG_MESSY, i64 %x
%isOK = load i16, ptr %isOK_ptr		%isOK = load i16, ptr %isOK_ptr
%cond_inferred = icmp slt i16 %isOK, 5		%cond_inferred = icmp slt i16 %isOK, 5
ret i1 %cond_inferred		ret i1 %cond_inferred
}		}

define i1 @cmp_load_constant_array_fail0(i64 %x, i32 %y) {		define i1 @cmp_load_constant_array_fail0(i64 %x, i32 %y) {
; CHECK-LABEL: @cmp_load_constant_array_fail0(		; CHECK-LABEL: @cmp_load_constant_array_fail0(
; CHECK-NEXT: entry:		; CHECK-NEXT: entry:
Show All 16 Lines	case2:
ret i1 0		ret i1 0

case1:		case1:
%isOK_ptr = getelementptr inbounds i32, ptr @CG, i64 %x		%isOK_ptr = getelementptr inbounds i32, ptr @CG, i64 %x
%isOK = load i32, ptr %isOK_ptr		%isOK = load i32, ptr %isOK_ptr
%cond_inferred = icmp ult i32 %isOK, %y		%cond_inferred = icmp ult i32 %isOK, %y
ret i1 %cond_inferred		ret i1 %cond_inferred
}		}

llvm/test/Transforms/InstCombine/opaque-ptr.ll

Show First 20 Lines • Show All 469 Lines • ▼ Show 20 Lines	;
%gep = getelementptr [4 x i8], ptr @ary, i64 0, i64 %idx		%gep = getelementptr [4 x i8], ptr @ary, i64 0, i64 %idx
%load = load i8, ptr %gep		%load = load i8, ptr %gep
%cmp = icmp eq i8 %load, 3		%cmp = icmp eq i8 %load, 3
ret i1 %cmp		ret i1 %cmp
}		}

define i1 @cmp_load_gep_global_different_load_type(i64 %idx) {		define i1 @cmp_load_gep_global_different_load_type(i64 %idx) {
; CHECK-LABEL: @cmp_load_gep_global_different_load_type(		; CHECK-LABEL: @cmp_load_gep_global_different_load_type(
; CHECK-NEXT: [[GEP:%.*]] = getelementptr [4 x i8], ptr @ary, i64 0, i64 [[IDX:%.*]]		; CHECK-NEXT: ret i1 false
; CHECK-NEXT: [[LOAD:%.*]] = load i16, ptr [[GEP]], align 2
; CHECK-NEXT: [[CMP:%.*]] = icmp eq i16 [[LOAD]], 3
; CHECK-NEXT: ret i1 [[CMP]]
;		;
%gep = getelementptr [4 x i8], ptr @ary, i64 0, i64 %idx		%gep = getelementptr [4 x i8], ptr @ary, i64 0, i64 %idx
%load = load i16, ptr %gep		%load = load i16, ptr %gep
%cmp = icmp eq i16 %load, 3		%cmp = icmp eq i16 %load, 3
ret i1 %cmp		ret i1 %cmp
}		}

define i1 @cmp_load_gep_global_different_gep_type(i64 %idx) {		define i1 @cmp_load_gep_global_different_gep_type(i64 %idx) {
; CHECK-LABEL: @cmp_load_gep_global_different_gep_type(		; CHECK-LABEL: @cmp_load_gep_global_different_gep_type(
; CHECK-NEXT: [[GEP:%.*]] = getelementptr [4 x i16], ptr @ary, i64 0, i64 [[IDX:%.*]]		; CHECK-NEXT: ret i1 false
; CHECK-NEXT: [[LOAD:%.*]] = load i16, ptr [[GEP]], align 2
; CHECK-NEXT: [[CMP:%.*]] = icmp eq i16 [[LOAD]], 3
; CHECK-NEXT: ret i1 [[CMP]]
;		;
%gep = getelementptr [4 x i16], ptr @ary, i64 0, i64 %idx		%gep = getelementptr [4 x i16], ptr @ary, i64 0, i64 %idx
%load = load i16, ptr %gep		%load = load i16, ptr %gep
%cmp = icmp eq i16 %load, 3		%cmp = icmp eq i16 %load, 3
ret i1 %cmp		ret i1 %cmp
}		}

define ptr @phi_of_gep(i1 %c, ptr %p) {		define ptr @phi_of_gep(i1 %c, ptr %p) {
▲ Show 20 Lines • Show All 181 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[InstCombine] Fold icmp(constants[x]) when the range of x is given
Needs ReviewPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 547726

llvm/include/llvm/Transforms/InstCombine/InstCombiner.h

llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp

llvm/lib/Transforms/InstCombine/InstructionCombining.cpp

llvm/test/Transforms/InstCombine/load-cmp.ll

llvm/test/Transforms/InstCombine/opaque-ptr.ll

This is an archive of the discontinued LLVM Phabricator instance.

[InstCombine] Fold icmp(constants[x]) when the range of x is given — Needs Review · Public

Details

Diff Detail

Event Timeline

Revision Contents

Diff 547726

llvm/include/llvm/Transforms/InstCombine/InstCombiner.h

llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp

llvm/lib/Transforms/InstCombine/InstructionCombining.cpp

llvm/test/Transforms/InstCombine/load-cmp.ll

llvm/test/Transforms/InstCombine/opaque-ptr.ll

[InstCombine] Fold icmp(constants[x]) when the range of x is given
Needs ReviewPublic