diff --git a/llvm/lib/Transforms/Vectorize/LoopVectorize.cpp b/llvm/lib/Transforms/Vectorize/LoopVectorize.cpp --- a/llvm/lib/Transforms/Vectorize/LoopVectorize.cpp +++ b/llvm/lib/Transforms/Vectorize/LoopVectorize.cpp @@ -1079,6 +1079,8 @@ if (Instr && Instr->hasPoisonGeneratingFlags()) { if (auto *VPW = dyn_cast(CurRec)) VPW->dropPoisonGeneratingFlags(); + else if (auto *GEP = dyn_cast(CurRec)) + GEP->dropPoisonGeneratingFlags(); else State.MayGeneratePoisonRecipes.insert(CurRec); } diff --git a/llvm/lib/Transforms/Vectorize/VPlan.h b/llvm/lib/Transforms/Vectorize/VPlan.h --- a/llvm/lib/Transforms/Vectorize/VPlan.h +++ b/llvm/lib/Transforms/Vectorize/VPlan.h @@ -943,6 +943,7 @@ OverflowingBinOp, PossiblyExactOp, FPMathOp, + InBoundsOp, Other }; OperationType OpType; @@ -950,6 +951,7 @@ unsigned HasNUW : 1; unsigned HasNSW : 1; unsigned IsExact : 1; + unsigned IsInBounds : 1; unsigned AllowReassoc : 1; unsigned NoNaNs : 1; unsigned NoInfs : 1; @@ -981,6 +983,9 @@ } else if (auto *Op = dyn_cast(&I)) { IsExact = Op->isExact(); OpType = OperationType::PossiblyExactOp; + } else if (auto *GEP = dyn_cast(&I)) { + IsInBounds = GEP->isInBounds(); + OpType = OperationType::InBoundsOp; } else if (auto *Op = dyn_cast(&I)) { FastMathFlags FMF = Op->getFastMathFlags(); AllowReassoc = FMF.allowReassoc(); @@ -999,6 +1004,7 @@ HasNUW = false; HasNSW = false; IsExact = false; + IsInBounds = false; NoNaNs = false; NoInfs = false; } @@ -1018,7 +1024,11 @@ "Exact flag not available"); return IsExact; } - + bool isInBounds() const { + assert(OpType == OperationType::InBoundsOp && + "inbounds flag not available"); + return IsInBounds; + } FastMathFlags getFastMathFlags() const { assert(OpType == OperationType::FPMathOp && "FMFs not available"); FastMathFlags FMFs; @@ -1043,6 +1053,8 @@ I->setHasNoSignedWrap(); } else if (OpType == OperationType::FPMathOp && getFastMathFlags().any()) I->setFastMathFlags(getFastMathFlags()); + else if (OpType == OperationType::InBoundsOp && isInBounds()) + cast(I)->setIsInBounds(); } }; @@ -1173,7 +1185,9 @@ }; /// A recipe for handling GEP instructions. -class VPWidenGEPRecipe : public VPRecipeBase, public VPValue { +class VPWidenGEPRecipe : public VPRecipeBase, + public VPValue, + public VPOpWithIRFlags { bool isPointerLoopInvariant() const { return getOperand(0)->isDefinedOutsideVectorRegions(); } @@ -1191,7 +1205,8 @@ public: template VPWidenGEPRecipe(GetElementPtrInst *GEP, iterator_range Operands) - : VPRecipeBase(VPDef::VPWidenGEPSC, Operands), VPValue(this, GEP) {} + : VPRecipeBase(VPDef::VPWidenGEPSC, Operands), VPValue(this, GEP), + VPOpWithIRFlags(*GEP) {} ~VPWidenGEPRecipe() override = default; diff --git a/llvm/lib/Transforms/Vectorize/VPlanRecipes.cpp b/llvm/lib/Transforms/Vectorize/VPlanRecipes.cpp --- a/llvm/lib/Transforms/Vectorize/VPlanRecipes.cpp +++ b/llvm/lib/Transforms/Vectorize/VPlanRecipes.cpp @@ -800,6 +800,7 @@ // collectLoopScalars() and teach getVectorValue() to broadcast // the lane-zero scalar value. auto *Clone = State.Builder.Insert(GEP->clone()); + transferFlags(Clone); for (unsigned Part = 0; Part < State.UF; ++Part) { Value *EntryPart = State.Builder.CreateVectorSplat(State.VF, Clone); State.set(this, EntryPart, Part); @@ -831,18 +832,10 @@ Indices.push_back(State.get(Operand, Part)); } - // If the GEP instruction is vectorized and was in a basic block that - // needed predication, we can't propagate the poison-generating 'inbounds' - // flag. The control flow has been linearized and the GEP is no longer - // guarded by the predicate, which could make the 'inbounds' properties to - // no longer hold. - bool IsInBounds = - GEP->isInBounds() && State.MayGeneratePoisonRecipes.count(this) == 0; - // Create the new GEP. Note that this GEP may be a scalar if VF == 1, // but it should be a vector, otherwise. auto *NewGEP = State.Builder.CreateGEP(GEP->getSourceElementType(), Ptr, - Indices, "", IsInBounds); + Indices, "", isInBounds()); assert((State.VF.isScalar() || NewGEP->getType()->isVectorTy()) && "NewGEP is not a pointer vector"); State.set(this, NewGEP, Part);