diff --git a/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp b/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp --- a/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp +++ b/llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp @@ -6434,24 +6434,35 @@ auto Op2Info = getOperandInfo(VL, OpIdx, /*EnableFP=*/false); SmallVector Operands(VL0->operand_values()); - InstructionCost ScalarEltCost = - TTI->getArithmeticInstrCost(E->getOpcode(), ScalarTy, CostKind, - Op1Info, Op2Info, - Operands, VL0); + InstructionCost ScalarCost = 0; + for (unsigned i = 0, e = VL.size(); i < e; ++i) + ScalarCost += TTI->getArithmeticInstrCost( + E->getOpcode(), ScalarTy, CostKind, Op1Info, Op2Info, Operands, + isa(VL[i]) ? cast(VL[i]) : nullptr); + if (NeedToShuffleReuses) { - CommonCost -= (EntryVF - VL.size()) * ScalarEltCost; + CommonCost -= + (EntryVF - VL.size()) * + TTI->getArithmeticInstrCost(E->getOpcode(), ScalarTy, CostKind, + Op1Info, Op2Info, Operands); } - InstructionCost ScalarCost = VecTy->getNumElements() * ScalarEltCost; + for (unsigned I = 0, Num = VL0->getNumOperands(); I < Num; ++I) { if (all_of(VL, [I](Value *V) { return isConstant(cast(V)->getOperand(I)); })) Operands[I] = ConstantVector::getNullValue(VecTy); } + + // Populate vector with context instructions. + SmallVector OpsForVector = {VL0}; + for (unsigned I = 1; I != VL.size(); ++I) + OpsForVector.push_back(cast(VL[I])); + InstructionCost VecCost = - TTI->getArithmeticInstrCost(E->getOpcode(), VecTy, CostKind, - Op1Info, Op2Info, - Operands, VL0); + TTI->getArithmeticInstrCost(E->getOpcode(), VecTy, CostKind, Op1Info, + Op2Info, Operands, OpsForVector); + LLVM_DEBUG(dumpTreeCosts(E, CommonCost, VecCost, ScalarCost)); return CommonCost + VecCost - ScalarCost; }