diff --git a/llvm/lib/Target/X86/X86TargetTransformInfo.cpp b/llvm/lib/Target/X86/X86TargetTransformInfo.cpp --- a/llvm/lib/Target/X86/X86TargetTransformInfo.cpp +++ b/llvm/lib/Target/X86/X86TargetTransformInfo.cpp @@ -3253,50 +3253,131 @@ return BaseT::getMemoryOpCost(Opcode, Src, Alignment, AddressSpace, CostKind); - // Handle non-power-of-two vectors such as <3 x float> and <48 x i16> - if (auto *VTy = dyn_cast(Src)) { - const unsigned NumElem = VTy->getNumElements(); - if (!isPowerOf2_32(NumElem)) { - // Factorize NumElem into sum of power-of-two. - InstructionCost Cost = 0; - unsigned NumElemDone = 0; - for (unsigned NumElemLeft = NumElem, Factor; - Factor = PowerOf2Floor(NumElemLeft), NumElemLeft > 0; - NumElemLeft -= Factor) { - Type *SubTy = FixedVectorType::get(VTy->getScalarType(), Factor); - unsigned SubTyBytes = SubTy->getPrimitiveSizeInBits() / 8; - - Cost += - getMemoryOpCost(Opcode, SubTy, Alignment, AddressSpace, CostKind); - - std::pair LST = - TLI->getTypeLegalizationCost(DL, SubTy); - if (!LST.second.isVector()) { - APInt DemandedElts = - APInt::getBitsSet(NumElem, NumElemDone, NumElemDone + Factor); - Cost += getScalarizationOverhead(VTy, DemandedElts, - Opcode == Instruction::Load, - Opcode == Instruction::Store); - } - - NumElemDone += Factor; - Alignment = commonAlignment(Alignment.valueOrOne(), SubTyBytes); - } - assert(NumElemDone == NumElem && "Processed wrong element count?"); - return Cost; - } - } - // Legalize the type. std::pair LT = TLI->getTypeLegalizationCost(DL, Src); - // Each load/store unit costs 1. - InstructionCost Cost = LT.first * 1; + auto *VTy = dyn_cast(Src); - // This isn't exactly right. We're using slow unaligned 32-byte accesses as a - // proxy for a double-pumped AVX memory interface such as on Sandybridge. - if (LT.second.getStoreSize() == 32 && ST->isUnalignedMem32Slow()) - Cost *= 2; + // Handle the simple case of non-vectors. + // NOTE: this assumes that legalization never creates vector from scalars! + if (!VTy || !LT.second.isVector()) + // Each load/store unit costs 1. + return LT.first * 1; + + bool IsLoad = Opcode == Instruction::Load; + + Type *EltTy = VTy->getElementType(); + + const int EltTyBits = DL.getTypeSizeInBits(EltTy); + + InstructionCost Cost = 0; + + // Source of truth: how many elements were there in the original IR vector? + const unsigned SrcNumElt = VTy->getNumElements(); + + // How far have we gotten? + int NumEltRemaining = SrcNumElt; + // Note that we intentionally capture by-reference, NumEltRemaining changes. + auto NumEltDone = [&]() { return SrcNumElt - NumEltRemaining; }; + + const int MaxLegalOpSizeBytes = divideCeil(LT.second.getSizeInBits(), 8); + + // Note that even if we can store 64 bits of an XMM, we still operate on XMM. + const unsigned XMMBits = 128; + if (XMMBits % EltTyBits != 0) + // Vector size must be a multiple of the element size. I.e. no padding. + return BaseT::getMemoryOpCost(Opcode, Src, Alignment, AddressSpace, + CostKind); + const int NumEltPerXMM = XMMBits / EltTyBits; + + auto *XMMVecTy = FixedVectorType::get(EltTy, NumEltPerXMM); + + for (int CurrOpSizeBytes = MaxLegalOpSizeBytes, SubVecEltsLeft = 0; + NumEltRemaining > 0; CurrOpSizeBytes /= 2) { + // How many elements would a single op deal with at once? + if ((8 * CurrOpSizeBytes) % EltTyBits != 0) + // Vector size must be a multiple of the element size. I.e. no padding. + return BaseT::getMemoryOpCost(Opcode, Src, Alignment, AddressSpace, + CostKind); + int CurrNumEltPerOp = (8 * CurrOpSizeBytes) / EltTyBits; + + assert(CurrOpSizeBytes > 0 && CurrNumEltPerOp > 0 && "How'd we get here?"); + assert((((NumEltRemaining * EltTyBits) < (2 * 8 * CurrOpSizeBytes)) || + (CurrOpSizeBytes == MaxLegalOpSizeBytes)) && + "Unless we haven't halved the op size yet, " + "we have less than two op's sized units of work left."); + + auto *CurrVecTy = CurrNumEltPerOp > NumEltPerXMM + ? FixedVectorType::get(EltTy, CurrNumEltPerOp) + : XMMVecTy; + + assert(CurrVecTy->getNumElements() % CurrNumEltPerOp == 0 && + "After halving sizes, the vector elt count is no longer a multiple " + "of number of elements per operation?"); + auto *CoalescedVecTy = + CurrNumEltPerOp == 1 + ? CurrVecTy + : FixedVectorType::get( + IntegerType::get(Src->getContext(), + EltTyBits * CurrNumEltPerOp), + CurrVecTy->getNumElements() / CurrNumEltPerOp); + assert(DL.getTypeSizeInBits(CoalescedVecTy) == + DL.getTypeSizeInBits(CurrVecTy) && + "coalesciing elements doesn't change vector width."); + + while (NumEltRemaining > 0) { + assert(SubVecEltsLeft >= 0 && "Subreg element count overconsumtion?"); + + // Can we use this vector size, as per the remaining element count? + // Iff the vector is naturally aligned, we can do a wide load regardless. + if (NumEltRemaining < CurrNumEltPerOp && + (!IsLoad || Alignment.valueOrOne() < CurrOpSizeBytes) && + CurrOpSizeBytes != 1) + break; // Try smalled vector size. + + bool Is0thSubVec = (NumEltDone() % LT.second.getVectorNumElements()) == 0; + + // If we have fully processed the previous reg, we need to replenish it. + if (SubVecEltsLeft == 0) { + SubVecEltsLeft += CurrVecTy->getNumElements(); + // And that's free only for the 0'th subvector of a legalized vector. + if (!Is0thSubVec) + Cost += getShuffleCost(IsLoad ? TTI::ShuffleKind::SK_InsertSubvector + : TTI::ShuffleKind::SK_ExtractSubvector, + VTy, None, NumEltDone(), CurrVecTy); + } + + // While we can directly load/store ZMM, YMM, and 64-bit halves of XMM, + // for smaller widths (32/16/8) we have to insert/extract them separately. + // Again, it's free for the 0'th subreg (if op is 32/64 bit wide, + // but let's pretend that it is also true for 16/8 bit wide ops...) + if (CurrOpSizeBytes <= 32 / 8 && !Is0thSubVec) { + int NumEltDoneInCurrXMM = NumEltDone() % NumEltPerXMM; + assert(NumEltDoneInCurrXMM % CurrNumEltPerOp == 0 && ""); + int CoalescedVecEltIdx = NumEltDoneInCurrXMM / CurrNumEltPerOp; + APInt DemandedElts = + APInt::getBitsSet(CoalescedVecTy->getNumElements(), + CoalescedVecEltIdx, CoalescedVecEltIdx + 1); + assert(DemandedElts.countPopulation() == 1 && "Inserting single value"); + Cost += getScalarizationOverhead(CoalescedVecTy, DemandedElts, IsLoad, + !IsLoad); + } + + // This isn't exactly right. We're using slow unaligned 32-byte accesses + // as a proxy for a double-pumped AVX memory interface such as on + // Sandybridge. + if (CurrOpSizeBytes == 32 && ST->isUnalignedMem32Slow()) + Cost += 2; + else + Cost += 1; + + SubVecEltsLeft -= CurrNumEltPerOp; + NumEltRemaining -= CurrNumEltPerOp; + Alignment = commonAlignment(Alignment.valueOrOne(), CurrOpSizeBytes); + } + } + + assert(NumEltRemaining <= 0 && "Should have processed all the elements."); return Cost; } diff --git a/llvm/test/Analysis/CostModel/X86/interleaved-load-i16-stride-3.ll b/llvm/test/Analysis/CostModel/X86/interleaved-load-i16-stride-3.ll --- a/llvm/test/Analysis/CostModel/X86/interleaved-load-i16-stride-3.ll +++ b/llvm/test/Analysis/CostModel/X86/interleaved-load-i16-stride-3.ll @@ -9,8 +9,8 @@ ; CHECK: LV: Checking a loop in "test" ; CHECK: LV: Found an estimated cost of 1 for VF 1 For instruction: %v0 = load i16, i16* %in0, align 2 -; CHECK: LV: Found an estimated cost of 14 for VF 2 For instruction: %v0 = load i16, i16* %in0, align 2 -; CHECK: LV: Found an estimated cost of 30 for VF 4 For instruction: %v0 = load i16, i16* %in0, align 2 +; CHECK: LV: Found an estimated cost of 15 for VF 2 For instruction: %v0 = load i16, i16* %in0, align 2 +; CHECK: LV: Found an estimated cost of 31 for VF 4 For instruction: %v0 = load i16, i16* %in0, align 2 ; CHECK: LV: Found an estimated cost of 58 for VF 8 For instruction: %v0 = load i16, i16* %in0, align 2 ; CHECK: LV: Found an estimated cost of 171 for VF 16 For instruction: %v0 = load i16, i16* %in0, align 2 diff --git a/llvm/test/Analysis/CostModel/X86/interleaved-store-i16-stride-3.ll b/llvm/test/Analysis/CostModel/X86/interleaved-store-i16-stride-3.ll --- a/llvm/test/Analysis/CostModel/X86/interleaved-store-i16-stride-3.ll +++ b/llvm/test/Analysis/CostModel/X86/interleaved-store-i16-stride-3.ll @@ -9,8 +9,8 @@ ; CHECK: LV: Checking a loop in "test" ; CHECK: LV: Found an estimated cost of 1 for VF 1 For instruction: store i16 %v2, i16* %out2, align 2 -; CHECK: LV: Found an estimated cost of 14 for VF 2 For instruction: store i16 %v2, i16* %out2, align 2 -; CHECK: LV: Found an estimated cost of 34 for VF 4 For instruction: store i16 %v2, i16* %out2, align 2 +; CHECK: LV: Found an estimated cost of 15 for VF 2 For instruction: store i16 %v2, i16* %out2, align 2 +; CHECK: LV: Found an estimated cost of 35 for VF 4 For instruction: store i16 %v2, i16* %out2, align 2 ; CHECK: LV: Found an estimated cost of 66 for VF 8 For instruction: store i16 %v2, i16* %out2, align 2 ; CHECK: LV: Found an estimated cost of 171 for VF 16 For instruction: store i16 %v2, i16* %out2, align 2 diff --git a/llvm/test/Analysis/CostModel/X86/load_store.ll b/llvm/test/Analysis/CostModel/X86/load_store.ll --- a/llvm/test/Analysis/CostModel/X86/load_store.ll +++ b/llvm/test/Analysis/CostModel/X86/load_store.ll @@ -21,7 +21,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store double undef, double* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i8* undef, i8** undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i1 undef, i1* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <16 x i8> undef, <16 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i16> undef, <8 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i32> undef, <4 x i32>* undef, align 4 @@ -35,7 +35,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i1> undef, <4 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i1> undef, <2 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i1> undef, <1 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 16 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <32 x i8> undef, <32 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <16 x i16> undef, <16 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x i32> undef, <8 x i32>* undef, align 4 @@ -45,8 +45,8 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x float> undef, <8 x float>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <4 x double> undef, <4 x double>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <4 x i8*> undef, <4 x i8*>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <32 x i1> undef, <32 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 32 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <32 x i1> undef, <32 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <64 x i8> undef, <64 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <32 x i16> undef, <32 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <16 x i32> undef, <16 x i32>* undef, align 4 @@ -57,7 +57,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <16 x float> undef, <16 x float>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <8 x double> undef, <8 x double>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <8 x i8*> undef, <8 x i8*>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; SSE41-LABEL: 'stores_align4' @@ -72,7 +72,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store double undef, double* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i8* undef, i8** undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i1 undef, i1* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <16 x i8> undef, <16 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i16> undef, <8 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i32> undef, <4 x i32>* undef, align 4 @@ -86,7 +86,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i1> undef, <4 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i1> undef, <2 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i1> undef, <1 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 16 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <32 x i8> undef, <32 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <16 x i16> undef, <16 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x i32> undef, <8 x i32>* undef, align 4 @@ -96,8 +96,8 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x float> undef, <8 x float>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <4 x double> undef, <4 x double>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <4 x i8*> undef, <4 x i8*>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <32 x i1> undef, <32 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 32 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <32 x i1> undef, <32 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <64 x i8> undef, <64 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <32 x i16> undef, <32 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <16 x i32> undef, <16 x i32>* undef, align 4 @@ -108,7 +108,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <16 x float> undef, <16 x float>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <8 x double> undef, <8 x double>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <8 x i8*> undef, <8 x i8*>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX-LABEL: 'stores_align4' @@ -123,7 +123,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store double undef, double* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i8* undef, i8** undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i1 undef, i1* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <16 x i8> undef, <16 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i16> undef, <8 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i32> undef, <4 x i32>* undef, align 4 @@ -137,7 +137,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i1> undef, <4 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i1> undef, <2 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i1> undef, <1 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <32 x i8> undef, <32 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <16 x i16> undef, <16 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i32> undef, <8 x i32>* undef, align 4 @@ -148,7 +148,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x double> undef, <4 x double>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i8*> undef, <4 x i8*>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <32 x i1> undef, <32 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 16 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <64 x i8> undef, <64 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <32 x i16> undef, <32 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <16 x i32> undef, <16 x i32>* undef, align 4 @@ -159,7 +159,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <16 x float> undef, <16 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x double> undef, <8 x double>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x i8*> undef, <8 x i8*>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX512-LABEL: 'stores_align4' @@ -287,10 +287,10 @@ ; Partial vectors with i64 elements (doubles as pointer-sized tests)) ; SSE2-LABEL: 'stores_partial_align4' ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i64> undef, <1 x i64>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i64> undef, <6 x i64>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x double> undef, <1 x double>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <3 x double> undef, <3 x double>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x double> undef, <5 x double>* undef, align 4 @@ -299,14 +299,14 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i32> undef, <1 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i32> undef, <2 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <3 x i32> undef, <3 x i32>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i32> undef, <7 x i32>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i32> undef, <10 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <11 x i32> undef, <11 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i32> undef, <12 x i32>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i32> undef, <15 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x float> undef, <1 x float>* undef, align 4 @@ -327,156 +327,156 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i16> undef, <3 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i16> undef, <4 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i16> undef, <5 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i16> undef, <13 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <18 x i16> undef, <18 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i16> undef, <19 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <20 x i16> undef, <20 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i16> undef, <21 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i16> undef, <29 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i8> undef, <1 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i8> undef, <2 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <3 x i8> undef, <3 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i8> undef, <4 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i8> undef, <5 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i8> undef, <8 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i8> undef, <9 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i8> undef, <25 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <34 x i8> undef, <34 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <35 x i8> undef, <35 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <36 x i8> undef, <36 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <37 x i8> undef, <37 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i8> undef, <40 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <41 x i8> undef, <41 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 11 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i8> undef, <48 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <57 x i8> undef, <57 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 12 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i1> undef, <9 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i1> undef, <14 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x i1> undef, <14 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i1> undef, <25 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; SSE41-LABEL: 'stores_partial_align4' ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i64> undef, <1 x i64>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i64> undef, <6 x i64>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x double> undef, <1 x double>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <3 x double> undef, <3 x double>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x double> undef, <5 x double>* undef, align 4 @@ -485,14 +485,14 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i32> undef, <1 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i32> undef, <2 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i32> undef, <3 x i32>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i32> undef, <7 x i32>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i32> undef, <10 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i32> undef, <11 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i32> undef, <12 x i32>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i32> undef, <15 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x float> undef, <1 x float>* undef, align 4 @@ -513,156 +513,156 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i16> undef, <3 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i16> undef, <4 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i16> undef, <5 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i16> undef, <13 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <18 x i16> undef, <18 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i16> undef, <19 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <20 x i16> undef, <20 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i16> undef, <21 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i16> undef, <29 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i8> undef, <1 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i8> undef, <2 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i8> undef, <3 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i8> undef, <4 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i8> undef, <5 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i8> undef, <8 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i8> undef, <9 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <25 x i8> undef, <25 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <34 x i8> undef, <34 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <35 x i8> undef, <35 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <36 x i8> undef, <36 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <37 x i8> undef, <37 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i8> undef, <40 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <41 x i8> undef, <41 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i8> undef, <48 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i8> undef, <57 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i1> undef, <9 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i1> undef, <14 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <25 x i1> undef, <25 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX-LABEL: 'stores_partial_align4' ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i64> undef, <1 x i64>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i64> undef, <6 x i64>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x double> undef, <1 x double>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x double> undef, <3 x double>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <5 x double> undef, <5 x double>* undef, align 4 @@ -672,361 +672,361 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i32> undef, <2 x i32>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i32> undef, <3 x i32>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i32> undef, <7 x i32>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i32> undef, <10 x i32>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i32> undef, <11 x i32>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i32> undef, <12 x i32>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i32> undef, <15 x i32>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x float> undef, <1 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x float> undef, <2 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x float> undef, <3 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x float> undef, <5 x float>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x float> undef, <6 x float>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x float> undef, <6 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x float> undef, <7 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <9 x float> undef, <9 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x float> undef, <10 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x float> undef, <11 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x float> undef, <12 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x float> undef, <13 x float>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x float> undef, <14 x float>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x float> undef, <14 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x float> undef, <15 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i16> undef, <1 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i16> undef, <2 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i16> undef, <3 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i16> undef, <4 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i16> undef, <5 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i16> undef, <13 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i16> undef, <18 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <19 x i16> undef, <19 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i16> undef, <20 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <21 x i16> undef, <21 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i16> undef, <29 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i8> undef, <1 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i8> undef, <2 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i8> undef, <3 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i8> undef, <4 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i8> undef, <5 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i8> undef, <8 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i8> undef, <9 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i8> undef, <25 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i8> undef, <34 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <35 x i8> undef, <35 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i8> undef, <36 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <37 x i8> undef, <37 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i8> undef, <40 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <41 x i8> undef, <41 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i8> undef, <48 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i8> undef, <57 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i1> undef, <9 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i1> undef, <14 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i1> undef, <25 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX512-LABEL: 'stores_partial_align4' ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i64> undef, <1 x i64>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i64> undef, <6 x i64>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i64> undef, <6 x i64>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x double> undef, <1 x double>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x double> undef, <3 x double>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x double> undef, <5 x double>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x double> undef, <6 x double>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x double> undef, <7 x double>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x double> undef, <6 x double>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x double> undef, <7 x double>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i32> undef, <1 x i32>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i32> undef, <2 x i32>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i32> undef, <3 x i32>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i32> undef, <7 x i32>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i32> undef, <10 x i32>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i32> undef, <10 x i32>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i32> undef, <11 x i32>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i32> undef, <12 x i32>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i32> undef, <15 x i32>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i32> undef, <12 x i32>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i32> undef, <15 x i32>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x float> undef, <1 x float>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x float> undef, <2 x float>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x float> undef, <3 x float>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x float> undef, <5 x float>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x float> undef, <6 x float>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x float> undef, <6 x float>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x float> undef, <7 x float>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x float> undef, <9 x float>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x float> undef, <10 x float>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x float> undef, <10 x float>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x float> undef, <11 x float>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x float> undef, <12 x float>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x float> undef, <13 x float>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x float> undef, <14 x float>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x float> undef, <15 x float>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x float> undef, <12 x float>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x float> undef, <13 x float>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x float> undef, <14 x float>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x float> undef, <15 x float>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i16> undef, <1 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i16> undef, <2 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i16> undef, <3 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i16> undef, <4 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i16> undef, <5 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i16> undef, <13 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i16> undef, <18 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i16> undef, <19 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i16> undef, <20 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <18 x i16> undef, <18 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <19 x i16> undef, <19 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <20 x i16> undef, <20 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i16> undef, <21 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i16> undef, <29 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <29 x i16> undef, <29 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i8> undef, <1 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i8> undef, <2 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i8> undef, <3 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i8> undef, <4 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i8> undef, <5 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i8> undef, <8 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i8> undef, <9 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i8> undef, <25 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i8> undef, <34 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <35 x i8> undef, <35 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i8> undef, <36 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <37 x i8> undef, <37 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i8> undef, <40 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <34 x i8> undef, <34 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <35 x i8> undef, <35 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <36 x i8> undef, <36 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <37 x i8> undef, <37 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i8> undef, <40 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <41 x i8> undef, <41 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i8> undef, <48 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i8> undef, <57 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <9 x i1> undef, <9 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i8> undef, <48 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <57 x i8> undef, <57 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 11 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i1> undef, <9 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i1> undef, <14 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <25 x i1> undef, <25 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i1> undef, <25 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; store <1 x i64> undef, <1 x i64>* undef, align 4 @@ -1267,7 +1267,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store double undef, double* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i8* undef, i8** undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i1 undef, i1* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <16 x i8> undef, <16 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i16> undef, <8 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i32> undef, <4 x i32>* undef, align 1 @@ -1281,7 +1281,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i1> undef, <4 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i1> undef, <2 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i1> undef, <1 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 16 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <32 x i8> undef, <32 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <16 x i16> undef, <16 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x i32> undef, <8 x i32>* undef, align 1 @@ -1291,8 +1291,8 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x float> undef, <8 x float>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <4 x double> undef, <4 x double>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <4 x i8*> undef, <4 x i8*>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <32 x i1> undef, <32 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 32 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <32 x i1> undef, <32 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <64 x i8> undef, <64 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <32 x i16> undef, <32 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <16 x i32> undef, <16 x i32>* undef, align 1 @@ -1303,7 +1303,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <16 x float> undef, <16 x float>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <8 x double> undef, <8 x double>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <8 x i8*> undef, <8 x i8*>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; SSE41-LABEL: 'stores_align1' @@ -1318,7 +1318,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store double undef, double* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i8* undef, i8** undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i1 undef, i1* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <16 x i8> undef, <16 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i16> undef, <8 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i32> undef, <4 x i32>* undef, align 1 @@ -1332,7 +1332,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i1> undef, <4 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i1> undef, <2 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i1> undef, <1 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 16 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <32 x i8> undef, <32 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <16 x i16> undef, <16 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x i32> undef, <8 x i32>* undef, align 1 @@ -1342,8 +1342,8 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x float> undef, <8 x float>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <4 x double> undef, <4 x double>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <4 x i8*> undef, <4 x i8*>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <32 x i1> undef, <32 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 32 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <32 x i1> undef, <32 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <64 x i8> undef, <64 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <32 x i16> undef, <32 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <16 x i32> undef, <16 x i32>* undef, align 1 @@ -1354,7 +1354,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <16 x float> undef, <16 x float>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <8 x double> undef, <8 x double>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <8 x i8*> undef, <8 x i8*>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX-LABEL: 'stores_align1' @@ -1369,7 +1369,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store double undef, double* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i8* undef, i8** undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i1 undef, i1* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <16 x i8> undef, <16 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i16> undef, <8 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i32> undef, <4 x i32>* undef, align 1 @@ -1383,7 +1383,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i1> undef, <4 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i1> undef, <2 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i1> undef, <1 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <32 x i8> undef, <32 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <16 x i16> undef, <16 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i32> undef, <8 x i32>* undef, align 1 @@ -1394,7 +1394,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x double> undef, <4 x double>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i8*> undef, <4 x i8*>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <32 x i1> undef, <32 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 16 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <64 x i8> undef, <64 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <32 x i16> undef, <32 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <16 x i32> undef, <16 x i32>* undef, align 1 @@ -1405,7 +1405,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <16 x float> undef, <16 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x double> undef, <8 x double>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x i8*> undef, <8 x i8*>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX512-LABEL: 'stores_align1' @@ -1533,10 +1533,10 @@ ; Partial vectors with i64 elements (doubles as pointer-sized tests)) ; SSE2-LABEL: 'stores_partial_align1' ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i64> undef, <1 x i64>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i64> undef, <6 x i64>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x double> undef, <1 x double>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <3 x double> undef, <3 x double>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x double> undef, <5 x double>* undef, align 1 @@ -1545,14 +1545,14 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i32> undef, <1 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i32> undef, <2 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <3 x i32> undef, <3 x i32>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i32> undef, <7 x i32>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i32> undef, <10 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <11 x i32> undef, <11 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i32> undef, <12 x i32>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i32> undef, <15 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x float> undef, <1 x float>* undef, align 1 @@ -1573,156 +1573,156 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i16> undef, <3 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i16> undef, <4 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i16> undef, <5 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i16> undef, <13 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <18 x i16> undef, <18 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i16> undef, <19 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <20 x i16> undef, <20 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i16> undef, <21 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i16> undef, <29 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i8> undef, <1 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i8> undef, <2 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <3 x i8> undef, <3 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i8> undef, <4 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i8> undef, <5 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i8> undef, <8 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i8> undef, <9 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i8> undef, <25 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <34 x i8> undef, <34 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <35 x i8> undef, <35 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <36 x i8> undef, <36 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <37 x i8> undef, <37 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i8> undef, <40 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <41 x i8> undef, <41 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 11 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i8> undef, <48 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <57 x i8> undef, <57 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 12 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i1> undef, <9 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i1> undef, <14 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x i1> undef, <14 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i1> undef, <25 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; SSE41-LABEL: 'stores_partial_align1' ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i64> undef, <1 x i64>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i64> undef, <6 x i64>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x double> undef, <1 x double>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <3 x double> undef, <3 x double>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x double> undef, <5 x double>* undef, align 1 @@ -1731,14 +1731,14 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i32> undef, <1 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i32> undef, <2 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i32> undef, <3 x i32>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i32> undef, <7 x i32>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i32> undef, <10 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i32> undef, <11 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i32> undef, <12 x i32>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i32> undef, <15 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x float> undef, <1 x float>* undef, align 1 @@ -1759,156 +1759,156 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i16> undef, <3 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i16> undef, <4 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i16> undef, <5 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i16> undef, <13 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <18 x i16> undef, <18 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i16> undef, <19 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <20 x i16> undef, <20 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i16> undef, <21 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i16> undef, <29 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i8> undef, <1 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i8> undef, <2 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i8> undef, <3 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i8> undef, <4 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i8> undef, <5 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i8> undef, <8 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i8> undef, <9 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <25 x i8> undef, <25 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <34 x i8> undef, <34 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <35 x i8> undef, <35 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <36 x i8> undef, <36 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <37 x i8> undef, <37 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i8> undef, <40 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <41 x i8> undef, <41 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i8> undef, <48 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i8> undef, <57 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i1> undef, <9 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i1> undef, <14 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <25 x i1> undef, <25 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX-LABEL: 'stores_partial_align1' ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i64> undef, <1 x i64>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i64> undef, <6 x i64>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x double> undef, <1 x double>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x double> undef, <3 x double>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <5 x double> undef, <5 x double>* undef, align 1 @@ -1918,361 +1918,361 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i32> undef, <2 x i32>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i32> undef, <3 x i32>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i32> undef, <7 x i32>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i32> undef, <10 x i32>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i32> undef, <11 x i32>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i32> undef, <12 x i32>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i32> undef, <15 x i32>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x float> undef, <1 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x float> undef, <2 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x float> undef, <3 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x float> undef, <5 x float>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x float> undef, <6 x float>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x float> undef, <6 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x float> undef, <7 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <9 x float> undef, <9 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x float> undef, <10 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x float> undef, <11 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x float> undef, <12 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x float> undef, <13 x float>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x float> undef, <14 x float>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x float> undef, <14 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x float> undef, <15 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i16> undef, <1 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i16> undef, <2 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i16> undef, <3 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i16> undef, <4 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i16> undef, <5 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i16> undef, <13 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i16> undef, <18 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <19 x i16> undef, <19 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i16> undef, <20 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <21 x i16> undef, <21 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i16> undef, <29 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i8> undef, <1 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i8> undef, <2 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i8> undef, <3 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i8> undef, <4 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i8> undef, <5 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i8> undef, <8 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i8> undef, <9 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i8> undef, <25 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i8> undef, <34 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <35 x i8> undef, <35 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i8> undef, <36 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <37 x i8> undef, <37 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i8> undef, <40 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <41 x i8> undef, <41 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i8> undef, <48 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i8> undef, <57 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i1> undef, <9 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i1> undef, <14 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i1> undef, <25 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX512-LABEL: 'stores_partial_align1' ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i64> undef, <1 x i64>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i64> undef, <6 x i64>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i64> undef, <6 x i64>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x double> undef, <1 x double>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x double> undef, <3 x double>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x double> undef, <5 x double>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x double> undef, <6 x double>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x double> undef, <7 x double>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x double> undef, <6 x double>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x double> undef, <7 x double>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i32> undef, <1 x i32>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i32> undef, <2 x i32>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i32> undef, <3 x i32>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i32> undef, <7 x i32>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i32> undef, <10 x i32>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i32> undef, <10 x i32>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i32> undef, <11 x i32>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i32> undef, <12 x i32>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i32> undef, <15 x i32>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i32> undef, <12 x i32>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i32> undef, <15 x i32>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x float> undef, <1 x float>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x float> undef, <2 x float>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x float> undef, <3 x float>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x float> undef, <5 x float>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x float> undef, <6 x float>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x float> undef, <6 x float>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x float> undef, <7 x float>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x float> undef, <9 x float>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x float> undef, <10 x float>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x float> undef, <10 x float>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x float> undef, <11 x float>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x float> undef, <12 x float>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x float> undef, <13 x float>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x float> undef, <14 x float>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x float> undef, <15 x float>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x float> undef, <12 x float>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x float> undef, <13 x float>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x float> undef, <14 x float>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x float> undef, <15 x float>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i16> undef, <1 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i16> undef, <2 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i16> undef, <3 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i16> undef, <4 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i16> undef, <5 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i16> undef, <13 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i16> undef, <18 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i16> undef, <19 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i16> undef, <20 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <18 x i16> undef, <18 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <19 x i16> undef, <19 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <20 x i16> undef, <20 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i16> undef, <21 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i16> undef, <29 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <29 x i16> undef, <29 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i8> undef, <1 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i8> undef, <2 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i8> undef, <3 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i8> undef, <4 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i8> undef, <5 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i8> undef, <8 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i8> undef, <9 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i8> undef, <25 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i8> undef, <34 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <35 x i8> undef, <35 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i8> undef, <36 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <37 x i8> undef, <37 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i8> undef, <40 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <34 x i8> undef, <34 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <35 x i8> undef, <35 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <36 x i8> undef, <36 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <37 x i8> undef, <37 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i8> undef, <40 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <41 x i8> undef, <41 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i8> undef, <48 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i8> undef, <57 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <9 x i1> undef, <9 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i8> undef, <48 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <57 x i8> undef, <57 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 11 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i1> undef, <9 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i1> undef, <14 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <25 x i1> undef, <25 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i1> undef, <25 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; store <1 x i64> undef, <1 x i64>* undef, align 1 @@ -2513,7 +2513,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store double undef, double* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i8* undef, i8** undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i1 undef, i1* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <16 x i8> undef, <16 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i16> undef, <8 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i32> undef, <4 x i32>* undef, align 64 @@ -2527,7 +2527,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i1> undef, <4 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i1> undef, <2 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i1> undef, <1 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 16 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <32 x i8> undef, <32 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <16 x i16> undef, <16 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x i32> undef, <8 x i32>* undef, align 64 @@ -2537,8 +2537,8 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x float> undef, <8 x float>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <4 x double> undef, <4 x double>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <4 x i8*> undef, <4 x i8*>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <32 x i1> undef, <32 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 32 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <32 x i1> undef, <32 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <64 x i8> undef, <64 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <32 x i16> undef, <32 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <16 x i32> undef, <16 x i32>* undef, align 64 @@ -2549,7 +2549,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <16 x float> undef, <16 x float>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <8 x double> undef, <8 x double>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <8 x i8*> undef, <8 x i8*>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; SSE41-LABEL: 'stores_align64' @@ -2564,7 +2564,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store double undef, double* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i8* undef, i8** undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i1 undef, i1* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <16 x i8> undef, <16 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i16> undef, <8 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i32> undef, <4 x i32>* undef, align 64 @@ -2578,7 +2578,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i1> undef, <4 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i1> undef, <2 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i1> undef, <1 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 16 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <32 x i8> undef, <32 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <16 x i16> undef, <16 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x i32> undef, <8 x i32>* undef, align 64 @@ -2588,8 +2588,8 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x float> undef, <8 x float>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <4 x double> undef, <4 x double>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <4 x i8*> undef, <4 x i8*>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <32 x i1> undef, <32 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 32 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <32 x i1> undef, <32 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <64 x i8> undef, <64 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <32 x i16> undef, <32 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <16 x i32> undef, <16 x i32>* undef, align 64 @@ -2600,7 +2600,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <16 x float> undef, <16 x float>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <8 x double> undef, <8 x double>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <8 x i8*> undef, <8 x i8*>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX-LABEL: 'stores_align64' @@ -2615,7 +2615,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store double undef, double* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i8* undef, i8** undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i1 undef, i1* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <128 x i1> undef, <128 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <16 x i8> undef, <16 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i16> undef, <8 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i32> undef, <4 x i32>* undef, align 64 @@ -2629,7 +2629,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i1> undef, <4 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i1> undef, <2 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i1> undef, <1 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <256 x i1> undef, <256 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <32 x i8> undef, <32 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <16 x i16> undef, <16 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i32> undef, <8 x i32>* undef, align 64 @@ -2640,7 +2640,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x double> undef, <4 x double>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i8*> undef, <4 x i8*>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <32 x i1> undef, <32 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 16 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <512 x i1> undef, <512 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <64 x i8> undef, <64 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <32 x i16> undef, <32 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <16 x i32> undef, <16 x i32>* undef, align 64 @@ -2651,7 +2651,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <16 x float> undef, <16 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x double> undef, <8 x double>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <8 x i8*> undef, <8 x i8*>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <64 x i1> undef, <64 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX512-LABEL: 'stores_align64' @@ -2779,10 +2779,10 @@ ; Partial vectors with i64 elements (doubles as pointer-sized tests)) ; SSE2-LABEL: 'stores_partial_align64' ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i64> undef, <1 x i64>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i64> undef, <6 x i64>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x double> undef, <1 x double>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <3 x double> undef, <3 x double>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x double> undef, <5 x double>* undef, align 64 @@ -2791,14 +2791,14 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i32> undef, <1 x i32>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i32> undef, <2 x i32>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <3 x i32> undef, <3 x i32>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i32> undef, <7 x i32>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i32> undef, <10 x i32>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <11 x i32> undef, <11 x i32>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i32> undef, <12 x i32>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i32> undef, <15 x i32>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x float> undef, <1 x float>* undef, align 64 @@ -2819,156 +2819,156 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i16> undef, <3 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i16> undef, <4 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i16> undef, <5 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i16> undef, <13 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <18 x i16> undef, <18 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i16> undef, <19 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <20 x i16> undef, <20 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i16> undef, <21 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i16> undef, <29 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i8> undef, <1 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i8> undef, <2 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <3 x i8> undef, <3 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i8> undef, <4 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i8> undef, <5 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i8> undef, <8 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i8> undef, <9 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i8> undef, <25 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <34 x i8> undef, <34 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <35 x i8> undef, <35 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <36 x i8> undef, <36 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <37 x i8> undef, <37 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i8> undef, <40 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <41 x i8> undef, <41 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 11 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i8> undef, <48 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <57 x i8> undef, <57 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 12 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i1> undef, <9 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i1> undef, <14 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x i1> undef, <14 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i1> undef, <25 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; SSE41-LABEL: 'stores_partial_align64' ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i64> undef, <1 x i64>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i64> undef, <6 x i64>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x double> undef, <1 x double>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <3 x double> undef, <3 x double>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x double> undef, <5 x double>* undef, align 64 @@ -2977,14 +2977,14 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i32> undef, <1 x i32>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i32> undef, <2 x i32>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i32> undef, <3 x i32>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i32> undef, <7 x i32>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i32> undef, <10 x i32>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i32> undef, <11 x i32>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i32> undef, <12 x i32>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i32> undef, <15 x i32>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x float> undef, <1 x float>* undef, align 64 @@ -3005,156 +3005,156 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i16> undef, <3 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i16> undef, <4 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i16> undef, <5 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i16> undef, <13 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <18 x i16> undef, <18 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i16> undef, <19 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <20 x i16> undef, <20 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i16> undef, <21 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i16> undef, <29 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i8> undef, <1 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i8> undef, <2 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i8> undef, <3 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i8> undef, <4 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i8> undef, <5 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i8> undef, <8 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i8> undef, <9 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <25 x i8> undef, <25 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <34 x i8> undef, <34 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <35 x i8> undef, <35 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <36 x i8> undef, <36 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <37 x i8> undef, <37 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i8> undef, <40 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <41 x i8> undef, <41 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i8> undef, <48 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i8> undef, <57 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i1> undef, <9 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i1> undef, <14 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <25 x i1> undef, <25 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX-LABEL: 'stores_partial_align64' ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i64> undef, <1 x i64>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i64> undef, <6 x i64>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x double> undef, <1 x double>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x double> undef, <3 x double>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <5 x double> undef, <5 x double>* undef, align 64 @@ -3164,361 +3164,361 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i32> undef, <2 x i32>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i32> undef, <3 x i32>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i32> undef, <7 x i32>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i32> undef, <10 x i32>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i32> undef, <11 x i32>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i32> undef, <12 x i32>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i32> undef, <15 x i32>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x float> undef, <1 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x float> undef, <2 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x float> undef, <3 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x float> undef, <5 x float>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x float> undef, <6 x float>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x float> undef, <6 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x float> undef, <7 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <9 x float> undef, <9 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x float> undef, <10 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x float> undef, <11 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x float> undef, <12 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x float> undef, <13 x float>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x float> undef, <14 x float>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <14 x float> undef, <14 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x float> undef, <15 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i16> undef, <1 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i16> undef, <2 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i16> undef, <3 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i16> undef, <4 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i16> undef, <5 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i16> undef, <13 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i16> undef, <18 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <19 x i16> undef, <19 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i16> undef, <20 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <21 x i16> undef, <21 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i16> undef, <29 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i8> undef, <1 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i8> undef, <2 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i8> undef, <3 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i8> undef, <4 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i8> undef, <5 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i8> undef, <8 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i8> undef, <9 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i8> undef, <25 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i8> undef, <34 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <35 x i8> undef, <35 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i8> undef, <36 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <37 x i8> undef, <37 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i8> undef, <40 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <41 x i8> undef, <41 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i8> undef, <48 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i8> undef, <57 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i1> undef, <9 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i1> undef, <14 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i1> undef, <25 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX512-LABEL: 'stores_partial_align64' ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i64> undef, <1 x i64>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i64> undef, <6 x i64>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i64> undef, <3 x i64>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i64> undef, <5 x i64>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i64> undef, <6 x i64>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i64> undef, <7 x i64>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x double> undef, <1 x double>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x double> undef, <3 x double>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x double> undef, <5 x double>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x double> undef, <6 x double>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x double> undef, <7 x double>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x double> undef, <6 x double>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x double> undef, <7 x double>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i32> undef, <1 x i32>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i32> undef, <2 x i32>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i32> undef, <3 x i32>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <5 x i32> undef, <5 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i32> undef, <6 x i32>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i32> undef, <7 x i32>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i32> undef, <9 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i32> undef, <10 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i32> undef, <10 x i32>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i32> undef, <11 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i32> undef, <12 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i32> undef, <15 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i32> undef, <12 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <13 x i32> undef, <13 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i32> undef, <14 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i32> undef, <15 x i32>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x float> undef, <1 x float>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x float> undef, <2 x float>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x float> undef, <3 x float>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x float> undef, <5 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x float> undef, <6 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x float> undef, <6 x float>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x float> undef, <7 x float>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x float> undef, <9 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x float> undef, <10 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x float> undef, <10 x float>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x float> undef, <11 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x float> undef, <12 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x float> undef, <13 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x float> undef, <14 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x float> undef, <15 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x float> undef, <12 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x float> undef, <13 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x float> undef, <14 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x float> undef, <15 x float>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i16> undef, <1 x i16>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i16> undef, <2 x i16>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i16> undef, <3 x i16>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i16> undef, <4 x i16>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i16> undef, <5 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i16> undef, <6 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i16> undef, <7 x i16>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <9 x i16> undef, <9 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <10 x i16> undef, <10 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <11 x i16> undef, <11 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i16> undef, <12 x i16>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i16> undef, <13 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i16> undef, <14 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i16> undef, <15 x i16>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i16> undef, <17 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i16> undef, <18 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i16> undef, <19 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i16> undef, <20 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <18 x i16> undef, <18 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <19 x i16> undef, <19 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <20 x i16> undef, <20 x i16>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i16> undef, <21 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i16> undef, <29 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <22 x i16> undef, <22 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <23 x i16> undef, <23 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i16> undef, <24 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <25 x i16> undef, <25 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <26 x i16> undef, <26 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <27 x i16> undef, <27 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i16> undef, <28 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <29 x i16> undef, <29 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <30 x i16> undef, <30 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <31 x i16> undef, <31 x i16>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <1 x i8> undef, <1 x i8>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <2 x i8> undef, <2 x i8>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <3 x i8> undef, <3 x i8>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i8> undef, <4 x i8>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <5 x i8> undef, <5 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <6 x i8> undef, <6 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <7 x i8> undef, <7 x i8>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <8 x i8> undef, <8 x i8>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i8> undef, <9 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i8> undef, <10 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <11 x i8> undef, <11 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i8> undef, <12 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <13 x i8> undef, <13 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <14 x i8> undef, <14 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <15 x i8> undef, <15 x i8>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <17 x i8> undef, <17 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <18 x i8> undef, <18 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <19 x i8> undef, <19 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <20 x i8> undef, <20 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <21 x i8> undef, <21 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <22 x i8> undef, <22 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <23 x i8> undef, <23 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i8> undef, <24 x i8>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i8> undef, <25 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i8> undef, <26 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <27 x i8> undef, <27 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i8> undef, <28 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <29 x i8> undef, <29 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <30 x i8> undef, <30 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <31 x i8> undef, <31 x i8>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <33 x i8> undef, <33 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i8> undef, <34 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <35 x i8> undef, <35 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i8> undef, <36 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <37 x i8> undef, <37 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i8> undef, <40 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <34 x i8> undef, <34 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <35 x i8> undef, <35 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <36 x i8> undef, <36 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <37 x i8> undef, <37 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <38 x i8> undef, <38 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <39 x i8> undef, <39 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i8> undef, <40 x i8>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <41 x i8> undef, <41 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i8> undef, <48 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <57 x i8> undef, <57 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <9 x i1> undef, <9 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <42 x i8> undef, <42 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <43 x i8> undef, <43 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <44 x i8> undef, <44 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <45 x i8> undef, <45 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <46 x i8> undef, <46 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <47 x i8> undef, <47 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i8> undef, <48 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <49 x i8> undef, <49 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <50 x i8> undef, <50 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <51 x i8> undef, <51 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <52 x i8> undef, <52 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <53 x i8> undef, <53 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: store <54 x i8> undef, <54 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 10 for instruction: store <55 x i8> undef, <55 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <56 x i8> undef, <56 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <57 x i8> undef, <57 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <58 x i8> undef, <58 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <59 x i8> undef, <59 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <60 x i8> undef, <60 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <61 x i8> undef, <61 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: store <62 x i8> undef, <62 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 11 for instruction: store <63 x i8> undef, <63 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <3 x i1> undef, <3 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <5 x i1> undef, <5 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <6 x i1> undef, <6 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <7 x i1> undef, <7 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <9 x i1> undef, <9 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <10 x i1> undef, <10 x i1>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <11 x i1> undef, <11 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <12 x i1> undef, <12 x i1>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <13 x i1> undef, <13 x i1>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <14 x i1> undef, <14 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <15 x i1> undef, <15 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <17 x i1> undef, <17 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <18 x i1> undef, <18 x i1>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <19 x i1> undef, <19 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <20 x i1> undef, <20 x i1>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <21 x i1> undef, <21 x i1>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <22 x i1> undef, <22 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <25 x i1> undef, <25 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <23 x i1> undef, <23 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <24 x i1> undef, <24 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <25 x i1> undef, <25 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <26 x i1> undef, <26 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <27 x i1> undef, <27 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <28 x i1> undef, <28 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <29 x i1> undef, <29 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <30 x i1> undef, <30 x i1>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <31 x i1> undef, <31 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <33 x i1> undef, <33 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <34 x i1> undef, <34 x i1>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <35 x i1> undef, <35 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <36 x i1> undef, <36 x i1>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <37 x i1> undef, <37 x i1>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <38 x i1> undef, <38 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <39 x i1> undef, <39 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <40 x i1> undef, <40 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <41 x i1> undef, <41 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <42 x i1> undef, <42 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <43 x i1> undef, <43 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <44 x i1> undef, <44 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <45 x i1> undef, <45 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <46 x i1> undef, <46 x i1>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <47 x i1> undef, <47 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <48 x i1> undef, <48 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <49 x i1> undef, <49 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <50 x i1> undef, <50 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <51 x i1> undef, <51 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <52 x i1> undef, <52 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <53 x i1> undef, <53 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <54 x i1> undef, <54 x i1>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <55 x i1> undef, <55 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <56 x i1> undef, <56 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <57 x i1> undef, <57 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <58 x i1> undef, <58 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <59 x i1> undef, <59 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <60 x i1> undef, <60 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <61 x i1> undef, <61 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <62 x i1> undef, <62 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: store <63 x i1> undef, <63 x i1>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; store <1 x i64> undef, <1 x i64>* undef, align 64 @@ -3759,7 +3759,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %9 = load double, double* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %10 = load i8*, i8** undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load i1*, i1** undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %13 = load <16 x i8>, <16 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %14 = load <8 x i16>, <8 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %15 = load <4 x i32>, <4 x i32>* undef, align 4 @@ -3773,7 +3773,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %23 = load <4 x i1>, <4 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <2 x i1>, <2 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <1 x i1>, <1 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %27 = load <32 x i8>, <32 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %28 = load <16 x i16>, <16 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %29 = load <8 x i32>, <8 x i32>* undef, align 4 @@ -3783,8 +3783,8 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %33 = load <8 x float>, <8 x float>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %34 = load <4 x double>, <4 x double>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %35 = load <4 x i8*>, <4 x i8*>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %36 = load <32 x i1>, <32 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 32 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %36 = load <32 x i1>, <32 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %38 = load <64 x i8>, <64 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %39 = load <32 x i16>, <32 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %40 = load <16 x i32>, <16 x i32>* undef, align 4 @@ -3795,7 +3795,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %45 = load <16 x float>, <16 x float>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %46 = load <8 x double>, <8 x double>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %47 = load <8 x i8*>, <8 x i8*>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; SSE41-LABEL: 'loads_align4' @@ -3810,7 +3810,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %9 = load double, double* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %10 = load i8*, i8** undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load i1*, i1** undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %13 = load <16 x i8>, <16 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %14 = load <8 x i16>, <8 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %15 = load <4 x i32>, <4 x i32>* undef, align 4 @@ -3824,7 +3824,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %23 = load <4 x i1>, <4 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <2 x i1>, <2 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <1 x i1>, <1 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %27 = load <32 x i8>, <32 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %28 = load <16 x i16>, <16 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %29 = load <8 x i32>, <8 x i32>* undef, align 4 @@ -3834,8 +3834,8 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %33 = load <8 x float>, <8 x float>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %34 = load <4 x double>, <4 x double>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %35 = load <4 x i8*>, <4 x i8*>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %36 = load <32 x i1>, <32 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 32 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %36 = load <32 x i1>, <32 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %38 = load <64 x i8>, <64 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %39 = load <32 x i16>, <32 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %40 = load <16 x i32>, <16 x i32>* undef, align 4 @@ -3846,7 +3846,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %45 = load <16 x float>, <16 x float>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %46 = load <8 x double>, <8 x double>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %47 = load <8 x i8*>, <8 x i8*>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX-LABEL: 'loads_align4' @@ -3861,7 +3861,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %9 = load double, double* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %10 = load i8*, i8** undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load i1*, i1** undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %13 = load <16 x i8>, <16 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %14 = load <8 x i16>, <8 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %15 = load <4 x i32>, <4 x i32>* undef, align 4 @@ -3875,7 +3875,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %23 = load <4 x i1>, <4 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <2 x i1>, <2 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <1 x i1>, <1 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %27 = load <32 x i8>, <32 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %28 = load <16 x i16>, <16 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %29 = load <8 x i32>, <8 x i32>* undef, align 4 @@ -3886,7 +3886,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %34 = load <4 x double>, <4 x double>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %35 = load <4 x i8*>, <4 x i8*>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %36 = load <32 x i1>, <32 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %38 = load <64 x i8>, <64 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %39 = load <32 x i16>, <32 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %40 = load <16 x i32>, <16 x i32>* undef, align 4 @@ -3897,7 +3897,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %45 = load <16 x float>, <16 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %46 = load <8 x double>, <8 x double>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %47 = load <8 x i8*>, <8 x i8*>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX512-LABEL: 'loads_align4' @@ -4025,212 +4025,212 @@ ; Partial vectors with i64 elements (doubles as pointer-sized tests)) ; SSE2-LABEL: 'loads_partial_align4' ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %1 = load <1 x i64>, <1 x i64>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %4 = load <6 x i64>, <6 x i64>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %6 = load <1 x double>, <1 x double>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %9 = load <6 x double>, <6 x double>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load <1 x i32>, <1 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <2 x i32>, <2 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %13 = load <3 x i32>, <3 x i32>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %18 = load <10 x i32>, <10 x i32>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %20 = load <12 x i32>, <12 x i32>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <1 x float>, <1 x float>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <2 x float>, <2 x float>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %26 = load <3 x float>, <3 x float>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %28 = load <6 x float>, <6 x float>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 15 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %31 = load <10 x float>, <10 x float>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %33 = load <12 x float>, <12 x float>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %35 = load <14 x float>, <14 x float>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %37 = load <1 x i16>, <1 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %38 = load <2 x i16>, <2 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %40 = load <4 x i16>, <4 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 11 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %52 = load <18 x i16>, <18 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %54 = load <20 x i16>, <20 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 13 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %58 = load <24 x i16>, <24 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 14 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %66 = load <1 x i8>, <1 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %67 = load <2 x i8>, <2 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %69 = load <4 x i8>, <4 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 11 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %73 = load <8 x i8>, <8 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 11 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 11 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 11 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 36 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 64 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %97 = load <34 x i8>, <34 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %99 = load <36 x i8>, <36 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %103 = load <40 x i8>, <40 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 13 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 13 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 13 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %111 = load <48 x i8>, <48 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 68 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 36 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 64 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 4 -; SSE2-NEXT: Cost Model: Found an estimated cost of 68 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 14 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 14 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 14 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 4 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 4 ; SSE2-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; SSE41-LABEL: 'loads_partial_align4' ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %1 = load <1 x i64>, <1 x i64>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %4 = load <6 x i64>, <6 x i64>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %6 = load <1 x double>, <1 x double>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %9 = load <6 x double>, <6 x double>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load <1 x i32>, <1 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <2 x i32>, <2 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %13 = load <3 x i32>, <3 x i32>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %18 = load <10 x i32>, <10 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %20 = load <12 x i32>, <12 x i32>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <1 x float>, <1 x float>* undef, align 4 @@ -4251,520 +4251,520 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %40 = load <4 x i16>, <4 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %52 = load <18 x i16>, <18 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %54 = load <20 x i16>, <20 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %58 = load <24 x i16>, <24 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %66 = load <1 x i8>, <1 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %67 = load <2 x i8>, <2 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %69 = load <4 x i8>, <4 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %73 = load <8 x i8>, <8 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %97 = load <34 x i8>, <34 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %99 = load <36 x i8>, <36 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %103 = load <40 x i8>, <40 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %111 = load <48 x i8>, <48 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 4 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 4 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 4 ; SSE41-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX-LABEL: 'loads_partial_align4' ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %1 = load <1 x i64>, <1 x i64>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %4 = load <6 x i64>, <6 x i64>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %6 = load <1 x double>, <1 x double>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %9 = load <6 x double>, <6 x double>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load <1 x i32>, <1 x i32>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <2 x i32>, <2 x i32>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %13 = load <3 x i32>, <3 x i32>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %18 = load <10 x i32>, <10 x i32>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %20 = load <12 x i32>, <12 x i32>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <1 x float>, <1 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <2 x float>, <2 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %26 = load <3 x float>, <3 x float>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %28 = load <6 x float>, <6 x float>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %28 = load <6 x float>, <6 x float>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %31 = load <10 x float>, <10 x float>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %33 = load <12 x float>, <12 x float>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %35 = load <14 x float>, <14 x float>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %35 = load <14 x float>, <14 x float>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %37 = load <1 x i16>, <1 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %38 = load <2 x i16>, <2 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %40 = load <4 x i16>, <4 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %52 = load <18 x i16>, <18 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %54 = load <20 x i16>, <20 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %58 = load <24 x i16>, <24 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %66 = load <1 x i8>, <1 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %67 = load <2 x i8>, <2 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %69 = load <4 x i8>, <4 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %73 = load <8 x i8>, <8 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %97 = load <34 x i8>, <34 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %99 = load <36 x i8>, <36 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %103 = load <40 x i8>, <40 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %111 = load <48 x i8>, <48 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 4 -; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 4 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 4 ; AVX-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX512-LABEL: 'loads_partial_align4' ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %1 = load <1 x i64>, <1 x i64>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %4 = load <6 x i64>, <6 x i64>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %4 = load <6 x i64>, <6 x i64>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %6 = load <1 x double>, <1 x double>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %9 = load <6 x double>, <6 x double>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %9 = load <6 x double>, <6 x double>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load <1 x i32>, <1 x i32>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <2 x i32>, <2 x i32>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %13 = load <3 x i32>, <3 x i32>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %18 = load <10 x i32>, <10 x i32>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %20 = load <12 x i32>, <12 x i32>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %18 = load <10 x i32>, <10 x i32>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %20 = load <12 x i32>, <12 x i32>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <1 x float>, <1 x float>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <2 x float>, <2 x float>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %26 = load <3 x float>, <3 x float>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %28 = load <6 x float>, <6 x float>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %31 = load <10 x float>, <10 x float>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %33 = load <12 x float>, <12 x float>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %28 = load <6 x float>, <6 x float>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %31 = load <10 x float>, <10 x float>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %33 = load <12 x float>, <12 x float>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %35 = load <14 x float>, <14 x float>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %35 = load <14 x float>, <14 x float>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %37 = load <1 x i16>, <1 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %38 = load <2 x i16>, <2 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %40 = load <4 x i16>, <4 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %52 = load <18 x i16>, <18 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %52 = load <18 x i16>, <18 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %54 = load <20 x i16>, <20 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %54 = load <20 x i16>, <20 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %58 = load <24 x i16>, <24 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %58 = load <24 x i16>, <24 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %66 = load <1 x i8>, <1 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %67 = load <2 x i8>, <2 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %69 = load <4 x i8>, <4 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %73 = load <8 x i8>, <8 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %97 = load <34 x i8>, <34 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %99 = load <36 x i8>, <36 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %97 = load <34 x i8>, <34 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %99 = load <36 x i8>, <36 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %103 = load <40 x i8>, <40 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %103 = load <40 x i8>, <40 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %111 = load <48 x i8>, <48 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %111 = load <48 x i8>, <48 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 4 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 4 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 4 ; AVX512-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; load <1 x i64>, <1 x i64>* undef, align 4 @@ -5005,7 +5005,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %9 = load double, double* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %10 = load i8*, i8** undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load i1*, i1** undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %13 = load <16 x i8>, <16 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %14 = load <8 x i16>, <8 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %15 = load <4 x i32>, <4 x i32>* undef, align 1 @@ -5019,7 +5019,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %23 = load <4 x i1>, <4 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <2 x i1>, <2 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <1 x i1>, <1 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %27 = load <32 x i8>, <32 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %28 = load <16 x i16>, <16 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %29 = load <8 x i32>, <8 x i32>* undef, align 1 @@ -5029,8 +5029,8 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %33 = load <8 x float>, <8 x float>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %34 = load <4 x double>, <4 x double>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %35 = load <4 x i8*>, <4 x i8*>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %36 = load <32 x i1>, <32 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 32 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %36 = load <32 x i1>, <32 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %38 = load <64 x i8>, <64 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %39 = load <32 x i16>, <32 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %40 = load <16 x i32>, <16 x i32>* undef, align 1 @@ -5041,7 +5041,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %45 = load <16 x float>, <16 x float>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %46 = load <8 x double>, <8 x double>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %47 = load <8 x i8*>, <8 x i8*>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; SSE41-LABEL: 'loads_align1' @@ -5056,7 +5056,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %9 = load double, double* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %10 = load i8*, i8** undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load i1*, i1** undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %13 = load <16 x i8>, <16 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %14 = load <8 x i16>, <8 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %15 = load <4 x i32>, <4 x i32>* undef, align 1 @@ -5070,7 +5070,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %23 = load <4 x i1>, <4 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <2 x i1>, <2 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <1 x i1>, <1 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %27 = load <32 x i8>, <32 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %28 = load <16 x i16>, <16 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %29 = load <8 x i32>, <8 x i32>* undef, align 1 @@ -5080,8 +5080,8 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %33 = load <8 x float>, <8 x float>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %34 = load <4 x double>, <4 x double>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %35 = load <4 x i8*>, <4 x i8*>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %36 = load <32 x i1>, <32 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 32 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %36 = load <32 x i1>, <32 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %38 = load <64 x i8>, <64 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %39 = load <32 x i16>, <32 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %40 = load <16 x i32>, <16 x i32>* undef, align 1 @@ -5092,7 +5092,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %45 = load <16 x float>, <16 x float>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %46 = load <8 x double>, <8 x double>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %47 = load <8 x i8*>, <8 x i8*>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX-LABEL: 'loads_align1' @@ -5107,7 +5107,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %9 = load double, double* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %10 = load i8*, i8** undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load i1*, i1** undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %13 = load <16 x i8>, <16 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %14 = load <8 x i16>, <8 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %15 = load <4 x i32>, <4 x i32>* undef, align 1 @@ -5121,7 +5121,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %23 = load <4 x i1>, <4 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <2 x i1>, <2 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <1 x i1>, <1 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %27 = load <32 x i8>, <32 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %28 = load <16 x i16>, <16 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %29 = load <8 x i32>, <8 x i32>* undef, align 1 @@ -5132,7 +5132,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %34 = load <4 x double>, <4 x double>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %35 = load <4 x i8*>, <4 x i8*>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %36 = load <32 x i1>, <32 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %38 = load <64 x i8>, <64 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %39 = load <32 x i16>, <32 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %40 = load <16 x i32>, <16 x i32>* undef, align 1 @@ -5143,7 +5143,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %45 = load <16 x float>, <16 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %46 = load <8 x double>, <8 x double>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %47 = load <8 x i8*>, <8 x i8*>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX512-LABEL: 'loads_align1' @@ -5271,212 +5271,212 @@ ; Partial vectors with i64 elements (doubles as pointer-sized tests)) ; SSE2-LABEL: 'loads_partial_align1' ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %1 = load <1 x i64>, <1 x i64>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %4 = load <6 x i64>, <6 x i64>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %6 = load <1 x double>, <1 x double>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %9 = load <6 x double>, <6 x double>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load <1 x i32>, <1 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <2 x i32>, <2 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %13 = load <3 x i32>, <3 x i32>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %18 = load <10 x i32>, <10 x i32>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %20 = load <12 x i32>, <12 x i32>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <1 x float>, <1 x float>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <2 x float>, <2 x float>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %26 = load <3 x float>, <3 x float>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %28 = load <6 x float>, <6 x float>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 15 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %31 = load <10 x float>, <10 x float>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %33 = load <12 x float>, <12 x float>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %35 = load <14 x float>, <14 x float>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %37 = load <1 x i16>, <1 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %38 = load <2 x i16>, <2 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %40 = load <4 x i16>, <4 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %52 = load <18 x i16>, <18 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %54 = load <20 x i16>, <20 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %58 = load <24 x i16>, <24 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 11 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %66 = load <1 x i8>, <1 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %67 = load <2 x i8>, <2 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %69 = load <4 x i8>, <4 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 11 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %73 = load <8 x i8>, <8 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 23 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 25 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 21 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 36 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 64 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 21 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 24 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 26 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %97 = load <34 x i8>, <34 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %99 = load <36 x i8>, <36 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 22 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %103 = load <40 x i8>, <40 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 22 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 25 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 27 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %111 = load <48 x i8>, <48 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 21 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 21 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 23 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 68 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 21 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 23 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 26 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 11 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 28 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 36 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 64 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 1 -; SSE2-NEXT: Cost Model: Found an estimated cost of 68 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 1 +; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 1 ; SSE2-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; SSE41-LABEL: 'loads_partial_align1' ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %1 = load <1 x i64>, <1 x i64>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %4 = load <6 x i64>, <6 x i64>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %6 = load <1 x double>, <1 x double>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %9 = load <6 x double>, <6 x double>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load <1 x i32>, <1 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <2 x i32>, <2 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %13 = load <3 x i32>, <3 x i32>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %18 = load <10 x i32>, <10 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %20 = load <12 x i32>, <12 x i32>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <1 x float>, <1 x float>* undef, align 1 @@ -5497,520 +5497,520 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %40 = load <4 x i16>, <4 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %52 = load <18 x i16>, <18 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %54 = load <20 x i16>, <20 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %58 = load <24 x i16>, <24 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %66 = load <1 x i8>, <1 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %67 = load <2 x i8>, <2 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %69 = load <4 x i8>, <4 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %73 = load <8 x i8>, <8 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %97 = load <34 x i8>, <34 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %99 = load <36 x i8>, <36 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %103 = load <40 x i8>, <40 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %111 = load <48 x i8>, <48 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 1 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 1 +; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 1 ; SSE41-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX-LABEL: 'loads_partial_align1' ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %1 = load <1 x i64>, <1 x i64>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %4 = load <6 x i64>, <6 x i64>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %6 = load <1 x double>, <1 x double>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %9 = load <6 x double>, <6 x double>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load <1 x i32>, <1 x i32>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <2 x i32>, <2 x i32>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %13 = load <3 x i32>, <3 x i32>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %18 = load <10 x i32>, <10 x i32>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %20 = load <12 x i32>, <12 x i32>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <1 x float>, <1 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <2 x float>, <2 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %26 = load <3 x float>, <3 x float>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %28 = load <6 x float>, <6 x float>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %28 = load <6 x float>, <6 x float>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %31 = load <10 x float>, <10 x float>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %33 = load <12 x float>, <12 x float>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %35 = load <14 x float>, <14 x float>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %35 = load <14 x float>, <14 x float>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %37 = load <1 x i16>, <1 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %38 = load <2 x i16>, <2 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %40 = load <4 x i16>, <4 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %52 = load <18 x i16>, <18 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %54 = load <20 x i16>, <20 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %58 = load <24 x i16>, <24 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %66 = load <1 x i8>, <1 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %67 = load <2 x i8>, <2 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %69 = load <4 x i8>, <4 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %73 = load <8 x i8>, <8 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %97 = load <34 x i8>, <34 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %99 = load <36 x i8>, <36 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %103 = load <40 x i8>, <40 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %111 = load <48 x i8>, <48 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 1 -; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 1 +; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 1 ; AVX-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX512-LABEL: 'loads_partial_align1' ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %1 = load <1 x i64>, <1 x i64>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %4 = load <6 x i64>, <6 x i64>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %4 = load <6 x i64>, <6 x i64>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %6 = load <1 x double>, <1 x double>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %9 = load <6 x double>, <6 x double>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %9 = load <6 x double>, <6 x double>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load <1 x i32>, <1 x i32>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <2 x i32>, <2 x i32>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %13 = load <3 x i32>, <3 x i32>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %18 = load <10 x i32>, <10 x i32>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %20 = load <12 x i32>, <12 x i32>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %18 = load <10 x i32>, <10 x i32>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %20 = load <12 x i32>, <12 x i32>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <1 x float>, <1 x float>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <2 x float>, <2 x float>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %26 = load <3 x float>, <3 x float>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %28 = load <6 x float>, <6 x float>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %31 = load <10 x float>, <10 x float>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %33 = load <12 x float>, <12 x float>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %28 = load <6 x float>, <6 x float>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %31 = load <10 x float>, <10 x float>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %33 = load <12 x float>, <12 x float>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %35 = load <14 x float>, <14 x float>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %35 = load <14 x float>, <14 x float>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %37 = load <1 x i16>, <1 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %38 = load <2 x i16>, <2 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %40 = load <4 x i16>, <4 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %52 = load <18 x i16>, <18 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %52 = load <18 x i16>, <18 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %54 = load <20 x i16>, <20 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %54 = load <20 x i16>, <20 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %58 = load <24 x i16>, <24 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %58 = load <24 x i16>, <24 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %66 = load <1 x i8>, <1 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %67 = load <2 x i8>, <2 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %69 = load <4 x i8>, <4 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %73 = load <8 x i8>, <8 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %97 = load <34 x i8>, <34 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %97 = load <34 x i8>, <34 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %99 = load <36 x i8>, <36 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %99 = load <36 x i8>, <36 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %103 = load <40 x i8>, <40 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %103 = load <40 x i8>, <40 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %111 = load <48 x i8>, <48 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %111 = load <48 x i8>, <48 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 11 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 1 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 1 +; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 1 ; AVX512-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; load <1 x i64>, <1 x i64>* undef, align 1 @@ -6251,7 +6251,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %9 = load double, double* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %10 = load i8*, i8** undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load i1*, i1** undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %13 = load <16 x i8>, <16 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %14 = load <8 x i16>, <8 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %15 = load <4 x i32>, <4 x i32>* undef, align 64 @@ -6265,7 +6265,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %23 = load <4 x i1>, <4 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <2 x i1>, <2 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <1 x i1>, <1 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %27 = load <32 x i8>, <32 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %28 = load <16 x i16>, <16 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %29 = load <8 x i32>, <8 x i32>* undef, align 64 @@ -6275,8 +6275,8 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %33 = load <8 x float>, <8 x float>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %34 = load <4 x double>, <4 x double>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %35 = load <4 x i8*>, <4 x i8*>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %36 = load <32 x i1>, <32 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 32 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %36 = load <32 x i1>, <32 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %38 = load <64 x i8>, <64 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %39 = load <32 x i16>, <32 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %40 = load <16 x i32>, <16 x i32>* undef, align 64 @@ -6287,7 +6287,7 @@ ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %45 = load <16 x float>, <16 x float>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %46 = load <8 x double>, <8 x double>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %47 = load <8 x i8*>, <8 x i8*>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; SSE41-LABEL: 'loads_align64' @@ -6302,7 +6302,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %9 = load double, double* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %10 = load i8*, i8** undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load i1*, i1** undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %13 = load <16 x i8>, <16 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %14 = load <8 x i16>, <8 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %15 = load <4 x i32>, <4 x i32>* undef, align 64 @@ -6316,7 +6316,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %23 = load <4 x i1>, <4 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <2 x i1>, <2 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <1 x i1>, <1 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %27 = load <32 x i8>, <32 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %28 = load <16 x i16>, <16 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %29 = load <8 x i32>, <8 x i32>* undef, align 64 @@ -6326,8 +6326,8 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %33 = load <8 x float>, <8 x float>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %34 = load <4 x double>, <4 x double>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %35 = load <4 x i8*>, <4 x i8*>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %36 = load <32 x i1>, <32 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 32 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %36 = load <32 x i1>, <32 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %38 = load <64 x i8>, <64 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %39 = load <32 x i16>, <32 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %40 = load <16 x i32>, <16 x i32>* undef, align 64 @@ -6338,7 +6338,7 @@ ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %45 = load <16 x float>, <16 x float>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %46 = load <8 x double>, <8 x double>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %47 = load <8 x i8*>, <8 x i8*>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX-LABEL: 'loads_align64' @@ -6353,7 +6353,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %9 = load double, double* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %10 = load i8*, i8** undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load i1*, i1** undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <128 x i1>, <128 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %13 = load <16 x i8>, <16 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %14 = load <8 x i16>, <8 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %15 = load <4 x i32>, <4 x i32>* undef, align 64 @@ -6367,7 +6367,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %23 = load <4 x i1>, <4 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <2 x i1>, <2 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <1 x i1>, <1 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %26 = load <256 x i1>, <256 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %27 = load <32 x i8>, <32 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %28 = load <16 x i16>, <16 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %29 = load <8 x i32>, <8 x i32>* undef, align 64 @@ -6378,7 +6378,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %34 = load <4 x double>, <4 x double>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %35 = load <4 x i8*>, <4 x i8*>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %36 = load <32 x i1>, <32 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %37 = load <512 x i1>, <512 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %38 = load <64 x i8>, <64 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %39 = load <32 x i16>, <32 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %40 = load <16 x i32>, <16 x i32>* undef, align 64 @@ -6389,7 +6389,7 @@ ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %45 = load <16 x float>, <16 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %46 = load <8 x double>, <8 x double>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %47 = load <8 x i8*>, <8 x i8*>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %48 = load <64 x i1>, <64 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX512-LABEL: 'loads_align64' @@ -6517,746 +6517,746 @@ ; Partial vectors with i64 elements (doubles as pointer-sized tests)) ; SSE2-LABEL: 'loads_partial_align64' ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %1 = load <1 x i64>, <1 x i64>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %4 = load <6 x i64>, <6 x i64>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %6 = load <1 x double>, <1 x double>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %9 = load <6 x double>, <6 x double>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load <1 x i32>, <1 x i32>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <2 x i32>, <2 x i32>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %13 = load <3 x i32>, <3 x i32>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %13 = load <3 x i32>, <3 x i32>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %18 = load <10 x i32>, <10 x i32>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %20 = load <12 x i32>, <12 x i32>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <1 x float>, <1 x float>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <2 x float>, <2 x float>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %26 = load <3 x float>, <3 x float>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %26 = load <3 x float>, <3 x float>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %28 = load <6 x float>, <6 x float>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 15 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %31 = load <10 x float>, <10 x float>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %33 = load <12 x float>, <12 x float>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 16 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %35 = load <14 x float>, <14 x float>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %37 = load <1 x i16>, <1 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %38 = load <2 x i16>, <2 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %40 = load <4 x i16>, <4 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %52 = load <18 x i16>, <18 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %54 = load <20 x i16>, <20 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %58 = load <24 x i16>, <24 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %66 = load <1 x i8>, <1 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %67 = load <2 x i8>, <2 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %69 = load <4 x i8>, <4 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 11 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %73 = load <8 x i8>, <8 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 36 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 64 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %97 = load <34 x i8>, <34 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %99 = load <36 x i8>, <36 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %103 = load <40 x i8>, <40 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %111 = load <48 x i8>, <48 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 68 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 18 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 19 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 20 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 34 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 35 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 36 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 64 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 67 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 64 -; SSE2-NEXT: Cost Model: Found an estimated cost of 68 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 64 +; SSE2-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 64 ; SSE2-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; SSE41-LABEL: 'loads_partial_align64' ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %1 = load <1 x i64>, <1 x i64>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %4 = load <6 x i64>, <6 x i64>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %6 = load <1 x double>, <1 x double>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %9 = load <6 x double>, <6 x double>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load <1 x i32>, <1 x i32>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <2 x i32>, <2 x i32>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %13 = load <3 x i32>, <3 x i32>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %13 = load <3 x i32>, <3 x i32>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %18 = load <10 x i32>, <10 x i32>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %20 = load <12 x i32>, <12 x i32>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <1 x float>, <1 x float>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <2 x float>, <2 x float>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %26 = load <3 x float>, <3 x float>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %26 = load <3 x float>, <3 x float>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %28 = load <6 x float>, <6 x float>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %31 = load <10 x float>, <10 x float>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %33 = load <12 x float>, <12 x float>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %35 = load <14 x float>, <14 x float>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %37 = load <1 x i16>, <1 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %38 = load <2 x i16>, <2 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %40 = load <4 x i16>, <4 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %52 = load <18 x i16>, <18 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %54 = load <20 x i16>, <20 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %58 = load <24 x i16>, <24 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %66 = load <1 x i8>, <1 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %67 = load <2 x i8>, <2 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %69 = load <4 x i8>, <4 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %73 = load <8 x i8>, <8 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %97 = load <34 x i8>, <34 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %99 = load <36 x i8>, <36 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %103 = load <40 x i8>, <40 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %111 = load <48 x i8>, <48 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 64 -; SSE41-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 64 +; SSE41-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 64 ; SSE41-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX-LABEL: 'loads_partial_align64' ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %1 = load <1 x i64>, <1 x i64>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %4 = load <6 x i64>, <6 x i64>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %6 = load <1 x double>, <1 x double>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %9 = load <6 x double>, <6 x double>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load <1 x i32>, <1 x i32>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <2 x i32>, <2 x i32>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %13 = load <3 x i32>, <3 x i32>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %13 = load <3 x i32>, <3 x i32>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %18 = load <10 x i32>, <10 x i32>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %20 = load <12 x i32>, <12 x i32>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <1 x float>, <1 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <2 x float>, <2 x float>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %26 = load <3 x float>, <3 x float>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %28 = load <6 x float>, <6 x float>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %26 = load <3 x float>, <3 x float>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %28 = load <6 x float>, <6 x float>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %31 = load <10 x float>, <10 x float>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %33 = load <12 x float>, <12 x float>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %35 = load <14 x float>, <14 x float>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %35 = load <14 x float>, <14 x float>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %37 = load <1 x i16>, <1 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %38 = load <2 x i16>, <2 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %40 = load <4 x i16>, <4 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %52 = load <18 x i16>, <18 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %54 = load <20 x i16>, <20 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %58 = load <24 x i16>, <24 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %66 = load <1 x i8>, <1 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %67 = load <2 x i8>, <2 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %69 = load <4 x i8>, <4 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %73 = load <8 x i8>, <8 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %97 = load <34 x i8>, <34 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %99 = load <36 x i8>, <36 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %103 = load <40 x i8>, <40 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %111 = load <48 x i8>, <48 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 64 -; AVX-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 64 +; AVX-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 64 ; AVX-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; ; AVX512-LABEL: 'loads_partial_align64' ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %1 = load <1 x i64>, <1 x i64>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %4 = load <6 x i64>, <6 x i64>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %2 = load <3 x i64>, <3 x i64>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %3 = load <5 x i64>, <5 x i64>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %4 = load <6 x i64>, <6 x i64>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %5 = load <7 x i64>, <7 x i64>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %6 = load <1 x double>, <1 x double>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %9 = load <6 x double>, <6 x double>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %7 = load <3 x double>, <3 x double>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %8 = load <5 x double>, <5 x double>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %9 = load <6 x double>, <6 x double>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %10 = load <7 x double>, <7 x double>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %11 = load <1 x i32>, <1 x i32>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %12 = load <2 x i32>, <2 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %13 = load <3 x i32>, <3 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %18 = load <10 x i32>, <10 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %20 = load <12 x i32>, <12 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %13 = load <3 x i32>, <3 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %14 = load <5 x i32>, <5 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %15 = load <6 x i32>, <6 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %16 = load <7 x i32>, <7 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %17 = load <9 x i32>, <9 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %18 = load <10 x i32>, <10 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %19 = load <11 x i32>, <11 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %20 = load <12 x i32>, <12 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %21 = load <13 x i32>, <13 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %22 = load <14 x i32>, <14 x i32>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %23 = load <15 x i32>, <15 x i32>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %24 = load <1 x float>, <1 x float>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %25 = load <2 x float>, <2 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %26 = load <3 x float>, <3 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %28 = load <6 x float>, <6 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %31 = load <10 x float>, <10 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %33 = load <12 x float>, <12 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %35 = load <14 x float>, <14 x float>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %26 = load <3 x float>, <3 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %27 = load <5 x float>, <5 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %28 = load <6 x float>, <6 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %29 = load <7 x float>, <7 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %30 = load <9 x float>, <9 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %31 = load <10 x float>, <10 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %32 = load <11 x float>, <11 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %33 = load <12 x float>, <12 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %34 = load <13 x float>, <13 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %35 = load <14 x float>, <14 x float>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %36 = load <15 x float>, <15 x float>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %37 = load <1 x i16>, <1 x i16>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %38 = load <2 x i16>, <2 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %39 = load <3 x i16>, <3 x i16>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %40 = load <4 x i16>, <4 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %52 = load <18 x i16>, <18 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %54 = load <20 x i16>, <20 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %58 = load <24 x i16>, <24 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %41 = load <5 x i16>, <5 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %42 = load <6 x i16>, <6 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %43 = load <7 x i16>, <7 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %44 = load <9 x i16>, <9 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %45 = load <10 x i16>, <10 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %46 = load <11 x i16>, <11 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %47 = load <12 x i16>, <12 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %48 = load <13 x i16>, <13 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %49 = load <14 x i16>, <14 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %50 = load <15 x i16>, <15 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %51 = load <17 x i16>, <17 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %52 = load <18 x i16>, <18 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %53 = load <19 x i16>, <19 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %54 = load <20 x i16>, <20 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %55 = load <21 x i16>, <21 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %56 = load <22 x i16>, <22 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %57 = load <23 x i16>, <23 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %58 = load <24 x i16>, <24 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %59 = load <25 x i16>, <25 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %60 = load <26 x i16>, <26 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %61 = load <27 x i16>, <27 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %62 = load <28 x i16>, <28 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %63 = load <29 x i16>, <29 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %64 = load <30 x i16>, <30 x i16>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %65 = load <31 x i16>, <31 x i16>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %66 = load <1 x i8>, <1 x i8>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %67 = load <2 x i8>, <2 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %68 = load <3 x i8>, <3 x i8>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %69 = load <4 x i8>, <4 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %70 = load <5 x i8>, <5 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %71 = load <6 x i8>, <6 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %72 = load <7 x i8>, <7 x i8>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %73 = load <8 x i8>, <8 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %97 = load <34 x i8>, <34 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %99 = load <36 x i8>, <36 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %103 = load <40 x i8>, <40 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %111 = load <48 x i8>, <48 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 64 -; AVX512-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %74 = load <9 x i8>, <9 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %75 = load <10 x i8>, <10 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %76 = load <11 x i8>, <11 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %77 = load <12 x i8>, <12 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %78 = load <13 x i8>, <13 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %79 = load <14 x i8>, <14 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %80 = load <15 x i8>, <15 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %81 = load <17 x i8>, <17 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %82 = load <18 x i8>, <18 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %83 = load <19 x i8>, <19 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %84 = load <20 x i8>, <20 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %85 = load <21 x i8>, <21 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %86 = load <22 x i8>, <22 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %87 = load <23 x i8>, <23 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %88 = load <24 x i8>, <24 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %89 = load <25 x i8>, <25 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %90 = load <26 x i8>, <26 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %91 = load <27 x i8>, <27 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %92 = load <28 x i8>, <28 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %93 = load <29 x i8>, <29 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %94 = load <30 x i8>, <30 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %95 = load <31 x i8>, <31 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %96 = load <33 x i8>, <33 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %97 = load <34 x i8>, <34 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %98 = load <35 x i8>, <35 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %99 = load <36 x i8>, <36 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %100 = load <37 x i8>, <37 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %101 = load <38 x i8>, <38 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %102 = load <39 x i8>, <39 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %103 = load <40 x i8>, <40 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %104 = load <41 x i8>, <41 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %105 = load <42 x i8>, <42 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %106 = load <43 x i8>, <43 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %107 = load <44 x i8>, <44 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %108 = load <45 x i8>, <45 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %109 = load <46 x i8>, <46 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %110 = load <47 x i8>, <47 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %111 = load <48 x i8>, <48 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %112 = load <49 x i8>, <49 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %113 = load <50 x i8>, <50 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %114 = load <51 x i8>, <51 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %115 = load <52 x i8>, <52 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %116 = load <53 x i8>, <53 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %117 = load <54 x i8>, <54 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %118 = load <55 x i8>, <55 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %119 = load <56 x i8>, <56 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %120 = load <57 x i8>, <57 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %121 = load <58 x i8>, <58 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %122 = load <59 x i8>, <59 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %123 = load <60 x i8>, <60 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %124 = load <61 x i8>, <61 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %125 = load <62 x i8>, <62 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %126 = load <63 x i8>, <63 x i8>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %127 = load <3 x i1>, <3 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %128 = load <5 x i1>, <5 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %129 = load <6 x i1>, <6 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %130 = load <7 x i1>, <7 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %131 = load <9 x i1>, <9 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %132 = load <10 x i1>, <10 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %133 = load <11 x i1>, <11 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %134 = load <12 x i1>, <12 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %135 = load <13 x i1>, <13 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %136 = load <14 x i1>, <14 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %137 = load <15 x i1>, <15 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %138 = load <17 x i1>, <17 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %139 = load <18 x i1>, <18 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %140 = load <19 x i1>, <19 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %141 = load <20 x i1>, <20 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %142 = load <21 x i1>, <21 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %143 = load <22 x i1>, <22 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %144 = load <23 x i1>, <23 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %145 = load <24 x i1>, <24 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %146 = load <25 x i1>, <25 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %147 = load <26 x i1>, <26 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %148 = load <27 x i1>, <27 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %149 = load <28 x i1>, <28 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %150 = load <29 x i1>, <29 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %151 = load <30 x i1>, <30 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %152 = load <31 x i1>, <31 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %153 = load <33 x i1>, <33 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %154 = load <34 x i1>, <34 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %155 = load <35 x i1>, <35 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %156 = load <36 x i1>, <36 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %157 = load <37 x i1>, <37 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %158 = load <38 x i1>, <38 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %159 = load <39 x i1>, <39 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %160 = load <40 x i1>, <40 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %161 = load <41 x i1>, <41 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %162 = load <42 x i1>, <42 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %163 = load <43 x i1>, <43 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %164 = load <44 x i1>, <44 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %165 = load <45 x i1>, <45 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %166 = load <46 x i1>, <46 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %167 = load <47 x i1>, <47 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %168 = load <48 x i1>, <48 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %169 = load <49 x i1>, <49 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %170 = load <50 x i1>, <50 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %171 = load <51 x i1>, <51 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %172 = load <52 x i1>, <52 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %173 = load <53 x i1>, <53 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %174 = load <54 x i1>, <54 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %175 = load <55 x i1>, <55 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %176 = load <56 x i1>, <56 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %177 = load <57 x i1>, <57 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %178 = load <58 x i1>, <58 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %179 = load <59 x i1>, <59 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %180 = load <60 x i1>, <60 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %181 = load <61 x i1>, <61 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %182 = load <62 x i1>, <62 x i1>* undef, align 64 +; AVX512-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %183 = load <63 x i1>, <63 x i1>* undef, align 64 ; AVX512-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 undef ; load <1 x i64>, <1 x i64>* undef, align 64