Index: llvm/lib/Target/RISCV/RISCVTargetTransformInfo.cpp =================================================================== --- llvm/lib/Target/RISCV/RISCVTargetTransformInfo.cpp +++ llvm/lib/Target/RISCV/RISCVTargetTransformInfo.cpp @@ -666,12 +666,17 @@ // currently have here. return 0; - APInt PseudoAddr = APInt::getAllOnes(DL.getPointerSizeInBits()); - // Add a cost of address load + the cost of the vector load. - return RISCVMatInt::getIntMatCost(PseudoAddr, DL.getPointerSizeInBits(), - getST()->getFeatureBits()) + - getMemoryOpCost(Instruction::Load, Ty, DL.getABITypeAlign(Ty), - /*AddressSpace=*/0, CostKind); + if (OpInfo.isUniform()) + // vmv.v.i, vmv.v.x, or vfmv.v.f + // We ignore the cost of the scalar constant materialization to be consistent + // with how we treat scalar constants themselves just above. + return 1; + + // Add a cost of address generation + the cost of the vector load. The + // address is expected to be a PC-relative offset to a constant pool entry + // using auipc/addi. 
+ return 2 + getMemoryOpCost(Instruction::Load, Ty, DL.getABITypeAlign(Ty), + /*AddressSpace=*/0, CostKind); } Index: llvm/test/Analysis/CostModel/RISCV/rvv-load-store.ll =================================================================== --- llvm/test/Analysis/CostModel/RISCV/rvv-load-store.ll +++ llvm/test/Analysis/CostModel/RISCV/rvv-load-store.ll @@ -297,17 +297,17 @@ ; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i32> undef, ptr %p, align 16 ; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store <4 x i32> zeroinitializer, ptr %p, align 16 ; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <4 x i64> zeroinitializer, ptr %p, align 32 -; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <4 x i32> , ptr %p, align 16 -; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: store <4 x i64> , ptr %p, align 32 -; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <4 x i32> , ptr %p, align 16 -; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <4 x i32> , ptr %p, align 16 -; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <4 x i32> , ptr %p, align 16 -; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <4 x i32> , ptr %p, align 16 -; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <4 x i32> , ptr %p, align 16 -; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <4 x i32> , ptr %p, align 16 -; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <4 x i32> , ptr %p, align 16 -; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <4 x i32> , ptr %p, align 16 -; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <4 x i32> , ptr %p, align 16 +; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store 
<4 x i32> , ptr %p, align 16 +; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: store <4 x i64> , ptr %p, align 32 +; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store <4 x i32> , ptr %p, align 16 +; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <4 x i32> , ptr %p, align 16 +; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <4 x i32> , ptr %p, align 16 +; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <4 x i32> , ptr %p, align 16 +; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <4 x i32> , ptr %p, align 16 +; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <4 x i32> , ptr %p, align 16 +; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <4 x i32> , ptr %p, align 16 +; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <4 x i32> , ptr %p, align 16 +; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store <4 x i32> , ptr %p, align 16 ; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret void ; Index: llvm/test/Transforms/SLPVectorizer/RISCV/load-store.ll =================================================================== --- llvm/test/Transforms/SLPVectorizer/RISCV/load-store.ll +++ llvm/test/Transforms/SLPVectorizer/RISCV/load-store.ll @@ -222,7 +222,13 @@ define void @store_stepvector_i32(ptr %dest) { ; CHECK-LABEL: @store_stepvector_i32( ; CHECK-NEXT: entry: -; CHECK-NEXT: store <4 x i32> , ptr [[DEST:%.*]], align 4 +; CHECK-NEXT: store i32 0, ptr [[DEST:%.*]], align 4 +; CHECK-NEXT: [[INC1:%.*]] = getelementptr inbounds i32, ptr [[DEST]], i64 1 +; CHECK-NEXT: store i32 1, ptr [[INC1]], align 2 +; CHECK-NEXT: [[INC2:%.*]] = getelementptr inbounds i32, ptr [[DEST]], i64 2 +; CHECK-NEXT: store i32 2, ptr [[INC2]], align 2 +; CHECK-NEXT: [[INC3:%.*]] = getelementptr inbounds i32, ptr 
[[DEST]], i64 3 +; CHECK-NEXT: store i32 3, ptr [[INC3]], align 2 ; CHECK-NEXT: ret void ; ; DEFAULT-LABEL: @store_stepvector_i32( @@ -250,7 +256,13 @@ define void @store_arbitrary_constant_i32(ptr %dest) { ; CHECK-LABEL: @store_arbitrary_constant_i32( ; CHECK-NEXT: entry: -; CHECK-NEXT: store <4 x i32> <i32 0, i32 -33, i32 44, i32 77>, ptr [[DEST:%.*]], align 4 +; CHECK-NEXT: store i32 0, ptr [[DEST:%.*]], align 4 +; CHECK-NEXT: [[INC1:%.*]] = getelementptr inbounds i32, ptr [[DEST]], i64 1 +; CHECK-NEXT: store i32 -33, ptr [[INC1]], align 2 +; CHECK-NEXT: [[INC2:%.*]] = getelementptr inbounds i32, ptr [[DEST]], i64 2 +; CHECK-NEXT: store i32 44, ptr [[INC2]], align 2 +; CHECK-NEXT: [[INC3:%.*]] = getelementptr inbounds i32, ptr [[DEST]], i64 3 +; CHECK-NEXT: store i32 77, ptr [[INC3]], align 2 ; CHECK-NEXT: ret void ; ; DEFAULT-LABEL: @store_arbitrary_constant_i32( Index: llvm/test/Transforms/SLPVectorizer/RISCV/rvv-min-vector-size.ll =================================================================== --- llvm/test/Transforms/SLPVectorizer/RISCV/rvv-min-vector-size.ll +++ llvm/test/Transforms/SLPVectorizer/RISCV/rvv-min-vector-size.ll @@ -14,33 +14,33 @@ ; CHECK-128-NEXT: entry: ; CHECK-128-NEXT: store i64 0, i64* [[DA:%.*]], align 8 ; CHECK-128-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds i64, i64* [[DA]], i64 1 -; CHECK-128-NEXT: store i64 1, i64* [[ARRAYIDX1]], align 8 +; CHECK-128-NEXT: store i64 0, i64* [[ARRAYIDX1]], align 8 ; CHECK-128-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds i64, i64* [[DA]], i64 2 -; CHECK-128-NEXT: store i64 2, i64* [[ARRAYIDX2]], align 8 +; CHECK-128-NEXT: store i64 0, i64* [[ARRAYIDX2]], align 8 ; CHECK-128-NEXT: [[ARRAYIDX3:%.*]] = getelementptr inbounds i64, i64* [[DA]], i64 3 -; CHECK-128-NEXT: store i64 3, i64* [[ARRAYIDX3]], align 8 +; CHECK-128-NEXT: store i64 0, i64* [[ARRAYIDX3]], align 8 ; CHECK-128-NEXT: ret void ; ; CHECK-256-LABEL: @foo( ; CHECK-256-NEXT: entry: ; CHECK-256-NEXT: [[TMP0:%.*]] = bitcast i64* [[DA:%.*]] to <4 x i64>* -; 
CHECK-256-NEXT: store <4 x i64> <i64 0, i64 1, i64 2, i64 3>, <4 x i64>* [[TMP0]], align 8 +; CHECK-256-NEXT: store <4 x i64> zeroinitializer, <4 x i64>* [[TMP0]], align 8 ; CHECK-256-NEXT: ret void ; ; CHECK-512-LABEL: @foo( ; CHECK-512-NEXT: entry: ; CHECK-512-NEXT: [[TMP0:%.*]] = bitcast i64* [[DA:%.*]] to <4 x i64>* -; CHECK-512-NEXT: store <4 x i64> <i64 0, i64 1, i64 2, i64 3>, <4 x i64>* [[TMP0]], align 8 +; CHECK-512-NEXT: store <4 x i64> zeroinitializer, <4 x i64>* [[TMP0]], align 8 ; CHECK-512-NEXT: ret void ; entry: store i64 0, i64* %da, align 8 %arrayidx1 = getelementptr inbounds i64, i64* %da, i64 1 - store i64 1, i64* %arrayidx1, align 8 + store i64 0, i64* %arrayidx1, align 8 %arrayidx2 = getelementptr inbounds i64, i64* %da, i64 2 - store i64 2, i64* %arrayidx2, align 8 + store i64 0, i64* %arrayidx2, align 8 %arrayidx3 = getelementptr inbounds i64, i64* %da, i64 3 - store i64 3, i64* %arrayidx3, align 8 + store i64 0, i64* %arrayidx3, align 8 ret void } @@ -49,14 +49,14 @@ ; CHECK-NEXT: entry: ; CHECK-NEXT: store i8 0, i8* [[DA:%.*]], align 8 ; CHECK-NEXT: [[ARRAYIDX1:%.*]] = getelementptr inbounds i8, i8* [[DA]], i8 1 -; CHECK-NEXT: store i8 1, i8* [[ARRAYIDX1]], align 8 +; CHECK-NEXT: store i8 0, i8* [[ARRAYIDX1]], align 8 ; CHECK-NEXT: [[ARRAYIDX2:%.*]] = getelementptr inbounds i8, i8* [[DA]], i8 2 ; CHECK-NEXT: ret void ; entry: store i8 0, i8* %da, align 8 %arrayidx1 = getelementptr inbounds i8, i8* %da, i8 1 - store i8 1, i8* %arrayidx1, align 8 + store i8 0, i8* %arrayidx1, align 8 %arrayidx2 = getelementptr inbounds i8, i8* %da, i8 2 ret void }