diff --git a/llvm/lib/Target/RISCV/RISCVISelLowering.h b/llvm/lib/Target/RISCV/RISCVISelLowering.h
--- a/llvm/lib/Target/RISCV/RISCVISelLowering.h
+++ b/llvm/lib/Target/RISCV/RISCVISelLowering.h
@@ -85,6 +85,12 @@
   // Splats an i64 scalar to a vector type (with element type i64) where the
   // scalar is a sign-extended i32.
   SPLAT_VECTOR_I64,
+  // Matches the semantics of vslidedown.vx or vslidedown.vi. The first operand
+  // is the pass-thru operand, the second is the source vector, and the third
+  // is the XLenVT index.
+  VSLIDEDOWN,
+  // Matches the semantics of the unmasked vid.v instruction.
+  VID,
 };
 } // namespace RISCVISD
@@ -269,6 +275,7 @@
   SDValue lowerShiftLeftParts(SDValue Op, SelectionDAG &DAG) const;
   SDValue lowerShiftRightParts(SDValue Op, SelectionDAG &DAG, bool IsSRA) const;
   SDValue lowerSPLATVECTOR(SDValue Op, SelectionDAG &DAG) const;
+  SDValue lowerINSERTVECTORELT(SDValue Op, SelectionDAG &DAG) const;
   SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, SelectionDAG &DAG) const;
   SDValue LowerINTRINSIC_W_CHAIN(SDValue Op, SelectionDAG &DAG) const;
diff --git a/llvm/lib/Target/RISCV/RISCVISelLowering.cpp b/llvm/lib/Target/RISCV/RISCVISelLowering.cpp
--- a/llvm/lib/Target/RISCV/RISCVISelLowering.cpp
+++ b/llvm/lib/Target/RISCV/RISCVISelLowering.cpp
@@ -371,9 +371,13 @@
       setOperationAction(ISD::UMAX, VT, Legal);
     }
 
-    // We must custom-lower SPLAT_VECTOR vXi64 on RV32
-    if (!Subtarget.is64Bit())
+    // We must custom-lower certain vXi64 operations on RV32 due to the vector
+    // element type being illegal.
+    if (!Subtarget.is64Bit()) {
       setOperationAction(ISD::SPLAT_VECTOR, MVT::i64, Custom);
+      setOperationAction(ISD::INSERT_VECTOR_ELT, MVT::i64, Custom);
+      setOperationAction(ISD::EXTRACT_VECTOR_ELT, MVT::i64, Custom);
+    }
 
     // Expand various CCs to best match the RVV ISA, which natively supports UNE
     // but no other unordered comparisons, and supports all ordered comparisons
@@ -684,6 +688,8 @@
   }
   case ISD::SPLAT_VECTOR:
     return lowerSPLATVECTOR(Op, DAG);
+  case ISD::INSERT_VECTOR_ELT:
+    return lowerINSERTVECTORELT(Op, DAG);
   }
 }
@@ -1121,6 +1127,12 @@
                        DAG.getConstant(CVal->getSExtValue(), DL, MVT::i32));
   }
 
+  if (SplatVal.getOpcode() == ISD::SIGN_EXTEND &&
+      SplatVal.getOperand(0).getValueType() == MVT::i32) {
+    return DAG.getNode(RISCVISD::SPLAT_VECTOR_I64, DL, VecVT,
+                       SplatVal.getOperand(0));
+  }
+
   // Else, on RV32 we lower an i64-element SPLAT_VECTOR thus, being careful not
   // to accidentally sign-extend the 32-bit halves to the e64 SEW:
   //   vmv.v.x vX, hi
@@ -1148,6 +1160,38 @@
   return DAG.getNode(ISD::OR, DL, VecVT, Lo, Hi);
 }
 
+// Custom-lower INSERT_VECTOR_ELT where XLEN<SEW, as the SEW element type is
+// illegal (currently only vXi64 RV32).
+SDValue RISCVTargetLowering::lowerINSERTVECTORELT(SDValue Op,
+                                                  SelectionDAG &DAG) const {
+  SDLoc DL(Op);
+  EVT VecVT = Op.getValueType();
+  assert(!Subtarget.is64Bit() && VecVT.getVectorElementType() == MVT::i64 &&
+         "Unexpected INSERT_VECTOR_ELT legalization");
+
+  // Insert the element by splatting both the value and the index, generating
+  // the vector index sequence with a VID, and selecting the new value in the
+  // lane where the index matches:
+  //   vselect (vid == splat(idx)), splat(val), vec
+  SDValue SplattedVal = DAG.getSplatVector(VecVT, DL, Op.getOperand(1));
+  SDValue SplattedIdx = DAG.getNode(RISCVISD::SPLAT_VECTOR_I64, DL, VecVT,
+                                    Op.getOperand(2));
+
+  SDValue VID = DAG.getNode(RISCVISD::VID, DL, VecVT);
+  auto SetCCVT =
+      getSetCCResultType(DAG.getDataLayout(), *DAG.getContext(), VecVT);
+  SDValue SelectCond = DAG.getSetCC(DL, SetCCVT, VID, SplattedIdx, ISD::SETEQ);
+
+  return DAG.getNode(ISD::VSELECT, DL, VecVT, SelectCond, SplattedVal,
+                     Op.getOperand(0));
+}
+
 SDValue RISCVTargetLowering::LowerINTRINSIC_WO_CHAIN(SDValue Op,
                                                      SelectionDAG &DAG) const {
   unsigned IntNo = cast<ConstantSDNode>(Op.getOperand(0))->getZExtValue();
@@ -1447,6 +1491,45 @@
     Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, MVT::i32, NewOp));
     break;
   }
+  case ISD::EXTRACT_VECTOR_ELT: {
+    // Custom-legalize an EXTRACT_VECTOR_ELT where XLEN<SEW, as the SEW element
+    // type is illegal (currently only vXi64 RV32). With vmv.x.s, when
+    // SEW > XLEN, only the least-significant XLEN bits are
+    // transferred to the destination register. We issue two of these from the
+    // upper- and lower- halves of the SEW-bit vector element, slid down to the
+    // first element.
+    SDLoc DL(N);
+    SDValue Vec = N->getOperand(0);
+    SDValue Idx = N->getOperand(1);
+    EVT VecVT = Vec.getValueType();
+    assert(!Subtarget.is64Bit() && N->getValueType(0) == MVT::i64 &&
+           VecVT.getVectorElementType() == MVT::i64 &&
+           "Unexpected EXTRACT_VECTOR_ELT legalization");
+
+    SDValue Slidedown = Vec;
+    // Unless the index is known to be 0, we must slide the vector down to get
+    // the desired element into index 0.
+    if (!isNullConstant(Idx))
+      Slidedown = DAG.getNode(RISCVISD::VSLIDEDOWN, DL, VecVT,
+                              DAG.getUNDEF(VecVT), Vec, Idx);
+
+    // Extract the lower XLEN bits of the correct vector element.
+    SDValue EltLo = DAG.getNode(RISCVISD::VMV_X_S, DL, Subtarget.getXLenVT(),
+                                Slidedown, Idx);
+
+    // To extract the upper XLEN bits of the vector element, shift the first
+    // element right by 32 bits and re-extract the lower XLEN bits.
+    SDValue ThirtyTwoV =
+        DAG.getNode(RISCVISD::SPLAT_VECTOR_I64, DL, VecVT,
+                    DAG.getConstant(32, DL, Subtarget.getXLenVT()));
+    SDValue LShr32 = DAG.getNode(ISD::SRL, DL, VecVT, Slidedown, ThirtyTwoV);
+
+    SDValue EltHi =
+        DAG.getNode(RISCVISD::VMV_X_S, DL, Subtarget.getXLenVT(), LShr32, Idx);
+
+    Results.push_back(DAG.getNode(ISD::BUILD_PAIR, DL, MVT::i64, EltLo, EltHi));
+    break;
+  }
   case ISD::INTRINSIC_WO_CHAIN: {
     unsigned IntNo = cast<ConstantSDNode>(N->getOperand(0))->getZExtValue();
     switch (IntNo) {
@@ -3538,6 +3621,8 @@
     NODE_NAME_CASE(GORCIW)
     NODE_NAME_CASE(VMV_X_S)
     NODE_NAME_CASE(SPLAT_VECTOR_I64)
+    NODE_NAME_CASE(VSLIDEDOWN)
+    NODE_NAME_CASE(VID)
   }
   // clang-format on
   return nullptr;
diff --git a/llvm/lib/Target/RISCV/RISCVInstrInfoVPseudos.td b/llvm/lib/Target/RISCV/RISCVInstrInfoVPseudos.td
--- a/llvm/lib/Target/RISCV/RISCVInstrInfoVPseudos.td
+++ b/llvm/lib/Target/RISCV/RISCVInstrInfoVPseudos.td
@@ -93,6 +93,15 @@
                   !dag(type, [operand], [name]));
 }
 
+class FromFPR32<ValueType type, DAGOperand operand, dag input_dag> {
+  dag ret = !cond(!eq(!cast<string>(operand), !cast<string>(FPR64)):
+                    (INSERT_SUBREG (IMPLICIT_DEF), input_dag, sub_32),
+                  !eq(!cast<string>(operand), !cast<string>(FPR16)):
+                    (EXTRACT_SUBREG input_dag, sub_16),
+                  !eq(1, 1):
+                    input_dag);
+}
+
 //===----------------------------------------------------------------------===//
 // Vector register and vector group type information.
 //===----------------------------------------------------------------------===//
diff --git a/llvm/lib/Target/RISCV/RISCVInstrInfoVSDPatterns.td b/llvm/lib/Target/RISCV/RISCVInstrInfoVSDPatterns.td
--- a/llvm/lib/Target/RISCV/RISCVInstrInfoVSDPatterns.td
+++ b/llvm/lib/Target/RISCV/RISCVInstrInfoVSDPatterns.td
@@ -494,3 +494,133 @@
                 0, VLMax, fvti.SEW)>;
   }
 } // Predicates = [HasStdExtV, HasStdExtF]
+
+//===----------------------------------------------------------------------===//
+// Vector Element Inserts/Extracts
+//===----------------------------------------------------------------------===//
+
+// The built-in TableGen 'extractelt' and 'insertelt' nodes must return the
+// same type as the vector element type. On RISC-V, XLenVT is the only legal
+// integer type, so for integer inserts/extracts we use a custom node which
+// returns XLenVT.
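+//
+// For example (an illustrative note, nothing beyond what the tests below
+// exercise): an IR-level extract such as
+//   %r = extractelement <vscale x 1 x i8> %v, i32 0
+// produces an i8 result, but riscv_extract_vector_elt gives the selected
+// vmv.x.s pseudo an XLenVT result, whose upper bits the consumer is free to
+// ignore.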
+def riscv_insert_vector_elt
+    : SDNode<"ISD::INSERT_VECTOR_ELT",
+             SDTypeProfile<1, 3, [SDTCisSameAs<0, 1>, SDTCisVT<2, XLenVT>,
+                                  SDTCisPtrTy<3>]>, []>;
+def riscv_extract_vector_elt
+    : SDNode<"ISD::EXTRACT_VECTOR_ELT",
+             SDTypeProfile<1, 2, [SDTCisVT<0, XLenVT>, SDTCisPtrTy<2>]>, []>;
+
+multiclass VPatInsertExtractElt_XI_Idx<bit IsFloat> {
+  defvar vtilist = !if(IsFloat, AllFloatVectors, AllIntegerVectors);
+  defvar insertelt_node = !if(IsFloat, insertelt, riscv_insert_vector_elt);
+  defvar extractelt_node = !if(IsFloat, extractelt, riscv_extract_vector_elt);
+  foreach vti = vtilist in {
+    defvar MX = vti.LMul.MX;
+    defvar vmv_xf_s_inst = !cast<Instruction>(!if(IsFloat, "PseudoVFMV_F_S_",
+                                                           "PseudoVMV_X_S_")#MX);
+    defvar vmv_s_xf_inst = !cast<Instruction>(!if(IsFloat, "PseudoVFMV_S_F_",
+                                                           "PseudoVMV_S_X_")#MX);
+    defvar slideup_vi_inst = !cast<Instruction>("PseudoVSLIDEUP_VI_"#MX);
+    defvar slideup_vx_inst = !cast<Instruction>("PseudoVSLIDEUP_VX_"#MX);
+    defvar slidedown_vx_inst = !cast<Instruction>("PseudoVSLIDEDOWN_VX_"#MX);
+    defvar slidedown_vi_inst = !cast<Instruction>("PseudoVSLIDEDOWN_VI_"#MX);
+
+    // Optimize element-extract operations where the index is 0 and so the
+    // vector doesn't need sliding up/down
+    def : Pat<(vti.Scalar (extractelt_node (vti.Vector vti.RegClass:$rs2), 0)),
+              FromFPR32<vti.Scalar, vti.ScalarRegClass,
+                        (vmv_xf_s_inst vti.RegClass:$rs2, vti.SEW)>.ret>;
+
+    def : Pat<(vti.Scalar (extractelt_node (vti.Vector vti.RegClass:$rs2),
+                                           uimm5:$rs1)),
+              FromFPR32<vti.Scalar, vti.ScalarRegClass,
+                        (vmv_xf_s_inst
+                          (slidedown_vi_inst (vti.Vector (IMPLICIT_DEF)),
+                                             (vti.Vector vti.RegClass:$rs2),
+                                             uimm5:$rs1, VLMax, vti.SEW),
+                          vti.SEW)>.ret>;
+
+    def : Pat<(vti.Scalar (extractelt_node (vti.Vector vti.RegClass:$rs2),
+                                           GPR:$rs1)),
+              FromFPR32<vti.Scalar, vti.ScalarRegClass,
+                        (vmv_xf_s_inst
+                          (slidedown_vx_inst (vti.Vector (IMPLICIT_DEF)),
+                                             (vti.Vector vti.RegClass:$rs2),
+                                             GPR:$rs1, VLMax, vti.SEW),
+                          vti.SEW)>.ret>;
+
+    // Optimize element-insert operations where the index is 0 and so the
+    // vector doesn't need sliding up/down
+    def : Pat<(vti.Vector (insertelt_node (vti.Vector vti.RegClass:$merge),
+                                          vti.ScalarRegClass:$rs1, 0)),
+              (vmv_s_xf_inst vti.RegClass:$merge,
+                             ToFPR32<vti.Scalar, vti.ScalarRegClass, "rs1">.ret,
+                             VLMax, vti.SEW)>;
+
+    def : Pat<(vti.Vector (insertelt_node (vti.Vector vti.RegClass:$merge),
+                                          vti.ScalarRegClass:$rs1, uimm5:$rs2)),
+              (slideup_vi_inst
+                (vti.Vector vti.RegClass:$merge),
+                (vmv_s_xf_inst
+                  (slidedown_vi_inst (vti.Vector (IMPLICIT_DEF)),
+                                     (vti.Vector vti.RegClass:$merge),
+                                     uimm5:$rs2, VLMax, vti.SEW),
+                  ToFPR32<vti.Scalar, vti.ScalarRegClass, "rs1">.ret,
+                  VLMax, vti.SEW),
+                uimm5:$rs2, VLMax, vti.SEW)>;
+
+    def : Pat<(vti.Vector (insertelt_node (vti.Vector vti.RegClass:$merge),
+                                          vti.ScalarRegClass:$rs1, GPR:$rs2)),
+              (slideup_vx_inst
+                (vti.Vector vti.RegClass:$merge),
+                (vmv_s_xf_inst
+                  (slidedown_vx_inst (vti.Vector (IMPLICIT_DEF)),
+                                     (vti.Vector vti.RegClass:$merge),
+                                     GPR:$rs2, VLMax, vti.SEW),
+                  ToFPR32<vti.Scalar, vti.ScalarRegClass, "rs1">.ret,
+                  VLMax, vti.SEW),
+                GPR:$rs2, VLMax, vti.SEW)>;
+  }
+}
+
+let Predicates = [HasStdExtV] in
+defm "" : VPatInsertExtractElt_XI_Idx<0>;
+let Predicates = [HasStdExtV, HasStdExtF] in
+defm "" : VPatInsertExtractElt_XI_Idx<1>;
+
+//===----------------------------------------------------------------------===//
+// Miscellaneous RISCVISD SDNodes
+//===----------------------------------------------------------------------===//
+
+def riscv_vid
+    : SDNode<"RISCVISD::VID", SDTypeProfile<1, 0, [SDTCisVec<0>]>, []>;
+
+def riscv_slidedown
+    : SDNode<"RISCVISD::VSLIDEDOWN",
+             SDTypeProfile<1, 3, [SDTCisVec<0>, SDTCisSameAs<1, 0>,
+                                  SDTCisSameAs<2, 0>,
+                                  SDTCisVT<3, XLenVT>]>, []>;
+
+let Predicates = [HasStdExtV] in {
+
+foreach vti = AllIntegerVectors in
+  def : Pat<(vti.Vector riscv_vid),
+            (!cast<Instruction>("PseudoVID_V_"#vti.LMul.MX) VLMax, vti.SEW)>;
+
+foreach vti = !listconcat(AllIntegerVectors, AllFloatVectors) in {
+  def : Pat<(vti.Vector (riscv_slidedown (vti.Vector vti.RegClass:$rs3),
+                                         (vti.Vector vti.RegClass:$rs1),
+                                         uimm5:$rs2)),
+            (!cast<Instruction>("PseudoVSLIDEDOWN_VI_"#vti.LMul.MX)
+                vti.RegClass:$rs3,
+                vti.RegClass:$rs1, uimm5:$rs2,
+                VLMax, vti.SEW)>;
+
+  def : Pat<(vti.Vector (riscv_slidedown (vti.Vector vti.RegClass:$rs3),
+                                         (vti.Vector vti.RegClass:$rs1),
+                                         GPR:$rs2)),
+            (!cast<Instruction>("PseudoVSLIDEDOWN_VX_"#vti.LMul.MX)
+                vti.RegClass:$rs3, vti.RegClass:$rs1, GPR:$rs2,
+                VLMax, vti.SEW)>;
+}
+} // Predicates = [HasStdExtV]
diff --git a/llvm/test/CodeGen/RISCV/rvv/extractelt-fp-rv32.ll b/llvm/test/CodeGen/RISCV/rvv/extractelt-fp-rv32.ll
new file mode 100644
--- /dev/null
+++ b/llvm/test/CodeGen/RISCV/rvv/extractelt-fp-rv32.ll
@@ -0,0 +1,532 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc -mtriple=riscv32 -mattr=+d,+experimental-zfh,+experimental-v -target-abi=ilp32d \
+; RUN:   -verify-machineinstrs < %s | FileCheck %s
+
+define half @extractelt_nxv1f16_0(<vscale x 1 x half> %v) {
+; CHECK-LABEL: extractelt_nxv1f16_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli zero, zero, e16,mf4,ta,mu
+; CHECK-NEXT:    vfmv.f.s fa0, v16
+; CHECK-NEXT:    # kill: def $f10_h killed $f10_h killed $f10_f
+; CHECK-NEXT:    ret
+  %r = extractelement <vscale x 1 x half> %v, i32 0
+  ret half %r
+}
+
+define half @extractelt_nxv1f16_imm(<vscale x 1 x half> %v) {
+; CHECK-LABEL: extractelt_nxv1f16_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a0, zero, e16,mf4,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 2
+; CHECK-NEXT:    vsetvli zero, zero, e16,mf4,ta,mu
+; CHECK-NEXT:    vfmv.f.s fa0, v25
+; CHECK-NEXT:    # kill: def $f10_h killed $f10_h killed $f10_f
+; CHECK-NEXT:    ret
+  %r = extractelement <vscale x 1 x half> %v, i32 2
+  ret half %r
+}
+
+define half @extractelt_nxv1f16_idx(<vscale x 1 x half> %v, i32 %idx) {
+; CHECK-LABEL: extractelt_nxv1f16_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,mf4,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a0
+; CHECK-NEXT:    vsetvli zero, zero, e16,mf4,ta,mu
+; CHECK-NEXT:    vfmv.f.s fa0, v25
+; CHECK-NEXT:    # kill: def $f10_h killed $f10_h killed $f10_f
+; CHECK-NEXT:    ret
+  %r = extractelement <vscale x 1 x half> %v, i32 %idx
+  ret half %r
+}
+
+define half @extractelt_nxv2f16_0(<vscale x 2 x half> %v) {
+; CHECK-LABEL: extractelt_nxv2f16_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli zero, zero, e16,mf2,ta,mu
+; CHECK-NEXT:    vfmv.f.s fa0, v16
+; CHECK-NEXT:    # kill: def $f10_h killed $f10_h killed $f10_f
+; CHECK-NEXT:    ret
+  %r = extractelement <vscale x 2 x half> %v, i32 0
+  ret half %r
+}
+
+define half @extractelt_nxv2f16_imm(<vscale x 2 x half> %v) {
+; CHECK-LABEL: extractelt_nxv2f16_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a0, zero, e16,mf2,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 2
+; CHECK-NEXT:    vsetvli zero, zero, e16,mf2,ta,mu
+; CHECK-NEXT:    vfmv.f.s fa0, v25
+; CHECK-NEXT:    # kill: def $f10_h killed $f10_h killed $f10_f
+; CHECK-NEXT:    ret
+  %r = extractelement <vscale x 2 x half> %v, i32 2
+  ret half %r
+}
+
+define half @extractelt_nxv2f16_idx(<vscale x 2 x half> %v, i32 %idx) {
+; CHECK-LABEL: extractelt_nxv2f16_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,mf2,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a0
+; CHECK-NEXT:    vsetvli zero, zero, e16,mf2,ta,mu
+; CHECK-NEXT:    vfmv.f.s fa0, v25
+; CHECK-NEXT:    # kill: def $f10_h killed $f10_h killed $f10_f
+; CHECK-NEXT:    ret
+  %r = extractelement <vscale x 2 x half> %v, i32 %idx
+  ret half %r
+}
+
+define half @extractelt_nxv4f16_0(<vscale x 4 x half> %v) {
+; CHECK-LABEL: extractelt_nxv4f16_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli zero, zero, e16,m1,ta,mu
+; CHECK-NEXT:    vfmv.f.s fa0, v16
+; CHECK-NEXT:    # kill: def $f10_h killed $f10_h killed $f10_f
+; CHECK-NEXT:    ret
+  %r = extractelement <vscale x 4 x half> %v, i32 0
+  ret half %r
+}
+
+define half @extractelt_nxv4f16_imm(<vscale x 4 x half> %v) {
+; CHECK-LABEL: extractelt_nxv4f16_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a0, zero, e16,m1,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 2
+;
CHECK-NEXT: vsetvli zero, zero, e16,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret half %r +} + +define half @extractelt_nxv4f16_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv4f16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e16,m1,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e16,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret half %r +} + +define half @extractelt_nxv8f16_0( %v) { +; CHECK-LABEL: extractelt_nxv8f16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e16,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret half %r +} + +define half @extractelt_nxv8f16_imm( %v) { +; CHECK-LABEL: extractelt_nxv8f16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e16,m2,tu,mu +; CHECK-NEXT: vslidedown.vi v26, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e16,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v26 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret half %r +} + +define half @extractelt_nxv8f16_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv8f16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e16,m2,tu,mu +; CHECK-NEXT: vslidedown.vx v26, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e16,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v26 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret half %r +} + +define half @extractelt_nxv16f16_0( %v) { +; CHECK-LABEL: extractelt_nxv16f16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e16,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret half %r +} + +define half @extractelt_nxv16f16_imm( %v) { +; CHECK-LABEL: extractelt_nxv16f16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e16,m4,tu,mu +; CHECK-NEXT: vslidedown.vi v28, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e16,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v28 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret half %r +} + +define half @extractelt_nxv16f16_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv16f16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e16,m4,tu,mu +; CHECK-NEXT: vslidedown.vx v28, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e16,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v28 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret half %r +} + +define half @extractelt_nxv32f16_0( %v) { +; CHECK-LABEL: extractelt_nxv32f16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e16,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret half %r +} + +define half @extractelt_nxv32f16_imm( %v) { +; CHECK-LABEL: extractelt_nxv32f16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e16,m8,tu,mu +; CHECK-NEXT: vslidedown.vi v8, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e16,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v8 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; 
CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret half %r +} + +define half @extractelt_nxv32f16_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv32f16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e16,m8,tu,mu +; CHECK-NEXT: vslidedown.vx v8, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e16,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v8 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret half %r +} + +define float @extractelt_nxv1f32_0( %v) { +; CHECK-LABEL: extractelt_nxv1f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e32,mf2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret float %r +} + +define float @extractelt_nxv1f32_imm( %v) { +; CHECK-LABEL: extractelt_nxv1f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,mf2,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e32,mf2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret float %r +} + +define float @extractelt_nxv1f32_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv1f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,mf2,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e32,mf2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret float %r +} + +define float @extractelt_nxv2f32_0( %v) { +; CHECK-LABEL: extractelt_nxv2f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e32,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret float %r +} + +define float @extractelt_nxv2f32_imm( %v) { +; CHECK-LABEL: extractelt_nxv2f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m1,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e32,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret float %r +} + +define float @extractelt_nxv2f32_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv2f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,m1,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e32,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret float %r +} + +define float @extractelt_nxv4f32_0( %v) { +; CHECK-LABEL: extractelt_nxv4f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e32,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret float %r +} + +define float @extractelt_nxv4f32_imm( %v) { +; CHECK-LABEL: extractelt_nxv4f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m2,tu,mu +; CHECK-NEXT: vslidedown.vi v26, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e32,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v26 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret float %r +} + +define float @extractelt_nxv4f32_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv4f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,m2,tu,mu +; CHECK-NEXT: vslidedown.vx v26, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e32,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v26 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret float %r +} + +define float @extractelt_nxv8f32_0( %v) { +; CHECK-LABEL: extractelt_nxv8f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e32,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = 
extractelement %v, i32 0 + ret float %r +} + +define float @extractelt_nxv8f32_imm( %v) { +; CHECK-LABEL: extractelt_nxv8f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m4,tu,mu +; CHECK-NEXT: vslidedown.vi v28, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e32,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v28 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret float %r +} + +define float @extractelt_nxv8f32_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv8f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,m4,tu,mu +; CHECK-NEXT: vslidedown.vx v28, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e32,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v28 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret float %r +} + +define float @extractelt_nxv16f32_0( %v) { +; CHECK-LABEL: extractelt_nxv16f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e32,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret float %r +} + +define float @extractelt_nxv16f32_imm( %v) { +; CHECK-LABEL: extractelt_nxv16f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m8,tu,mu +; CHECK-NEXT: vslidedown.vi v8, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e32,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v8 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret float %r +} + +define float @extractelt_nxv16f32_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv16f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,m8,tu,mu +; CHECK-NEXT: vslidedown.vx v8, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e32,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v8 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret float %r +} + +define double @extractelt_nxv1f64_0( %v) { +; CHECK-LABEL: extractelt_nxv1f64_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e64,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret double %r +} + +define double @extractelt_nxv1f64_imm( %v) { +; CHECK-LABEL: extractelt_nxv1f64_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m1,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e64,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret double %r +} + +define double @extractelt_nxv1f64_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv1f64_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e64,m1,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e64,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret double %r +} + +define double @extractelt_nxv2f64_0( %v) { +; CHECK-LABEL: extractelt_nxv2f64_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e64,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret double %r +} + +define double @extractelt_nxv2f64_imm( %v) { +; CHECK-LABEL: extractelt_nxv2f64_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m2,tu,mu +; CHECK-NEXT: vslidedown.vi v26, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e64,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v26 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret double %r +} + +define double @extractelt_nxv2f64_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv2f64_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e64,m2,tu,mu +; CHECK-NEXT: vslidedown.vx v26, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e64,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v26 +; CHECK-NEXT: 
ret + %r = extractelement %v, i32 %idx + ret double %r +} + +define double @extractelt_nxv4f64_0( %v) { +; CHECK-LABEL: extractelt_nxv4f64_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e64,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret double %r +} + +define double @extractelt_nxv4f64_imm( %v) { +; CHECK-LABEL: extractelt_nxv4f64_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m4,tu,mu +; CHECK-NEXT: vslidedown.vi v28, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e64,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v28 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret double %r +} + +define double @extractelt_nxv4f64_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv4f64_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e64,m4,tu,mu +; CHECK-NEXT: vslidedown.vx v28, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e64,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v28 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret double %r +} + +define double @extractelt_nxv8f64_0( %v) { +; CHECK-LABEL: extractelt_nxv8f64_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e64,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret double %r +} + +define double @extractelt_nxv8f64_imm( %v) { +; CHECK-LABEL: extractelt_nxv8f64_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m8,tu,mu +; CHECK-NEXT: vslidedown.vi v8, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e64,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v8 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret double %r +} + +define double @extractelt_nxv8f64_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv8f64_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e64,m8,tu,mu +; CHECK-NEXT: vslidedown.vx v8, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e64,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v8 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret double %r +} + diff --git a/llvm/test/CodeGen/RISCV/rvv/extractelt-fp-rv64.ll b/llvm/test/CodeGen/RISCV/rvv/extractelt-fp-rv64.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/RISCV/rvv/extractelt-fp-rv64.ll @@ -0,0 +1,532 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; RUN: llc -mtriple=riscv64 -mattr=+d,+experimental-zfh,+experimental-v -target-abi=lp64d \ +; RUN: -verify-machineinstrs < %s | FileCheck %s + +define half @extractelt_nxv1f16_0( %v) { +; CHECK-LABEL: extractelt_nxv1f16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e16,mf4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret half %r +} + +define half @extractelt_nxv1f16_imm( %v) { +; CHECK-LABEL: extractelt_nxv1f16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e16,mf4,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e16,mf4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret half %r +} + +define half @extractelt_nxv1f16_idx( %v, i32 signext %idx) { +; CHECK-LABEL: extractelt_nxv1f16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e16,mf4,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e16,mf4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret 
half %r +} + +define half @extractelt_nxv2f16_0( %v) { +; CHECK-LABEL: extractelt_nxv2f16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e16,mf2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret half %r +} + +define half @extractelt_nxv2f16_imm( %v) { +; CHECK-LABEL: extractelt_nxv2f16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e16,mf2,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e16,mf2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret half %r +} + +define half @extractelt_nxv2f16_idx( %v, i32 signext %idx) { +; CHECK-LABEL: extractelt_nxv2f16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e16,mf2,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e16,mf2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret half %r +} + +define half @extractelt_nxv4f16_0( %v) { +; CHECK-LABEL: extractelt_nxv4f16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e16,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret half %r +} + +define half @extractelt_nxv4f16_imm( %v) { +; CHECK-LABEL: extractelt_nxv4f16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e16,m1,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e16,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret half %r +} + +define half @extractelt_nxv4f16_idx( %v, i32 signext %idx) { +; CHECK-LABEL: extractelt_nxv4f16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e16,m1,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e16,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret half %r +} + +define half @extractelt_nxv8f16_0( %v) { +; CHECK-LABEL: extractelt_nxv8f16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e16,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret half %r +} + +define half @extractelt_nxv8f16_imm( %v) { +; CHECK-LABEL: extractelt_nxv8f16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e16,m2,tu,mu +; CHECK-NEXT: vslidedown.vi v26, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e16,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v26 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret half %r +} + +define half @extractelt_nxv8f16_idx( %v, i32 signext %idx) { +; CHECK-LABEL: extractelt_nxv8f16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e16,m2,tu,mu +; CHECK-NEXT: vslidedown.vx v26, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e16,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v26 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret half %r +} + +define half @extractelt_nxv16f16_0( %v) { +; CHECK-LABEL: extractelt_nxv16f16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: 
vsetvli zero, zero, e16,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret half %r +} + +define half @extractelt_nxv16f16_imm( %v) { +; CHECK-LABEL: extractelt_nxv16f16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e16,m4,tu,mu +; CHECK-NEXT: vslidedown.vi v28, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e16,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v28 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret half %r +} + +define half @extractelt_nxv16f16_idx( %v, i32 signext %idx) { +; CHECK-LABEL: extractelt_nxv16f16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e16,m4,tu,mu +; CHECK-NEXT: vslidedown.vx v28, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e16,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v28 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret half %r +} + +define half @extractelt_nxv32f16_0( %v) { +; CHECK-LABEL: extractelt_nxv32f16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e16,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret half %r +} + +define half @extractelt_nxv32f16_imm( %v) { +; CHECK-LABEL: extractelt_nxv32f16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e16,m8,tu,mu +; CHECK-NEXT: vslidedown.vi v8, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e16,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v8 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret half %r +} + +define half @extractelt_nxv32f16_idx( %v, i32 signext %idx) { +; CHECK-LABEL: extractelt_nxv32f16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e16,m8,tu,mu +; CHECK-NEXT: vslidedown.vx v8, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e16,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v8 +; CHECK-NEXT: # kill: def $f10_h killed $f10_h killed $f10_f +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret half %r +} + +define float @extractelt_nxv1f32_0( %v) { +; CHECK-LABEL: extractelt_nxv1f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e32,mf2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret float %r +} + +define float @extractelt_nxv1f32_imm( %v) { +; CHECK-LABEL: extractelt_nxv1f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,mf2,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e32,mf2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret float %r +} + +define float @extractelt_nxv1f32_idx( %v, i32 signext %idx) { +; CHECK-LABEL: extractelt_nxv1f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,mf2,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e32,mf2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret float %r +} + +define float @extractelt_nxv2f32_0( %v) { +; CHECK-LABEL: extractelt_nxv2f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e32,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret float %r +} + +define float @extractelt_nxv2f32_imm( %v) { +; CHECK-LABEL: extractelt_nxv2f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m1,tu,mu +; CHECK-NEXT: 
vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e32,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret float %r +} + +define float @extractelt_nxv2f32_idx( %v, i32 signext %idx) { +; CHECK-LABEL: extractelt_nxv2f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,m1,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e32,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret float %r +} + +define float @extractelt_nxv4f32_0( %v) { +; CHECK-LABEL: extractelt_nxv4f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e32,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret float %r +} + +define float @extractelt_nxv4f32_imm( %v) { +; CHECK-LABEL: extractelt_nxv4f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m2,tu,mu +; CHECK-NEXT: vslidedown.vi v26, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e32,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v26 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret float %r +} + +define float @extractelt_nxv4f32_idx( %v, i32 signext %idx) { +; CHECK-LABEL: extractelt_nxv4f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,m2,tu,mu +; CHECK-NEXT: vslidedown.vx v26, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e32,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v26 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret float %r +} + +define float @extractelt_nxv8f32_0( %v) { +; CHECK-LABEL: extractelt_nxv8f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e32,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret float %r +} + +define float @extractelt_nxv8f32_imm( %v) { +; CHECK-LABEL: extractelt_nxv8f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m4,tu,mu +; CHECK-NEXT: vslidedown.vi v28, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e32,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v28 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret float %r +} + +define float @extractelt_nxv8f32_idx( %v, i32 signext %idx) { +; CHECK-LABEL: extractelt_nxv8f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,m4,tu,mu +; CHECK-NEXT: vslidedown.vx v28, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e32,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v28 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret float %r +} + +define float @extractelt_nxv16f32_0( %v) { +; CHECK-LABEL: extractelt_nxv16f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e32,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret float %r +} + +define float @extractelt_nxv16f32_imm( %v) { +; CHECK-LABEL: extractelt_nxv16f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m8,tu,mu +; CHECK-NEXT: vslidedown.vi v8, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e32,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v8 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret float %r +} + +define float @extractelt_nxv16f32_idx( %v, i32 signext %idx) { +; CHECK-LABEL: extractelt_nxv16f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,m8,tu,mu +; CHECK-NEXT: vslidedown.vx v8, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e32,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v8 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret float %r +} + +define double @extractelt_nxv1f64_0( %v) { +; CHECK-LABEL: extractelt_nxv1f64_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, 
zero, e64,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret double %r +} + +define double @extractelt_nxv1f64_imm( %v) { +; CHECK-LABEL: extractelt_nxv1f64_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m1,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e64,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret double %r +} + +define double @extractelt_nxv1f64_idx( %v, i32 signext %idx) { +; CHECK-LABEL: extractelt_nxv1f64_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e64,m1,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e64,m1,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret double %r +} + +define double @extractelt_nxv2f64_0( %v) { +; CHECK-LABEL: extractelt_nxv2f64_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e64,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret double %r +} + +define double @extractelt_nxv2f64_imm( %v) { +; CHECK-LABEL: extractelt_nxv2f64_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m2,tu,mu +; CHECK-NEXT: vslidedown.vi v26, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e64,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v26 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret double %r +} + +define double @extractelt_nxv2f64_idx( %v, i32 signext %idx) { +; CHECK-LABEL: extractelt_nxv2f64_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e64,m2,tu,mu +; CHECK-NEXT: vslidedown.vx v26, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e64,m2,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v26 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret double %r +} + +define double @extractelt_nxv4f64_0( %v) { +; CHECK-LABEL: extractelt_nxv4f64_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e64,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret double %r +} + +define double @extractelt_nxv4f64_imm( %v) { +; CHECK-LABEL: extractelt_nxv4f64_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m4,tu,mu +; CHECK-NEXT: vslidedown.vi v28, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e64,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v28 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret double %r +} + +define double @extractelt_nxv4f64_idx( %v, i32 signext %idx) { +; CHECK-LABEL: extractelt_nxv4f64_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e64,m4,tu,mu +; CHECK-NEXT: vslidedown.vx v28, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e64,m4,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v28 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret double %r +} + +define double @extractelt_nxv8f64_0( %v) { +; CHECK-LABEL: extractelt_nxv8f64_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e64,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret double %r +} + +define double @extractelt_nxv8f64_imm( %v) { +; CHECK-LABEL: extractelt_nxv8f64_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m8,tu,mu +; CHECK-NEXT: vslidedown.vi v8, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e64,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v8 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret double %r +} + +define double @extractelt_nxv8f64_idx( %v, i32 signext %idx) { +; CHECK-LABEL: extractelt_nxv8f64_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e64,m8,tu,mu +; CHECK-NEXT: 
vslidedown.vx v8, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e64,m8,ta,mu +; CHECK-NEXT: vfmv.f.s fa0, v8 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret double %r +} + diff --git a/llvm/test/CodeGen/RISCV/rvv/extractelt-int-rv32.ll b/llvm/test/CodeGen/RISCV/rvv/extractelt-int-rv32.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/RISCV/rvv/extractelt-int-rv32.ll @@ -0,0 +1,796 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; RUN: llc -mtriple=riscv32 -mattr=+d,+experimental-zfh,+experimental-v -target-abi=ilp32d \ +; RUN: -verify-machineinstrs < %s | FileCheck %s + +define i8 @extractelt_nxv1i8_0( %v) { +; CHECK-LABEL: extractelt_nxv1i8_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e8,mf8,ta,mu +; CHECK-NEXT: vmv.x.s a0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret i8 %r +} + +define i8 @extractelt_nxv1i8_imm( %v) { +; CHECK-LABEL: extractelt_nxv1i8_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e8,mf8,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e8,mf8,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret i8 %r +} + +define i8 @extractelt_nxv1i8_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv1i8_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e8,mf8,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e8,mf8,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret i8 %r +} + +define i8 @extractelt_nxv2i8_0( %v) { +; CHECK-LABEL: extractelt_nxv2i8_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e8,mf4,ta,mu +; CHECK-NEXT: vmv.x.s a0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret i8 %r +} + +define i8 @extractelt_nxv2i8_imm( %v) { +; CHECK-LABEL: extractelt_nxv2i8_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e8,mf4,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e8,mf4,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret i8 %r +} + +define i8 @extractelt_nxv2i8_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv2i8_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e8,mf4,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e8,mf4,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret i8 %r +} + +define i8 @extractelt_nxv4i8_0( %v) { +; CHECK-LABEL: extractelt_nxv4i8_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e8,mf2,ta,mu +; CHECK-NEXT: vmv.x.s a0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret i8 %r +} + +define i8 @extractelt_nxv4i8_imm( %v) { +; CHECK-LABEL: extractelt_nxv4i8_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e8,mf2,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e8,mf2,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret i8 %r +} + +define i8 @extractelt_nxv4i8_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv4i8_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e8,mf2,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e8,mf2,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret i8 %r +} + +define i8 @extractelt_nxv8i8_0( %v) { +; CHECK-LABEL: extractelt_nxv8i8_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e8,m1,ta,mu +; 
CHECK-NEXT: vmv.x.s a0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret i8 %r +} + +define i8 @extractelt_nxv8i8_imm( %v) { +; CHECK-LABEL: extractelt_nxv8i8_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e8,m1,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e8,m1,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret i8 %r +} + +define i8 @extractelt_nxv8i8_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv8i8_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e8,m1,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e8,m1,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret i8 %r +} + +define i8 @extractelt_nxv16i8_0( %v) { +; CHECK-LABEL: extractelt_nxv16i8_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e8,m2,ta,mu +; CHECK-NEXT: vmv.x.s a0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret i8 %r +} + +define i8 @extractelt_nxv16i8_imm( %v) { +; CHECK-LABEL: extractelt_nxv16i8_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e8,m2,tu,mu +; CHECK-NEXT: vslidedown.vi v26, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e8,m2,ta,mu +; CHECK-NEXT: vmv.x.s a0, v26 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret i8 %r +} + +define i8 @extractelt_nxv16i8_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv16i8_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e8,m2,tu,mu +; CHECK-NEXT: vslidedown.vx v26, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e8,m2,ta,mu +; CHECK-NEXT: vmv.x.s a0, v26 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret i8 %r +} + +define i8 @extractelt_nxv32i8_0( %v) { +; CHECK-LABEL: extractelt_nxv32i8_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e8,m4,ta,mu +; CHECK-NEXT: vmv.x.s a0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret i8 %r +} + +define i8 @extractelt_nxv32i8_imm( %v) { +; CHECK-LABEL: extractelt_nxv32i8_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e8,m4,tu,mu +; CHECK-NEXT: vslidedown.vi v28, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e8,m4,ta,mu +; CHECK-NEXT: vmv.x.s a0, v28 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret i8 %r +} + +define i8 @extractelt_nxv32i8_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv32i8_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e8,m4,tu,mu +; CHECK-NEXT: vslidedown.vx v28, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e8,m4,ta,mu +; CHECK-NEXT: vmv.x.s a0, v28 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret i8 %r +} + +define i8 @extractelt_nxv64i8_0( %v) { +; CHECK-LABEL: extractelt_nxv64i8_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e8,m8,ta,mu +; CHECK-NEXT: vmv.x.s a0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret i8 %r +} + +define i8 @extractelt_nxv64i8_imm( %v) { +; CHECK-LABEL: extractelt_nxv64i8_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e8,m8,tu,mu +; CHECK-NEXT: vslidedown.vi v8, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e8,m8,ta,mu +; CHECK-NEXT: vmv.x.s a0, v8 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret i8 %r +} + +define i8 @extractelt_nxv64i8_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv64i8_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e8,m8,tu,mu +; CHECK-NEXT: vslidedown.vx v8, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e8,m8,ta,mu +; CHECK-NEXT: vmv.x.s a0, v8 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret i8 %r +} + +define i16 
@extractelt_nxv1i16_0( %v) { +; CHECK-LABEL: extractelt_nxv1i16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e16,mf4,ta,mu +; CHECK-NEXT: vmv.x.s a0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret i16 %r +} + +define i16 @extractelt_nxv1i16_imm( %v) { +; CHECK-LABEL: extractelt_nxv1i16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e16,mf4,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e16,mf4,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret i16 %r +} + +define i16 @extractelt_nxv1i16_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv1i16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e16,mf4,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e16,mf4,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret i16 %r +} + +define i16 @extractelt_nxv2i16_0( %v) { +; CHECK-LABEL: extractelt_nxv2i16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e16,mf2,ta,mu +; CHECK-NEXT: vmv.x.s a0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret i16 %r +} + +define i16 @extractelt_nxv2i16_imm( %v) { +; CHECK-LABEL: extractelt_nxv2i16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e16,mf2,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e16,mf2,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret i16 %r +} + +define i16 @extractelt_nxv2i16_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv2i16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e16,mf2,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e16,mf2,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret i16 %r +} + +define i16 @extractelt_nxv4i16_0( %v) { +; CHECK-LABEL: extractelt_nxv4i16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e16,m1,ta,mu +; CHECK-NEXT: vmv.x.s a0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret i16 %r +} + +define i16 @extractelt_nxv4i16_imm( %v) { +; CHECK-LABEL: extractelt_nxv4i16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e16,m1,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e16,m1,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret i16 %r +} + +define i16 @extractelt_nxv4i16_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv4i16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e16,m1,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e16,m1,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret i16 %r +} + +define i16 @extractelt_nxv8i16_0( %v) { +; CHECK-LABEL: extractelt_nxv8i16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e16,m2,ta,mu +; CHECK-NEXT: vmv.x.s a0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret i16 %r +} + +define i16 @extractelt_nxv8i16_imm( %v) { +; CHECK-LABEL: extractelt_nxv8i16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e16,m2,tu,mu +; CHECK-NEXT: vslidedown.vi v26, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e16,m2,ta,mu +; CHECK-NEXT: vmv.x.s a0, v26 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret i16 %r +} + +define i16 @extractelt_nxv8i16_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv8i16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e16,m2,tu,mu +; 
CHECK-NEXT: vslidedown.vx v26, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e16,m2,ta,mu +; CHECK-NEXT: vmv.x.s a0, v26 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret i16 %r +} + +define i16 @extractelt_nxv16i16_0( %v) { +; CHECK-LABEL: extractelt_nxv16i16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e16,m4,ta,mu +; CHECK-NEXT: vmv.x.s a0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret i16 %r +} + +define i16 @extractelt_nxv16i16_imm( %v) { +; CHECK-LABEL: extractelt_nxv16i16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e16,m4,tu,mu +; CHECK-NEXT: vslidedown.vi v28, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e16,m4,ta,mu +; CHECK-NEXT: vmv.x.s a0, v28 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret i16 %r +} + +define i16 @extractelt_nxv16i16_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv16i16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e16,m4,tu,mu +; CHECK-NEXT: vslidedown.vx v28, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e16,m4,ta,mu +; CHECK-NEXT: vmv.x.s a0, v28 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret i16 %r +} + +define i16 @extractelt_nxv32i16_0( %v) { +; CHECK-LABEL: extractelt_nxv32i16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e16,m8,ta,mu +; CHECK-NEXT: vmv.x.s a0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret i16 %r +} + +define i16 @extractelt_nxv32i16_imm( %v) { +; CHECK-LABEL: extractelt_nxv32i16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e16,m8,tu,mu +; CHECK-NEXT: vslidedown.vi v8, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e16,m8,ta,mu +; CHECK-NEXT: vmv.x.s a0, v8 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret i16 %r +} + +define i16 @extractelt_nxv32i16_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv32i16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e16,m8,tu,mu +; CHECK-NEXT: vslidedown.vx v8, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e16,m8,ta,mu +; CHECK-NEXT: vmv.x.s a0, v8 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret i16 %r +} + +define i32 @extractelt_nxv1i32_0( %v) { +; CHECK-LABEL: extractelt_nxv1i32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e32,mf2,ta,mu +; CHECK-NEXT: vmv.x.s a0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret i32 %r +} + +define i32 @extractelt_nxv1i32_imm( %v) { +; CHECK-LABEL: extractelt_nxv1i32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,mf2,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e32,mf2,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 2 + ret i32 %r +} + +define i32 @extractelt_nxv1i32_idx( %v, i32 %idx) { +; CHECK-LABEL: extractelt_nxv1i32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,mf2,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli zero, zero, e32,mf2,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = extractelement %v, i32 %idx + ret i32 %r +} + +define i32 @extractelt_nxv2i32_0( %v) { +; CHECK-LABEL: extractelt_nxv2i32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli zero, zero, e32,m1,ta,mu +; CHECK-NEXT: vmv.x.s a0, v16 +; CHECK-NEXT: ret + %r = extractelement %v, i32 0 + ret i32 %r +} + +define i32 @extractelt_nxv2i32_imm( %v) { +; CHECK-LABEL: extractelt_nxv2i32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m1,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 2 +; CHECK-NEXT: vsetvli zero, zero, e32,m1,ta,mu +; CHECK-NEXT: vmv.x.s a0, v25 +; CHECK-NEXT: ret + %r = 
extractelement <vscale x 2 x i32> %v, i32 2
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv2i32_idx(<vscale x 2 x i32> %v, i32 %idx) {
+; CHECK-LABEL: extractelt_nxv2i32_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e32,m1,tu,mu
+; CHECK-NEXT: vslidedown.vx v25, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e32,m1,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 2 x i32> %v, i32 %idx
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv4i32_0(<vscale x 4 x i32> %v) {
+; CHECK-LABEL: extractelt_nxv4i32_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e32,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i32> %v, i32 0
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv4i32_imm(<vscale x 4 x i32> %v) {
+; CHECK-LABEL: extractelt_nxv4i32_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e32,m2,tu,mu
+; CHECK-NEXT: vslidedown.vi v26, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e32,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v26
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i32> %v, i32 2
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv4i32_idx(<vscale x 4 x i32> %v, i32 %idx) {
+; CHECK-LABEL: extractelt_nxv4i32_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e32,m2,tu,mu
+; CHECK-NEXT: vslidedown.vx v26, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e32,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v26
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i32> %v, i32 %idx
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv8i32_0(<vscale x 8 x i32> %v) {
+; CHECK-LABEL: extractelt_nxv8i32_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e32,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i32> %v, i32 0
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv8i32_imm(<vscale x 8 x i32> %v) {
+; CHECK-LABEL: extractelt_nxv8i32_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e32,m4,tu,mu
+; CHECK-NEXT: vslidedown.vi v28, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e32,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v28
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i32> %v, i32 2
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv8i32_idx(<vscale x 8 x i32> %v, i32 %idx) {
+; CHECK-LABEL: extractelt_nxv8i32_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e32,m4,tu,mu
+; CHECK-NEXT: vslidedown.vx v28, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e32,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v28
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i32> %v, i32 %idx
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv16i32_0(<vscale x 16 x i32> %v) {
+; CHECK-LABEL: extractelt_nxv16i32_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e32,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 16 x i32> %v, i32 0
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv16i32_imm(<vscale x 16 x i32> %v) {
+; CHECK-LABEL: extractelt_nxv16i32_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e32,m8,tu,mu
+; CHECK-NEXT: vslidedown.vi v8, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e32,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v8
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 16 x i32> %v, i32 2
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv16i32_idx(<vscale x 16 x i32> %v, i32 %idx) {
+; CHECK-LABEL: extractelt_nxv16i32_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e32,m8,tu,mu
+; CHECK-NEXT: vslidedown.vx v8, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e32,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v8
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 16 x i32> %v, i32 %idx
+  ret i32 %r
+}
+
+define i64 @extractelt_nxv1i64_0(<vscale x 1 x i64> %v) {
+; CHECK-LABEL: extractelt_nxv1i64_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: addi a0, zero, 32
+; CHECK-NEXT: vsetvli a1, zero, e64,m1,ta,mu
+; CHECK-NEXT: vsrl.vx v25, v16, a0
+; CHECK-NEXT: vmv.x.s a1, v25
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 1 x i64> %v, i32 0
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv1i64_imm(<vscale x 1 x i64> %v) {
+; CHECK-LABEL: extractelt_nxv1i64_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e64,m1,tu,mu
+; CHECK-NEXT: vslidedown.vi v25, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e64,m1,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: addi a1, zero, 32
+; CHECK-NEXT: vsetvli a2, zero, e64,m1,ta,mu
+; CHECK-NEXT: vsrl.vx v25, v25, a1
+; CHECK-NEXT: vmv.x.s a1, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 1 x i64> %v, i32 2
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv1i64_idx(<vscale x 1 x i64> %v, i32 %idx) {
+; CHECK-LABEL: extractelt_nxv1i64_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e64,m1,tu,mu
+; CHECK-NEXT: vslidedown.vx v25, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e64,m1,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: addi a1, zero, 32
+; CHECK-NEXT: vsetvli a2, zero, e64,m1,ta,mu
+; CHECK-NEXT: vsrl.vx v25, v25, a1
+; CHECK-NEXT: vmv.x.s a1, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 1 x i64> %v, i32 %idx
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv2i64_0(<vscale x 2 x i64> %v) {
+; CHECK-LABEL: extractelt_nxv2i64_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: addi a0, zero, 32
+; CHECK-NEXT: vsetvli a1, zero, e64,m2,ta,mu
+; CHECK-NEXT: vsrl.vx v26, v16, a0
+; CHECK-NEXT: vmv.x.s a1, v26
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 2 x i64> %v, i32 0
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv2i64_imm(<vscale x 2 x i64> %v) {
+; CHECK-LABEL: extractelt_nxv2i64_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e64,m2,tu,mu
+; CHECK-NEXT: vslidedown.vi v26, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e64,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v26
+; CHECK-NEXT: addi a1, zero, 32
+; CHECK-NEXT: vsetvli a2, zero, e64,m2,ta,mu
+; CHECK-NEXT: vsrl.vx v26, v26, a1
+; CHECK-NEXT: vmv.x.s a1, v26
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 2 x i64> %v, i32 2
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv2i64_idx(<vscale x 2 x i64> %v, i32 %idx) {
+; CHECK-LABEL: extractelt_nxv2i64_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e64,m2,tu,mu
+; CHECK-NEXT: vslidedown.vx v26, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e64,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v26
+; CHECK-NEXT: addi a1, zero, 32
+; CHECK-NEXT: vsetvli a2, zero, e64,m2,ta,mu
+; CHECK-NEXT: vsrl.vx v26, v26, a1
+; CHECK-NEXT: vmv.x.s a1, v26
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 2 x i64> %v, i32 %idx
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv4i64_0(<vscale x 4 x i64> %v) {
+; CHECK-LABEL: extractelt_nxv4i64_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: addi a0, zero, 32
+; CHECK-NEXT: vsetvli a1, zero, e64,m4,ta,mu
+; CHECK-NEXT: vsrl.vx v28, v16, a0
+; CHECK-NEXT: vmv.x.s a1, v28
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i64> %v, i32 0
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv4i64_imm(<vscale x 4 x i64> %v) {
+; CHECK-LABEL: extractelt_nxv4i64_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e64,m4,tu,mu
+; CHECK-NEXT: vslidedown.vi v28, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e64,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v28
+; CHECK-NEXT: addi a1, zero, 32
+; CHECK-NEXT: vsetvli a2, zero, e64,m4,ta,mu
+; CHECK-NEXT: vsrl.vx v28, v28, a1
+; CHECK-NEXT: vmv.x.s a1, v28
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i64> %v, i32 2
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv4i64_idx(<vscale x 4 x i64> %v, i32 %idx) {
+; CHECK-LABEL: extractelt_nxv4i64_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e64,m4,tu,mu
+; CHECK-NEXT: vslidedown.vx v28, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e64,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v28
+; CHECK-NEXT: addi a1, zero, 32
+; CHECK-NEXT: vsetvli a2, zero, e64,m4,ta,mu
+; CHECK-NEXT: vsrl.vx v28, v28, a1
+; CHECK-NEXT: vmv.x.s a1, v28
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i64> %v, i32 %idx
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv8i64_0(<vscale x 8 x i64> %v) {
+; CHECK-LABEL: extractelt_nxv8i64_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: addi a0, zero, 32
+; CHECK-NEXT: vsetvli a1, zero, e64,m8,ta,mu
+; CHECK-NEXT: vsrl.vx v8, v16, a0
+; CHECK-NEXT: vmv.x.s a1, v8
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i64> %v, i32 0
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv8i64_imm(<vscale x 8 x i64> %v) {
+; CHECK-LABEL: extractelt_nxv8i64_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e64,m8,tu,mu
+; CHECK-NEXT: vslidedown.vi v8, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e64,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v8
+; CHECK-NEXT: addi a1, zero, 32
+; CHECK-NEXT: vsetvli a2, zero, e64,m8,ta,mu
+; CHECK-NEXT: vsrl.vx v8, v8, a1
+; CHECK-NEXT: vmv.x.s a1, v8
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i64> %v, i32 2
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv8i64_idx(<vscale x 8 x i64> %v, i32 %idx) {
+; CHECK-LABEL: extractelt_nxv8i64_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e64,m8,tu,mu
+; CHECK-NEXT: vslidedown.vx v8, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e64,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v8
+; CHECK-NEXT: addi a1, zero, 32
+; CHECK-NEXT: vsetvli a2, zero, e64,m8,ta,mu
+; CHECK-NEXT: vsrl.vx v8, v8, a1
+; CHECK-NEXT: vmv.x.s a1, v8
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i64> %v, i32 %idx
+  ret i64 %r
+}
+
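The RV32 i64 cases above exercise the custom EXTRACT_VECTOR_ELT legalization: the element is slid down to index 0, its low 32 bits are read with vmv.x.s, the element is shifted right by 32 with vsrl.vx, and a second vmv.x.s reads the high bits. A minimal scalar sketch of the recombination the two reads feed into (the helper name is illustrative, not part of the patch):

  #include <cstdint>

  // Models the BUILD_PAIR of the two vmv.x.s results (EltLo, EltHi)
  // into the i64 value returned on RV32.
  uint64_t buildPair64(uint32_t EltLo, uint32_t EltHi) {
    return (static_cast<uint64_t>(EltHi) << 32) | EltLo;
  }
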
diff --git a/llvm/test/CodeGen/RISCV/rvv/extractelt-int-rv64.ll b/llvm/test/CodeGen/RISCV/rvv/extractelt-int-rv64.ll
new file mode 100644
--- /dev/null
+++ b/llvm/test/CodeGen/RISCV/rvv/extractelt-int-rv64.ll
@@ -0,0 +1,752 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc -mtriple=riscv64 -mattr=+d,+experimental-zfh,+experimental-v -target-abi=lp64d \
+; RUN:   -verify-machineinstrs < %s | FileCheck %s
+
+define i8 @extractelt_nxv1i8_0(<vscale x 1 x i8> %v) {
+; CHECK-LABEL: extractelt_nxv1i8_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e8,mf8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 1 x i8> %v, i32 0
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv1i8_imm(<vscale x 1 x i8> %v) {
+; CHECK-LABEL: extractelt_nxv1i8_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e8,mf8,tu,mu
+; CHECK-NEXT: vslidedown.vi v25, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e8,mf8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 1 x i8> %v, i32 2
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv1i8_idx(<vscale x 1 x i8> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv1i8_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e8,mf8,tu,mu
+; CHECK-NEXT: vslidedown.vx v25, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e8,mf8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 1 x i8> %v, i32 %idx
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv2i8_0(<vscale x 2 x i8> %v) {
+; CHECK-LABEL: extractelt_nxv2i8_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e8,mf4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 2 x i8> %v, i32 0
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv2i8_imm(<vscale x 2 x i8> %v) {
+; CHECK-LABEL: extractelt_nxv2i8_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e8,mf4,tu,mu
+; CHECK-NEXT: vslidedown.vi v25, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e8,mf4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 2 x i8> %v, i32 2
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv2i8_idx(<vscale x 2 x i8> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv2i8_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e8,mf4,tu,mu
+; CHECK-NEXT: vslidedown.vx v25, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e8,mf4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 2 x i8> %v, i32 %idx
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv4i8_0(<vscale x 4 x i8> %v) {
+; CHECK-LABEL: extractelt_nxv4i8_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e8,mf2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i8> %v, i32 0
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv4i8_imm(<vscale x 4 x i8> %v) {
+; CHECK-LABEL: extractelt_nxv4i8_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e8,mf2,tu,mu
+; CHECK-NEXT: vslidedown.vi v25, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e8,mf2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i8> %v, i32 2
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv4i8_idx(<vscale x 4 x i8> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv4i8_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e8,mf2,tu,mu
+; CHECK-NEXT: vslidedown.vx v25, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e8,mf2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i8> %v, i32 %idx
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv8i8_0(<vscale x 8 x i8> %v) {
+; CHECK-LABEL: extractelt_nxv8i8_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e8,m1,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i8> %v, i32 0
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv8i8_imm(<vscale x 8 x i8> %v) {
+; CHECK-LABEL: extractelt_nxv8i8_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e8,m1,tu,mu
+; CHECK-NEXT: vslidedown.vi v25, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e8,m1,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i8> %v, i32 2
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv8i8_idx(<vscale x 8 x i8> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv8i8_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e8,m1,tu,mu
+; CHECK-NEXT: vslidedown.vx v25, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e8,m1,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i8> %v, i32 %idx
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv16i8_0(<vscale x 16 x i8> %v) {
+; CHECK-LABEL: extractelt_nxv16i8_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e8,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 16 x i8> %v, i32 0
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv16i8_imm(<vscale x 16 x i8> %v) {
+; CHECK-LABEL: extractelt_nxv16i8_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e8,m2,tu,mu
+; CHECK-NEXT: vslidedown.vi v26, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e8,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v26
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 16 x i8> %v, i32 2
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv16i8_idx(<vscale x 16 x i8> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv16i8_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e8,m2,tu,mu
+; CHECK-NEXT: vslidedown.vx v26, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e8,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v26
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 16 x i8> %v, i32 %idx
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv32i8_0(<vscale x 32 x i8> %v) {
+; CHECK-LABEL: extractelt_nxv32i8_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e8,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 32 x i8> %v, i32 0
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv32i8_imm(<vscale x 32 x i8> %v) {
+; CHECK-LABEL: extractelt_nxv32i8_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e8,m4,tu,mu
+; CHECK-NEXT: vslidedown.vi v28, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e8,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v28
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 32 x i8> %v, i32 2
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv32i8_idx(<vscale x 32 x i8> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv32i8_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e8,m4,tu,mu
+; CHECK-NEXT: vslidedown.vx v28, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e8,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v28
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 32 x i8> %v, i32 %idx
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv64i8_0(<vscale x 64 x i8> %v) {
+; CHECK-LABEL: extractelt_nxv64i8_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e8,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 64 x i8> %v, i32 0
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv64i8_imm(<vscale x 64 x i8> %v) {
+; CHECK-LABEL: extractelt_nxv64i8_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e8,m8,tu,mu
+; CHECK-NEXT: vslidedown.vi v8, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e8,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v8
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 64 x i8> %v, i32 2
+  ret i8 %r
+}
+
+define i8 @extractelt_nxv64i8_idx(<vscale x 64 x i8> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv64i8_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e8,m8,tu,mu
+; CHECK-NEXT: vslidedown.vx v8, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e8,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v8
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 64 x i8> %v, i32 %idx
+  ret i8 %r
+}
+
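Note that none of the i8 cases above needs an explicit extension after vmv.x.s: when SEW is narrower than XLEN, vmv.x.s sign-extends element 0 into the scalar register. An illustrative model of that behaviour for SEW=8 on RV64 (the function name is hypothetical):

  #include <cstdint>

  // vmv.x.s with SEW=8, XLEN=64: element 0 is sign-extended to the
  // full register width.
  int64_t vmv_x_s_e8(int8_t Elt0) {
    return static_cast<int64_t>(Elt0);
  }

The i16 cases that follow rely on the same property.
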
+define i16 @extractelt_nxv1i16_0(<vscale x 1 x i16> %v) {
+; CHECK-LABEL: extractelt_nxv1i16_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e16,mf4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 1 x i16> %v, i32 0
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv1i16_imm(<vscale x 1 x i16> %v) {
+; CHECK-LABEL: extractelt_nxv1i16_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e16,mf4,tu,mu
+; CHECK-NEXT: vslidedown.vi v25, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e16,mf4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 1 x i16> %v, i32 2
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv1i16_idx(<vscale x 1 x i16> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv1i16_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e16,mf4,tu,mu
+; CHECK-NEXT: vslidedown.vx v25, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e16,mf4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 1 x i16> %v, i32 %idx
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv2i16_0(<vscale x 2 x i16> %v) {
+; CHECK-LABEL: extractelt_nxv2i16_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e16,mf2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 2 x i16> %v, i32 0
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv2i16_imm(<vscale x 2 x i16> %v) {
+; CHECK-LABEL: extractelt_nxv2i16_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e16,mf2,tu,mu
+; CHECK-NEXT: vslidedown.vi v25, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e16,mf2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 2 x i16> %v, i32 2
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv2i16_idx(<vscale x 2 x i16> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv2i16_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e16,mf2,tu,mu
+; CHECK-NEXT: vslidedown.vx v25, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e16,mf2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 2 x i16> %v, i32 %idx
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv4i16_0(<vscale x 4 x i16> %v) {
+; CHECK-LABEL: extractelt_nxv4i16_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e16,m1,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i16> %v, i32 0
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv4i16_imm(<vscale x 4 x i16> %v) {
+; CHECK-LABEL: extractelt_nxv4i16_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e16,m1,tu,mu
+; CHECK-NEXT: vslidedown.vi v25, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e16,m1,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i16> %v, i32 2
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv4i16_idx(<vscale x 4 x i16> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv4i16_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e16,m1,tu,mu
+; CHECK-NEXT: vslidedown.vx v25, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e16,m1,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i16> %v, i32 %idx
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv8i16_0(<vscale x 8 x i16> %v) {
+; CHECK-LABEL: extractelt_nxv8i16_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e16,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i16> %v, i32 0
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv8i16_imm(<vscale x 8 x i16> %v) {
+; CHECK-LABEL: extractelt_nxv8i16_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e16,m2,tu,mu
+; CHECK-NEXT: vslidedown.vi v26, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e16,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v26
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i16> %v, i32 2
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv8i16_idx(<vscale x 8 x i16> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv8i16_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e16,m2,tu,mu
+; CHECK-NEXT: vslidedown.vx v26, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e16,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v26
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i16> %v, i32 %idx
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv16i16_0(<vscale x 16 x i16> %v) {
+; CHECK-LABEL: extractelt_nxv16i16_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e16,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 16 x i16> %v, i32 0
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv16i16_imm(<vscale x 16 x i16> %v) {
+; CHECK-LABEL: extractelt_nxv16i16_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e16,m4,tu,mu
+; CHECK-NEXT: vslidedown.vi v28, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e16,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v28
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 16 x i16> %v, i32 2
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv16i16_idx(<vscale x 16 x i16> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv16i16_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e16,m4,tu,mu
+; CHECK-NEXT: vslidedown.vx v28, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e16,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v28
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 16 x i16> %v, i32 %idx
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv32i16_0(<vscale x 32 x i16> %v) {
+; CHECK-LABEL: extractelt_nxv32i16_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e16,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 32 x i16> %v, i32 0
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv32i16_imm(<vscale x 32 x i16> %v) {
+; CHECK-LABEL: extractelt_nxv32i16_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e16,m8,tu,mu
+; CHECK-NEXT: vslidedown.vi v8, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e16,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v8
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 32 x i16> %v, i32 2
+  ret i16 %r
+}
+
+define i16 @extractelt_nxv32i16_idx(<vscale x 32 x i16> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv32i16_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e16,m8,tu,mu
+; CHECK-NEXT: vslidedown.vx v8, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e16,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v8
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 32 x i16> %v, i32 %idx
+  ret i16 %r
+}
+
+define i32 @extractelt_nxv1i32_0(<vscale x 1 x i32> %v) {
+; CHECK-LABEL: extractelt_nxv1i32_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e32,mf2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 1 x i32> %v, i32 0
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv1i32_imm(<vscale x 1 x i32> %v) {
+; CHECK-LABEL: extractelt_nxv1i32_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e32,mf2,tu,mu
+; CHECK-NEXT: vslidedown.vi v25, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e32,mf2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 1 x i32> %v, i32 2
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv1i32_idx(<vscale x 1 x i32> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv1i32_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e32,mf2,tu,mu
+; CHECK-NEXT: vslidedown.vx v25, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e32,mf2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 1 x i32> %v, i32 %idx
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv2i32_0(<vscale x 2 x i32> %v) {
+; CHECK-LABEL: extractelt_nxv2i32_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e32,m1,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 2 x i32> %v, i32 0
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv2i32_imm(<vscale x 2 x i32> %v) {
+; CHECK-LABEL: extractelt_nxv2i32_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e32,m1,tu,mu
+; CHECK-NEXT: vslidedown.vi v25, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e32,m1,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 2 x i32> %v, i32 2
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv2i32_idx(<vscale x 2 x i32> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv2i32_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e32,m1,tu,mu
+; CHECK-NEXT: vslidedown.vx v25, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e32,m1,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 2 x i32> %v, i32 %idx
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv4i32_0(<vscale x 4 x i32> %v) {
+; CHECK-LABEL: extractelt_nxv4i32_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e32,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i32> %v, i32 0
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv4i32_imm(<vscale x 4 x i32> %v) {
+; CHECK-LABEL: extractelt_nxv4i32_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e32,m2,tu,mu
+; CHECK-NEXT: vslidedown.vi v26, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e32,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v26
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i32> %v, i32 2
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv4i32_idx(<vscale x 4 x i32> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv4i32_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e32,m2,tu,mu
+; CHECK-NEXT: vslidedown.vx v26, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e32,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v26
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i32> %v, i32 %idx
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv8i32_0(<vscale x 8 x i32> %v) {
+; CHECK-LABEL: extractelt_nxv8i32_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e32,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i32> %v, i32 0
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv8i32_imm(<vscale x 8 x i32> %v) {
+; CHECK-LABEL: extractelt_nxv8i32_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e32,m4,tu,mu
+; CHECK-NEXT: vslidedown.vi v28, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e32,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v28
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i32> %v, i32 2
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv8i32_idx(<vscale x 8 x i32> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv8i32_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e32,m4,tu,mu
+; CHECK-NEXT: vslidedown.vx v28, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e32,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v28
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i32> %v, i32 %idx
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv16i32_0(<vscale x 16 x i32> %v) {
+; CHECK-LABEL: extractelt_nxv16i32_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e32,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 16 x i32> %v, i32 0
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv16i32_imm(<vscale x 16 x i32> %v) {
+; CHECK-LABEL: extractelt_nxv16i32_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e32,m8,tu,mu
+; CHECK-NEXT: vslidedown.vi v8, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e32,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v8
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 16 x i32> %v, i32 2
+  ret i32 %r
+}
+
+define i32 @extractelt_nxv16i32_idx(<vscale x 16 x i32> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv16i32_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e32,m8,tu,mu
+; CHECK-NEXT: vslidedown.vx v8, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e32,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v8
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 16 x i32> %v, i32 %idx
+  ret i32 %r
+}
+
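The i64 cases that follow show the contrast with the RV32 file earlier in this patch: on RV64, SEW equals XLEN, so a single vmv.x.s (preceded by a vslidedown for nonzero indices) moves the whole element, and no hi/lo split or BUILD_PAIR is needed.
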
+define i64 @extractelt_nxv1i64_0(<vscale x 1 x i64> %v) {
+; CHECK-LABEL: extractelt_nxv1i64_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e64,m1,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 1 x i64> %v, i32 0
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv1i64_imm(<vscale x 1 x i64> %v) {
+; CHECK-LABEL: extractelt_nxv1i64_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e64,m1,tu,mu
+; CHECK-NEXT: vslidedown.vi v25, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e64,m1,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 1 x i64> %v, i32 2
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv1i64_idx(<vscale x 1 x i64> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv1i64_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e64,m1,tu,mu
+; CHECK-NEXT: vslidedown.vx v25, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e64,m1,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v25
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 1 x i64> %v, i32 %idx
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv2i64_0(<vscale x 2 x i64> %v) {
+; CHECK-LABEL: extractelt_nxv2i64_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e64,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 2 x i64> %v, i32 0
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv2i64_imm(<vscale x 2 x i64> %v) {
+; CHECK-LABEL: extractelt_nxv2i64_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e64,m2,tu,mu
+; CHECK-NEXT: vslidedown.vi v26, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e64,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v26
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 2 x i64> %v, i32 2
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv2i64_idx(<vscale x 2 x i64> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv2i64_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e64,m2,tu,mu
+; CHECK-NEXT: vslidedown.vx v26, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e64,m2,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v26
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 2 x i64> %v, i32 %idx
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv4i64_0(<vscale x 4 x i64> %v) {
+; CHECK-LABEL: extractelt_nxv4i64_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e64,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i64> %v, i32 0
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv4i64_imm(<vscale x 4 x i64> %v) {
+; CHECK-LABEL: extractelt_nxv4i64_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e64,m4,tu,mu
+; CHECK-NEXT: vslidedown.vi v28, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e64,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v28
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i64> %v, i32 2
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv4i64_idx(<vscale x 4 x i64> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv4i64_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e64,m4,tu,mu
+; CHECK-NEXT: vslidedown.vx v28, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e64,m4,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v28
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 4 x i64> %v, i32 %idx
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv8i64_0(<vscale x 8 x i64> %v) {
+; CHECK-LABEL: extractelt_nxv8i64_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli zero, zero, e64,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v16
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i64> %v, i32 0
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv8i64_imm(<vscale x 8 x i64> %v) {
+; CHECK-LABEL: extractelt_nxv8i64_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e64,m8,tu,mu
+; CHECK-NEXT: vslidedown.vi v8, v16, 2
+; CHECK-NEXT: vsetvli zero, zero, e64,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v8
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i64> %v, i32 2
+  ret i64 %r
+}
+
+define i64 @extractelt_nxv8i64_idx(<vscale x 8 x i64> %v, i32 signext %idx) {
+; CHECK-LABEL: extractelt_nxv8i64_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e64,m8,tu,mu
+; CHECK-NEXT: vslidedown.vx v8, v16, a0
+; CHECK-NEXT: vsetvli zero, zero, e64,m8,ta,mu
+; CHECK-NEXT: vmv.x.s a0, v8
+; CHECK-NEXT: ret
+  %r = extractelement <vscale x 8 x i64> %v, i32 %idx
+  ret i64 %r
+}
+
diff --git a/llvm/test/CodeGen/RISCV/rvv/insertelt-fp-rv32.ll b/llvm/test/CodeGen/RISCV/rvv/insertelt-fp-rv32.ll
new file mode 100644
--- /dev/null
+++ b/llvm/test/CodeGen/RISCV/rvv/insertelt-fp-rv32.ll
@@ -0,0 +1,592 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc -mtriple=riscv32 -mattr=+d,+experimental-zfh,+experimental-v -target-abi=ilp32d \
+; RUN:   -verify-machineinstrs < %s | FileCheck %s
+
+define <vscale x 1 x half> @insertelt_nxv1f16_0(<vscale x 1 x half> %v, half %elt) {
+; CHECK-LABEL: insertelt_nxv1f16_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a0, zero, e16,mf4,ta,mu
+; CHECK-NEXT: vfmv.s.f v16, fa0
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 1 x half> %v, half %elt, i32 0
+  ret <vscale x 1 x half> %r
+}
+
+define <vscale x 1 x half> @insertelt_nxv1f16_imm(<vscale x 1 x half> %v, half %elt) {
+; CHECK-LABEL: insertelt_nxv1f16_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a0, zero, e16,mf4,tu,mu
+; CHECK-NEXT: vslidedown.vi v25, v16, 3
+; CHECK-NEXT: vsetvli a0, zero, e16,mf4,ta,mu
+; CHECK-NEXT: vfmv.s.f v25, fa0
+; CHECK-NEXT: vsetvli a0, zero, e16,mf4,tu,mu
+; CHECK-NEXT: vslideup.vi v16, v25, 3
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 1 x half> %v, half %elt, i32 3
+  ret <vscale x 1 x half> %r
+}
+
+define <vscale x 1 x half> @insertelt_nxv1f16_idx(<vscale x 1 x half> %v, half %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv1f16_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a1, zero, e16,mf4,tu,mu
+; CHECK-NEXT: vslidedown.vx v25, v16, a0
+; CHECK-NEXT: vsetvli a1, zero, e16,mf4,ta,mu
+; CHECK-NEXT: vfmv.s.f v25, fa0
+; CHECK-NEXT: vsetvli a1, zero, e16,mf4,tu,mu
+; CHECK-NEXT: vslideup.vx v16, v25, a0
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 1 x half> %v, half %elt, i32 %idx
+  ret <vscale x 1 x half> %r
+}
+
+define <vscale x 2 x half> @insertelt_nxv2f16_0(<vscale x 2 x half> %v, half %elt) {
+; CHECK-LABEL: insertelt_nxv2f16_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a0, zero, e16,mf2,ta,mu
+; CHECK-NEXT: vfmv.s.f v16, fa0
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 2 x half> %v, half %elt, i32 0
+  ret <vscale x 2 x half> %r
+}
+
+define <vscale x 2 x half> @insertelt_nxv2f16_imm(<vscale x 2 x half> %v, half %elt) {
+; CHECK-LABEL: insertelt_nxv2f16_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a0, zero, e16,mf2,tu,mu
+; CHECK-NEXT: vslidedown.vi v25, v16, 3
+; CHECK-NEXT: vsetvli a0, zero, e16,mf2,ta,mu
+; CHECK-NEXT: vfmv.s.f v25, fa0
+; CHECK-NEXT: vsetvli a0, zero, e16,mf2,tu,mu
+; CHECK-NEXT: vslideup.vi v16, v25, 3
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 2 x half> %v, half %elt, i32 3
+  ret <vscale x 2 x half> %r
+}
+
+define <vscale x 2 x half> @insertelt_nxv2f16_idx(<vscale x 2 x half> %v, half %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv2f16_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a1, zero, e16,mf2,tu,mu
+; CHECK-NEXT: vslidedown.vx v25, v16, a0
+; CHECK-NEXT: vsetvli a1, zero, e16,mf2,ta,mu
+; CHECK-NEXT: vfmv.s.f v25, fa0
+; CHECK-NEXT: vsetvli a1, zero, e16,mf2,tu,mu
+; CHECK-NEXT: vslideup.vx v16, v25, a0
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 2 x half> %v, half %elt, i32 %idx
+  ret <vscale x 2 x half> %r
+}
+
+define <vscale x 4 x half> @insertelt_nxv4f16_0(<vscale x 4 x half> %v, half %elt) {
+; CHECK-LABEL: insertelt_nxv4f16_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a0, zero, e16,m1,ta,mu
+; CHECK-NEXT: vfmv.s.f v16, fa0
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 4 x half> %v, half %elt, i32 0
+  ret <vscale x 4 x half> %r
+}
+
+define <vscale x 4 x half> @insertelt_nxv4f16_imm(<vscale x 4 x half> %v, half %elt) {
+; CHECK-LABEL: insertelt_nxv4f16_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a0, zero, e16,m1,tu,mu
+; CHECK-NEXT: vslidedown.vi v25, v16, 3
+; CHECK-NEXT: vsetvli a0, zero, e16,m1,ta,mu
+; CHECK-NEXT: vfmv.s.f v25, fa0
+; CHECK-NEXT: vsetvli a0, zero, e16,m1,tu,mu
+; CHECK-NEXT: vslideup.vi v16, v25, 3
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 4 x half> %v, half %elt, i32 3
+  ret <vscale x 4 x half> %r
+}
+
+define <vscale x 4 x half> @insertelt_nxv4f16_idx(<vscale x 4 x half> %v, half %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv4f16_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a1, zero, e16,m1,tu,mu
+; CHECK-NEXT: vslidedown.vx v25, v16, a0
+; CHECK-NEXT: vsetvli a1, zero, e16,m1,ta,mu
+; CHECK-NEXT: vfmv.s.f v25, fa0
+; CHECK-NEXT: vsetvli a1, zero, e16,m1,tu,mu
+; CHECK-NEXT: vslideup.vx v16, v25, a0
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 4 x half> %v, half %elt, i32 %idx
+  ret <vscale x 4 x half> %r
+}
+
+define <vscale x 8 x half> @insertelt_nxv8f16_0(<vscale x 8 x half> %v, half %elt) {
+; CHECK-LABEL: insertelt_nxv8f16_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a0, zero, e16,m2,ta,mu
+; CHECK-NEXT: vfmv.s.f v16, fa0
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 8 x half> %v, half %elt, i32 0
+  ret <vscale x 8 x half> %r
+}
+
+define <vscale x 8 x half> @insertelt_nxv8f16_imm(<vscale x 8 x half> %v, half %elt) {
+; CHECK-LABEL: insertelt_nxv8f16_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a0, zero, e16,m2,tu,mu
+; CHECK-NEXT: vslidedown.vi v26, v16, 3
+; CHECK-NEXT: vsetvli a0, zero, e16,m2,ta,mu
+; CHECK-NEXT: vfmv.s.f v26, fa0
+; CHECK-NEXT: vsetvli a0, zero, e16,m2,tu,mu
+; CHECK-NEXT: vslideup.vi v16, v26, 3
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 8 x half> %v, half %elt, i32 3
+  ret <vscale x 8 x half> %r
+}
+
+define <vscale x 8 x half> @insertelt_nxv8f16_idx(<vscale x 8 x half> %v, half %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv8f16_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a1, zero, e16,m2,tu,mu
+; CHECK-NEXT: vslidedown.vx v26, v16, a0
+; CHECK-NEXT: vsetvli a1, zero, e16,m2,ta,mu
+; CHECK-NEXT: vfmv.s.f v26, fa0
+; CHECK-NEXT: vsetvli a1, zero, e16,m2,tu,mu
+; CHECK-NEXT: vslideup.vx v16, v26, a0
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 8 x half> %v, half %elt, i32 %idx
+  ret <vscale x 8 x half> %r
+}
+
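The insert tests in this file all follow the same three-step idiom: a tail-undisturbed vslidedown brings the subvector starting at the target index to element 0, vfmv.s.f overwrites element 0 with the scalar, and a tail-undisturbed vslideup writes the modified subvector back, leaving the elements below the index untouched. A scalar sketch of the net effect, using an in-memory stand-in for the vector register (names are illustrative, not from the patch):

  #include <cstddef>
  #include <vector>

  // Illustrative model of the slidedown / vfmv.s.f / slideup sequence
  // used to lower insertelement in the tests above.
  void insertViaSlides(std::vector<float> &Vec, size_t Idx, float Elt) {
    std::vector<float> Tmp(Vec.size());
    for (size_t I = 0; Idx + I < Vec.size(); ++I) // vslidedown.vx Tmp, Vec, Idx
      Tmp[I] = Vec[Idx + I];
    Tmp[0] = Elt;                                 // vfmv.s.f Tmp, Elt
    for (size_t I = 0; Idx + I < Vec.size(); ++I) // vslideup.vx Vec, Tmp, Idx
      Vec[Idx + I] = Tmp[I];
  }
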
+define <vscale x 16 x half> @insertelt_nxv16f16_0(<vscale x 16 x half> %v, half %elt) {
+; CHECK-LABEL: insertelt_nxv16f16_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a0, zero, e16,m4,ta,mu
+; CHECK-NEXT: vfmv.s.f v16, fa0
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 16 x half> %v, half %elt, i32 0
+  ret <vscale x 16 x half> %r
+}
+
+define <vscale x 16 x half> @insertelt_nxv16f16_imm(<vscale x 16 x half> %v, half %elt) {
+; CHECK-LABEL: insertelt_nxv16f16_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a0, zero, e16,m4,tu,mu
+; CHECK-NEXT: vslidedown.vi v28, v16, 3
+; CHECK-NEXT: vsetvli a0, zero, e16,m4,ta,mu
+; CHECK-NEXT: vfmv.s.f v28, fa0
+; CHECK-NEXT: vsetvli a0, zero, e16,m4,tu,mu
+; CHECK-NEXT: vslideup.vi v16, v28, 3
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 16 x half> %v, half %elt, i32 3
+  ret <vscale x 16 x half> %r
+}
+
+define <vscale x 16 x half> @insertelt_nxv16f16_idx(<vscale x 16 x half> %v, half %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv16f16_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a1, zero, e16,m4,tu,mu
+; CHECK-NEXT: vslidedown.vx v28, v16, a0
+; CHECK-NEXT: vsetvli a1, zero, e16,m4,ta,mu
+; CHECK-NEXT: vfmv.s.f v28, fa0
+; CHECK-NEXT: vsetvli a1, zero, e16,m4,tu,mu
+; CHECK-NEXT: vslideup.vx v16, v28, a0
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 16 x half> %v, half %elt, i32 %idx
+  ret <vscale x 16 x half> %r
+}
+
+define <vscale x 32 x half> @insertelt_nxv32f16_0(<vscale x 32 x half> %v, half %elt) {
+; CHECK-LABEL: insertelt_nxv32f16_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a0, zero, e16,m8,ta,mu
+; CHECK-NEXT: vfmv.s.f v16, fa0
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 32 x half> %v, half %elt, i32 0
+  ret <vscale x 32 x half> %r
+}
+
+define <vscale x 32 x half> @insertelt_nxv32f16_imm(<vscale x 32 x half> %v, half %elt) {
+; CHECK-LABEL: insertelt_nxv32f16_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a0, zero, e16,m8,tu,mu
+; CHECK-NEXT: vslidedown.vi v8, v16, 3
+; CHECK-NEXT: vsetvli a0, zero, e16,m8,ta,mu
+; CHECK-NEXT: vfmv.s.f v8, fa0
+; CHECK-NEXT: vsetvli a0, zero, e16,m8,tu,mu
+; CHECK-NEXT: vslideup.vi v16, v8, 3
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 32 x half> %v, half %elt, i32 3
+  ret <vscale x 32 x half> %r
+}
+
+define <vscale x 32 x half> @insertelt_nxv32f16_idx(<vscale x 32 x half> %v, half %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv32f16_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f
+; CHECK-NEXT: vsetvli a1, zero, e16,m8,tu,mu
+; CHECK-NEXT: vslidedown.vx v8, v16, a0
+; CHECK-NEXT: vsetvli a1, zero, e16,m8,ta,mu
+; CHECK-NEXT: vfmv.s.f v8, fa0
+; CHECK-NEXT: vsetvli a1, zero, e16,m8,tu,mu
+; CHECK-NEXT: vslideup.vx v16, v8, a0
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 32 x half> %v, half %elt, i32 %idx
+  ret <vscale x 32 x half> %r
+}
+
+define <vscale x 1 x float> @insertelt_nxv1f32_0(<vscale x 1 x float> %v, float %elt) {
+; CHECK-LABEL: insertelt_nxv1f32_0:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e32,mf2,ta,mu
+; CHECK-NEXT: vfmv.s.f v16, fa0
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 1 x float> %v, float %elt, i32 0
+  ret <vscale x 1 x float> %r
+}
+
+define <vscale x 1 x float> @insertelt_nxv1f32_imm(<vscale x 1 x float> %v, float %elt) {
+; CHECK-LABEL: insertelt_nxv1f32_imm:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a0, zero, e32,mf2,tu,mu
+; CHECK-NEXT: vslidedown.vi v25, v16, 3
+; CHECK-NEXT: vsetvli a0, zero, e32,mf2,ta,mu
+; CHECK-NEXT: vfmv.s.f v25, fa0
+; CHECK-NEXT: vsetvli a0, zero, e32,mf2,tu,mu
+; CHECK-NEXT: vslideup.vi v16, v25, 3
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 1 x float> %v, float %elt, i32 3
+  ret <vscale x 1 x float> %r
+}
+
+define <vscale x 1 x float> @insertelt_nxv1f32_idx(<vscale x 1 x float> %v, float %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv1f32_idx:
+; CHECK: # %bb.0:
+; CHECK-NEXT: vsetvli a1, zero, e32,mf2,tu,mu
+; CHECK-NEXT: vslidedown.vx v25, v16, a0
+; CHECK-NEXT: vsetvli a1, zero, e32,mf2,ta,mu
+; CHECK-NEXT: vfmv.s.f v25, fa0
+; CHECK-NEXT: vsetvli a1, zero, e32,mf2,tu,mu
+; CHECK-NEXT: vslideup.vx v16, v25, a0
+; CHECK-NEXT: ret
+  %r = insertelement <vscale x 1 x float> %v,
float %elt, i32 %idx + ret %r +} + +define @insertelt_nxv2f32_0( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv2f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m1,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 0 + ret %r +} + +define @insertelt_nxv2f32_imm( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv2f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m1,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e32,m1,ta,mu +; CHECK-NEXT: vfmv.s.f v25, fa0 +; CHECK-NEXT: vsetvli a0, zero, e32,m1,tu,mu +; CHECK-NEXT: vslideup.vi v16, v25, 3 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 3 + ret %r +} + +define @insertelt_nxv2f32_idx( %v, float %elt, i32 %idx) { +; CHECK-LABEL: insertelt_nxv2f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,m1,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e32,m1,ta,mu +; CHECK-NEXT: vfmv.s.f v25, fa0 +; CHECK-NEXT: vsetvli a1, zero, e32,m1,tu,mu +; CHECK-NEXT: vslideup.vx v16, v25, a0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 %idx + ret %r +} + +define @insertelt_nxv4f32_0( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv4f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m2,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 0 + ret %r +} + +define @insertelt_nxv4f32_imm( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv4f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m2,tu,mu +; CHECK-NEXT: vslidedown.vi v26, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e32,m2,ta,mu +; CHECK-NEXT: vfmv.s.f v26, fa0 +; CHECK-NEXT: vsetvli a0, zero, e32,m2,tu,mu +; CHECK-NEXT: vslideup.vi v16, v26, 3 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 3 + ret %r +} + +define @insertelt_nxv4f32_idx( %v, float %elt, i32 %idx) { +; CHECK-LABEL: insertelt_nxv4f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,m2,tu,mu +; CHECK-NEXT: vslidedown.vx v26, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e32,m2,ta,mu +; CHECK-NEXT: vfmv.s.f v26, fa0 +; CHECK-NEXT: vsetvli a1, zero, e32,m2,tu,mu +; CHECK-NEXT: vslideup.vx v16, v26, a0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 %idx + ret %r +} + +define @insertelt_nxv8f32_0( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv8f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m4,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 0 + ret %r +} + +define @insertelt_nxv8f32_imm( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv8f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m4,tu,mu +; CHECK-NEXT: vslidedown.vi v28, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e32,m4,ta,mu +; CHECK-NEXT: vfmv.s.f v28, fa0 +; CHECK-NEXT: vsetvli a0, zero, e32,m4,tu,mu +; CHECK-NEXT: vslideup.vi v16, v28, 3 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 3 + ret %r +} + +define @insertelt_nxv8f32_idx( %v, float %elt, i32 %idx) { +; CHECK-LABEL: insertelt_nxv8f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,m4,tu,mu +; CHECK-NEXT: vslidedown.vx v28, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e32,m4,ta,mu +; CHECK-NEXT: vfmv.s.f v28, fa0 +; CHECK-NEXT: vsetvli a1, zero, e32,m4,tu,mu +; CHECK-NEXT: vslideup.vx v16, v28, a0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 %idx + ret %r +} + +define @insertelt_nxv16f32_0( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv16f32_0: 
+; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m8,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 0 + ret %r +} + +define @insertelt_nxv16f32_imm( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv16f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m8,tu,mu +; CHECK-NEXT: vslidedown.vi v8, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e32,m8,ta,mu +; CHECK-NEXT: vfmv.s.f v8, fa0 +; CHECK-NEXT: vsetvli a0, zero, e32,m8,tu,mu +; CHECK-NEXT: vslideup.vi v16, v8, 3 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 3 + ret %r +} + +define @insertelt_nxv16f32_idx( %v, float %elt, i32 %idx) { +; CHECK-LABEL: insertelt_nxv16f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,m8,tu,mu +; CHECK-NEXT: vslidedown.vx v8, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e32,m8,ta,mu +; CHECK-NEXT: vfmv.s.f v8, fa0 +; CHECK-NEXT: vsetvli a1, zero, e32,m8,tu,mu +; CHECK-NEXT: vslideup.vx v16, v8, a0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 %idx + ret %r +} + +define @insertelt_nxv1f64_0( %v, double %elt) { +; CHECK-LABEL: insertelt_nxv1f64_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m1,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, double %elt, i32 0 + ret %r +} + +define @insertelt_nxv1f64_imm( %v, double %elt) { +; CHECK-LABEL: insertelt_nxv1f64_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m1,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e64,m1,ta,mu +; CHECK-NEXT: vfmv.s.f v25, fa0 +; CHECK-NEXT: vsetvli a0, zero, e64,m1,tu,mu +; CHECK-NEXT: vslideup.vi v16, v25, 3 +; CHECK-NEXT: ret + %r = insertelement %v, double %elt, i32 3 + ret %r +} + +define @insertelt_nxv1f64_idx( %v, double %elt, i32 %idx) { +; CHECK-LABEL: insertelt_nxv1f64_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e64,m1,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e64,m1,ta,mu +; CHECK-NEXT: vfmv.s.f v25, fa0 +; CHECK-NEXT: vsetvli a1, zero, e64,m1,tu,mu +; CHECK-NEXT: vslideup.vx v16, v25, a0 +; CHECK-NEXT: ret + %r = insertelement %v, double %elt, i32 %idx + ret %r +} + +define @insertelt_nxv2f64_0( %v, double %elt) { +; CHECK-LABEL: insertelt_nxv2f64_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m2,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, double %elt, i32 0 + ret %r +} + +define @insertelt_nxv2f64_imm( %v, double %elt) { +; CHECK-LABEL: insertelt_nxv2f64_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m2,tu,mu +; CHECK-NEXT: vslidedown.vi v26, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e64,m2,ta,mu +; CHECK-NEXT: vfmv.s.f v26, fa0 +; CHECK-NEXT: vsetvli a0, zero, e64,m2,tu,mu +; CHECK-NEXT: vslideup.vi v16, v26, 3 +; CHECK-NEXT: ret + %r = insertelement %v, double %elt, i32 3 + ret %r +} + +define @insertelt_nxv2f64_idx( %v, double %elt, i32 %idx) { +; CHECK-LABEL: insertelt_nxv2f64_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e64,m2,tu,mu +; CHECK-NEXT: vslidedown.vx v26, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e64,m2,ta,mu +; CHECK-NEXT: vfmv.s.f v26, fa0 +; CHECK-NEXT: vsetvli a1, zero, e64,m2,tu,mu +; CHECK-NEXT: vslideup.vx v16, v26, a0 +; CHECK-NEXT: ret + %r = insertelement %v, double %elt, i32 %idx + ret %r +} + +define @insertelt_nxv4f64_0( %v, double %elt) { +; CHECK-LABEL: insertelt_nxv4f64_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m4,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; 
CHECK-NEXT: ret + %r = insertelement %v, double %elt, i32 0 + ret %r +} + +define @insertelt_nxv4f64_imm( %v, double %elt) { +; CHECK-LABEL: insertelt_nxv4f64_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m4,tu,mu +; CHECK-NEXT: vslidedown.vi v28, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e64,m4,ta,mu +; CHECK-NEXT: vfmv.s.f v28, fa0 +; CHECK-NEXT: vsetvli a0, zero, e64,m4,tu,mu +; CHECK-NEXT: vslideup.vi v16, v28, 3 +; CHECK-NEXT: ret + %r = insertelement %v, double %elt, i32 3 + ret %r +} + +define @insertelt_nxv4f64_idx( %v, double %elt, i32 %idx) { +; CHECK-LABEL: insertelt_nxv4f64_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e64,m4,tu,mu +; CHECK-NEXT: vslidedown.vx v28, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e64,m4,ta,mu +; CHECK-NEXT: vfmv.s.f v28, fa0 +; CHECK-NEXT: vsetvli a1, zero, e64,m4,tu,mu +; CHECK-NEXT: vslideup.vx v16, v28, a0 +; CHECK-NEXT: ret + %r = insertelement %v, double %elt, i32 %idx + ret %r +} + +define @insertelt_nxv8f64_0( %v, double %elt) { +; CHECK-LABEL: insertelt_nxv8f64_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m8,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, double %elt, i32 0 + ret %r +} + +define @insertelt_nxv8f64_imm( %v, double %elt) { +; CHECK-LABEL: insertelt_nxv8f64_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m8,tu,mu +; CHECK-NEXT: vslidedown.vi v8, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e64,m8,ta,mu +; CHECK-NEXT: vfmv.s.f v8, fa0 +; CHECK-NEXT: vsetvli a0, zero, e64,m8,tu,mu +; CHECK-NEXT: vslideup.vi v16, v8, 3 +; CHECK-NEXT: ret + %r = insertelement %v, double %elt, i32 3 + ret %r +} + +define @insertelt_nxv8f64_idx( %v, double %elt, i32 %idx) { +; CHECK-LABEL: insertelt_nxv8f64_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e64,m8,tu,mu +; CHECK-NEXT: vslidedown.vx v8, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e64,m8,ta,mu +; CHECK-NEXT: vfmv.s.f v8, fa0 +; CHECK-NEXT: vsetvli a1, zero, e64,m8,tu,mu +; CHECK-NEXT: vslideup.vx v16, v8, a0 +; CHECK-NEXT: ret + %r = insertelement %v, double %elt, i32 %idx + ret %r +} + diff --git a/llvm/test/CodeGen/RISCV/rvv/insertelt-fp-rv64.ll b/llvm/test/CodeGen/RISCV/rvv/insertelt-fp-rv64.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/RISCV/rvv/insertelt-fp-rv64.ll @@ -0,0 +1,592 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; RUN: llc -mtriple=riscv64 -mattr=+d,+experimental-zfh,+experimental-v -target-abi=lp64d \ +; RUN: -verify-machineinstrs < %s | FileCheck %s + +define @insertelt_nxv1f16_0( %v, half %elt) { +; CHECK-LABEL: insertelt_nxv1f16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a0, zero, e16,mf4,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 0 + ret %r +} + +define @insertelt_nxv1f16_imm( %v, half %elt) { +; CHECK-LABEL: insertelt_nxv1f16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a0, zero, e16,mf4,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e16,mf4,ta,mu +; CHECK-NEXT: vfmv.s.f v25, fa0 +; CHECK-NEXT: vsetvli a0, zero, e16,mf4,tu,mu +; CHECK-NEXT: vslideup.vi v16, v25, 3 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 3 + ret %r +} + +define @insertelt_nxv1f16_idx( %v, half %elt, i32 signext %idx) { +; CHECK-LABEL: insertelt_nxv1f16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; 
CHECK-NEXT: vsetvli a1, zero, e16,mf4,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e16,mf4,ta,mu +; CHECK-NEXT: vfmv.s.f v25, fa0 +; CHECK-NEXT: vsetvli a1, zero, e16,mf4,tu,mu +; CHECK-NEXT: vslideup.vx v16, v25, a0 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 %idx + ret %r +} + +define @insertelt_nxv2f16_0( %v, half %elt) { +; CHECK-LABEL: insertelt_nxv2f16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a0, zero, e16,mf2,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 0 + ret %r +} + +define @insertelt_nxv2f16_imm( %v, half %elt) { +; CHECK-LABEL: insertelt_nxv2f16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a0, zero, e16,mf2,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e16,mf2,ta,mu +; CHECK-NEXT: vfmv.s.f v25, fa0 +; CHECK-NEXT: vsetvli a0, zero, e16,mf2,tu,mu +; CHECK-NEXT: vslideup.vi v16, v25, 3 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 3 + ret %r +} + +define @insertelt_nxv2f16_idx( %v, half %elt, i32 signext %idx) { +; CHECK-LABEL: insertelt_nxv2f16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a1, zero, e16,mf2,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e16,mf2,ta,mu +; CHECK-NEXT: vfmv.s.f v25, fa0 +; CHECK-NEXT: vsetvli a1, zero, e16,mf2,tu,mu +; CHECK-NEXT: vslideup.vx v16, v25, a0 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 %idx + ret %r +} + +define @insertelt_nxv4f16_0( %v, half %elt) { +; CHECK-LABEL: insertelt_nxv4f16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a0, zero, e16,m1,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 0 + ret %r +} + +define @insertelt_nxv4f16_imm( %v, half %elt) { +; CHECK-LABEL: insertelt_nxv4f16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a0, zero, e16,m1,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e16,m1,ta,mu +; CHECK-NEXT: vfmv.s.f v25, fa0 +; CHECK-NEXT: vsetvli a0, zero, e16,m1,tu,mu +; CHECK-NEXT: vslideup.vi v16, v25, 3 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 3 + ret %r +} + +define @insertelt_nxv4f16_idx( %v, half %elt, i32 signext %idx) { +; CHECK-LABEL: insertelt_nxv4f16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a1, zero, e16,m1,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e16,m1,ta,mu +; CHECK-NEXT: vfmv.s.f v25, fa0 +; CHECK-NEXT: vsetvli a1, zero, e16,m1,tu,mu +; CHECK-NEXT: vslideup.vx v16, v25, a0 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 %idx + ret %r +} + +define @insertelt_nxv8f16_0( %v, half %elt) { +; CHECK-LABEL: insertelt_nxv8f16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a0, zero, e16,m2,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 0 + ret %r +} + +define @insertelt_nxv8f16_imm( %v, half %elt) { +; CHECK-LABEL: insertelt_nxv8f16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a0, zero, e16,m2,tu,mu +; CHECK-NEXT: vslidedown.vi v26, v16, 3 
+; CHECK-NEXT: vsetvli a0, zero, e16,m2,ta,mu +; CHECK-NEXT: vfmv.s.f v26, fa0 +; CHECK-NEXT: vsetvli a0, zero, e16,m2,tu,mu +; CHECK-NEXT: vslideup.vi v16, v26, 3 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 3 + ret %r +} + +define @insertelt_nxv8f16_idx( %v, half %elt, i32 signext %idx) { +; CHECK-LABEL: insertelt_nxv8f16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a1, zero, e16,m2,tu,mu +; CHECK-NEXT: vslidedown.vx v26, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e16,m2,ta,mu +; CHECK-NEXT: vfmv.s.f v26, fa0 +; CHECK-NEXT: vsetvli a1, zero, e16,m2,tu,mu +; CHECK-NEXT: vslideup.vx v16, v26, a0 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 %idx + ret %r +} + +define @insertelt_nxv16f16_0( %v, half %elt) { +; CHECK-LABEL: insertelt_nxv16f16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a0, zero, e16,m4,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 0 + ret %r +} + +define @insertelt_nxv16f16_imm( %v, half %elt) { +; CHECK-LABEL: insertelt_nxv16f16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a0, zero, e16,m4,tu,mu +; CHECK-NEXT: vslidedown.vi v28, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e16,m4,ta,mu +; CHECK-NEXT: vfmv.s.f v28, fa0 +; CHECK-NEXT: vsetvli a0, zero, e16,m4,tu,mu +; CHECK-NEXT: vslideup.vi v16, v28, 3 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 3 + ret %r +} + +define @insertelt_nxv16f16_idx( %v, half %elt, i32 signext %idx) { +; CHECK-LABEL: insertelt_nxv16f16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a1, zero, e16,m4,tu,mu +; CHECK-NEXT: vslidedown.vx v28, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e16,m4,ta,mu +; CHECK-NEXT: vfmv.s.f v28, fa0 +; CHECK-NEXT: vsetvli a1, zero, e16,m4,tu,mu +; CHECK-NEXT: vslideup.vx v16, v28, a0 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 %idx + ret %r +} + +define @insertelt_nxv32f16_0( %v, half %elt) { +; CHECK-LABEL: insertelt_nxv32f16_0: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a0, zero, e16,m8,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 0 + ret %r +} + +define @insertelt_nxv32f16_imm( %v, half %elt) { +; CHECK-LABEL: insertelt_nxv32f16_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a0, zero, e16,m8,tu,mu +; CHECK-NEXT: vslidedown.vi v8, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e16,m8,ta,mu +; CHECK-NEXT: vfmv.s.f v8, fa0 +; CHECK-NEXT: vsetvli a0, zero, e16,m8,tu,mu +; CHECK-NEXT: vslideup.vi v16, v8, 3 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 3 + ret %r +} + +define @insertelt_nxv32f16_idx( %v, half %elt, i32 signext %idx) { +; CHECK-LABEL: insertelt_nxv32f16_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: # kill: def $f10_h killed $f10_h def $f10_f +; CHECK-NEXT: vsetvli a1, zero, e16,m8,tu,mu +; CHECK-NEXT: vslidedown.vx v8, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e16,m8,ta,mu +; CHECK-NEXT: vfmv.s.f v8, fa0 +; CHECK-NEXT: vsetvli a1, zero, e16,m8,tu,mu +; CHECK-NEXT: vslideup.vx v16, v8, a0 +; CHECK-NEXT: ret + %r = insertelement %v, half %elt, i32 %idx + ret %r +} + +define @insertelt_nxv1f32_0( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv1f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, 
e32,mf2,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 0 + ret %r +} + +define @insertelt_nxv1f32_imm( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv1f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,mf2,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e32,mf2,ta,mu +; CHECK-NEXT: vfmv.s.f v25, fa0 +; CHECK-NEXT: vsetvli a0, zero, e32,mf2,tu,mu +; CHECK-NEXT: vslideup.vi v16, v25, 3 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 3 + ret %r +} + +define @insertelt_nxv1f32_idx( %v, float %elt, i32 signext %idx) { +; CHECK-LABEL: insertelt_nxv1f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,mf2,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e32,mf2,ta,mu +; CHECK-NEXT: vfmv.s.f v25, fa0 +; CHECK-NEXT: vsetvli a1, zero, e32,mf2,tu,mu +; CHECK-NEXT: vslideup.vx v16, v25, a0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 %idx + ret %r +} + +define @insertelt_nxv2f32_0( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv2f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m1,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 0 + ret %r +} + +define @insertelt_nxv2f32_imm( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv2f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m1,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e32,m1,ta,mu +; CHECK-NEXT: vfmv.s.f v25, fa0 +; CHECK-NEXT: vsetvli a0, zero, e32,m1,tu,mu +; CHECK-NEXT: vslideup.vi v16, v25, 3 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 3 + ret %r +} + +define @insertelt_nxv2f32_idx( %v, float %elt, i32 signext %idx) { +; CHECK-LABEL: insertelt_nxv2f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,m1,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e32,m1,ta,mu +; CHECK-NEXT: vfmv.s.f v25, fa0 +; CHECK-NEXT: vsetvli a1, zero, e32,m1,tu,mu +; CHECK-NEXT: vslideup.vx v16, v25, a0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 %idx + ret %r +} + +define @insertelt_nxv4f32_0( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv4f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m2,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 0 + ret %r +} + +define @insertelt_nxv4f32_imm( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv4f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m2,tu,mu +; CHECK-NEXT: vslidedown.vi v26, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e32,m2,ta,mu +; CHECK-NEXT: vfmv.s.f v26, fa0 +; CHECK-NEXT: vsetvli a0, zero, e32,m2,tu,mu +; CHECK-NEXT: vslideup.vi v16, v26, 3 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 3 + ret %r +} + +define @insertelt_nxv4f32_idx( %v, float %elt, i32 signext %idx) { +; CHECK-LABEL: insertelt_nxv4f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,m2,tu,mu +; CHECK-NEXT: vslidedown.vx v26, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e32,m2,ta,mu +; CHECK-NEXT: vfmv.s.f v26, fa0 +; CHECK-NEXT: vsetvli a1, zero, e32,m2,tu,mu +; CHECK-NEXT: vslideup.vx v16, v26, a0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 %idx + ret %r +} + +define @insertelt_nxv8f32_0( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv8f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m4,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, 
float %elt, i32 0 + ret %r +} + +define @insertelt_nxv8f32_imm( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv8f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m4,tu,mu +; CHECK-NEXT: vslidedown.vi v28, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e32,m4,ta,mu +; CHECK-NEXT: vfmv.s.f v28, fa0 +; CHECK-NEXT: vsetvli a0, zero, e32,m4,tu,mu +; CHECK-NEXT: vslideup.vi v16, v28, 3 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 3 + ret %r +} + +define @insertelt_nxv8f32_idx( %v, float %elt, i32 signext %idx) { +; CHECK-LABEL: insertelt_nxv8f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,m4,tu,mu +; CHECK-NEXT: vslidedown.vx v28, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e32,m4,ta,mu +; CHECK-NEXT: vfmv.s.f v28, fa0 +; CHECK-NEXT: vsetvli a1, zero, e32,m4,tu,mu +; CHECK-NEXT: vslideup.vx v16, v28, a0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 %idx + ret %r +} + +define @insertelt_nxv16f32_0( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv16f32_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m8,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 0 + ret %r +} + +define @insertelt_nxv16f32_imm( %v, float %elt) { +; CHECK-LABEL: insertelt_nxv16f32_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e32,m8,tu,mu +; CHECK-NEXT: vslidedown.vi v8, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e32,m8,ta,mu +; CHECK-NEXT: vfmv.s.f v8, fa0 +; CHECK-NEXT: vsetvli a0, zero, e32,m8,tu,mu +; CHECK-NEXT: vslideup.vi v16, v8, 3 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 3 + ret %r +} + +define @insertelt_nxv16f32_idx( %v, float %elt, i32 signext %idx) { +; CHECK-LABEL: insertelt_nxv16f32_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e32,m8,tu,mu +; CHECK-NEXT: vslidedown.vx v8, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e32,m8,ta,mu +; CHECK-NEXT: vfmv.s.f v8, fa0 +; CHECK-NEXT: vsetvli a1, zero, e32,m8,tu,mu +; CHECK-NEXT: vslideup.vx v16, v8, a0 +; CHECK-NEXT: ret + %r = insertelement %v, float %elt, i32 %idx + ret %r +} + +define @insertelt_nxv1f64_0( %v, double %elt) { +; CHECK-LABEL: insertelt_nxv1f64_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m1,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, double %elt, i32 0 + ret %r +} + +define @insertelt_nxv1f64_imm( %v, double %elt) { +; CHECK-LABEL: insertelt_nxv1f64_imm: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m1,tu,mu +; CHECK-NEXT: vslidedown.vi v25, v16, 3 +; CHECK-NEXT: vsetvli a0, zero, e64,m1,ta,mu +; CHECK-NEXT: vfmv.s.f v25, fa0 +; CHECK-NEXT: vsetvli a0, zero, e64,m1,tu,mu +; CHECK-NEXT: vslideup.vi v16, v25, 3 +; CHECK-NEXT: ret + %r = insertelement %v, double %elt, i32 3 + ret %r +} + +define @insertelt_nxv1f64_idx( %v, double %elt, i32 signext %idx) { +; CHECK-LABEL: insertelt_nxv1f64_idx: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a1, zero, e64,m1,tu,mu +; CHECK-NEXT: vslidedown.vx v25, v16, a0 +; CHECK-NEXT: vsetvli a1, zero, e64,m1,ta,mu +; CHECK-NEXT: vfmv.s.f v25, fa0 +; CHECK-NEXT: vsetvli a1, zero, e64,m1,tu,mu +; CHECK-NEXT: vslideup.vx v16, v25, a0 +; CHECK-NEXT: ret + %r = insertelement %v, double %elt, i32 %idx + ret %r +} + +define @insertelt_nxv2f64_0( %v, double %elt) { +; CHECK-LABEL: insertelt_nxv2f64_0: +; CHECK: # %bb.0: +; CHECK-NEXT: vsetvli a0, zero, e64,m2,ta,mu +; CHECK-NEXT: vfmv.s.f v16, fa0 +; CHECK-NEXT: ret + %r = insertelement %v, double %elt, i32 0 + ret %r +} + +define @insertelt_nxv2f64_imm( %v, double %elt) { +; 
+; CHECK-LABEL: insertelt_nxv2f64_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a0, zero, e64,m2,tu,mu
+; CHECK-NEXT:    vslidedown.vi v26, v16, 3
+; CHECK-NEXT:    vsetvli a0, zero, e64,m2,ta,mu
+; CHECK-NEXT:    vfmv.s.f v26, fa0
+; CHECK-NEXT:    vsetvli a0, zero, e64,m2,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v26, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x double> %v, double %elt, i32 3
+  ret <vscale x 2 x double> %r
+}
+
+define <vscale x 2 x double> @insertelt_nxv2f64_idx(<vscale x 2 x double> %v, double %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv2f64_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e64,m2,tu,mu
+; CHECK-NEXT:    vslidedown.vx v26, v16, a0
+; CHECK-NEXT:    vsetvli a1, zero, e64,m2,ta,mu
+; CHECK-NEXT:    vfmv.s.f v26, fa0
+; CHECK-NEXT:    vsetvli a1, zero, e64,m2,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v26, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x double> %v, double %elt, i32 %idx
+  ret <vscale x 2 x double> %r
+}
+
+define <vscale x 4 x double> @insertelt_nxv4f64_0(<vscale x 4 x double> %v, double %elt) {
+; CHECK-LABEL: insertelt_nxv4f64_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a0, zero, e64,m4,ta,mu
+; CHECK-NEXT:    vfmv.s.f v16, fa0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x double> %v, double %elt, i32 0
+  ret <vscale x 4 x double> %r
+}
+
+define <vscale x 4 x double> @insertelt_nxv4f64_imm(<vscale x 4 x double> %v, double %elt) {
+; CHECK-LABEL: insertelt_nxv4f64_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a0, zero, e64,m4,tu,mu
+; CHECK-NEXT:    vslidedown.vi v28, v16, 3
+; CHECK-NEXT:    vsetvli a0, zero, e64,m4,ta,mu
+; CHECK-NEXT:    vfmv.s.f v28, fa0
+; CHECK-NEXT:    vsetvli a0, zero, e64,m4,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v28, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x double> %v, double %elt, i32 3
+  ret <vscale x 4 x double> %r
+}
+
+define <vscale x 4 x double> @insertelt_nxv4f64_idx(<vscale x 4 x double> %v, double %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv4f64_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e64,m4,tu,mu
+; CHECK-NEXT:    vslidedown.vx v28, v16, a0
+; CHECK-NEXT:    vsetvli a1, zero, e64,m4,ta,mu
+; CHECK-NEXT:    vfmv.s.f v28, fa0
+; CHECK-NEXT:    vsetvli a1, zero, e64,m4,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v28, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x double> %v, double %elt, i32 %idx
+  ret <vscale x 4 x double> %r
+}
+
+define <vscale x 8 x double> @insertelt_nxv8f64_0(<vscale x 8 x double> %v, double %elt) {
+; CHECK-LABEL: insertelt_nxv8f64_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a0, zero, e64,m8,ta,mu
+; CHECK-NEXT:    vfmv.s.f v16, fa0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x double> %v, double %elt, i32 0
+  ret <vscale x 8 x double> %r
+}
+
+define <vscale x 8 x double> @insertelt_nxv8f64_imm(<vscale x 8 x double> %v, double %elt) {
+; CHECK-LABEL: insertelt_nxv8f64_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a0, zero, e64,m8,tu,mu
+; CHECK-NEXT:    vslidedown.vi v8, v16, 3
+; CHECK-NEXT:    vsetvli a0, zero, e64,m8,ta,mu
+; CHECK-NEXT:    vfmv.s.f v8, fa0
+; CHECK-NEXT:    vsetvli a0, zero, e64,m8,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v8, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x double> %v, double %elt, i32 3
+  ret <vscale x 8 x double> %r
+}
+
+define <vscale x 8 x double> @insertelt_nxv8f64_idx(<vscale x 8 x double> %v, double %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv8f64_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e64,m8,tu,mu
+; CHECK-NEXT:    vslidedown.vx v8, v16, a0
+; CHECK-NEXT:    vsetvli a1, zero, e64,m8,ta,mu
+; CHECK-NEXT:    vfmv.s.f v8, fa0
+; CHECK-NEXT:    vsetvli a1, zero, e64,m8,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v8, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x double> %v, double %elt, i32 %idx
+  ret <vscale x 8 x double> %r
+}
+
diff --git a/llvm/test/CodeGen/RISCV/rvv/insertelt-int-rv32.ll b/llvm/test/CodeGen/RISCV/rvv/insertelt-int-rv32.ll
new file mode 100644
--- /dev/null
+++ b/llvm/test/CodeGen/RISCV/rvv/insertelt-int-rv32.ll
@@ -0,0 +1,988 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc -mtriple=riscv32 -mattr=+d,+experimental-zfh,+experimental-v -target-abi=ilp32d \
+; RUN:     -verify-machineinstrs < %s | FileCheck %s
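+
+; Note: for elements that fit in XLEN, an insert at a non-zero index is
+; expected to lower as a vslidedown of the target element to index 0, a
+; vmv.s.x of the new scalar, and a vslideup back into place, as checked below.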
+
+define <vscale x 1 x i8> @insertelt_nxv1i8_0(<vscale x 1 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv1i8_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf8,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i8> %v, i8 %elt, i32 0
+  ret <vscale x 1 x i8> %r
+}
+
+define <vscale x 1 x i8> @insertelt_nxv1i8_imm(<vscale x 1 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv1i8_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf8,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf8,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,mf8,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i8> %v, i8 %elt, i32 3
+  ret <vscale x 1 x i8> %r
+}
+
+define <vscale x 1 x i8> @insertelt_nxv1i8_idx(<vscale x 1 x i8> %v, i8 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv1i8_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e8,mf8,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e8,mf8,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,mf8,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i8> %v, i8 %elt, i32 %idx
+  ret <vscale x 1 x i8> %r
+}
+
+define <vscale x 2 x i8> @insertelt_nxv2i8_0(<vscale x 2 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv2i8_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf4,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i8> %v, i8 %elt, i32 0
+  ret <vscale x 2 x i8> %r
+}
+
+define <vscale x 2 x i8> @insertelt_nxv2i8_imm(<vscale x 2 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv2i8_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf4,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf4,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,mf4,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i8> %v, i8 %elt, i32 3
+  ret <vscale x 2 x i8> %r
+}
+
+define <vscale x 2 x i8> @insertelt_nxv2i8_idx(<vscale x 2 x i8> %v, i8 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv2i8_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e8,mf4,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e8,mf4,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,mf4,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i8> %v, i8 %elt, i32 %idx
+  ret <vscale x 2 x i8> %r
+}
+
+define <vscale x 4 x i8> @insertelt_nxv4i8_0(<vscale x 4 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv4i8_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i8> %v, i8 %elt, i32 0
+  ret <vscale x 4 x i8> %r
+}
+
+define <vscale x 4 x i8> @insertelt_nxv4i8_imm(<vscale x 4 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv4i8_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf2,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,mf2,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i8> %v, i8 %elt, i32 3
+  ret <vscale x 4 x i8> %r
+}
+
+define <vscale x 4 x i8> @insertelt_nxv4i8_idx(<vscale x 4 x i8> %v, i8 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv4i8_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e8,mf2,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e8,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,mf2,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i8> %v, i8 %elt, i32 %idx
+  ret <vscale x 4 x i8> %r
+}
+
+define <vscale x 8 x i8> @insertelt_nxv8i8_0(<vscale x 8 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv8i8_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i8> %v, i8 %elt, i32 0
+  ret <vscale x 8 x i8> %r
+}
+
+define <vscale x 8 x i8> @insertelt_nxv8i8_imm(<vscale x 8 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv8i8_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,m1,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e8,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,m1,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i8> %v, i8 %elt, i32 3
+  ret <vscale x 8 x i8> %r
+}
+
+define <vscale x 8 x i8> @insertelt_nxv8i8_idx(<vscale x 8 x i8> %v, i8 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv8i8_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e8,m1,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e8,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,m1,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i8> %v, i8 %elt, i32 %idx
+  ret <vscale x 8 x i8> %r
+}
+
+define <vscale x 16 x i8> @insertelt_nxv16i8_0(<vscale x 16 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv16i8_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i8> %v, i8 %elt, i32 0
+  ret <vscale x 16 x i8> %r
+}
+
+define <vscale x 16 x i8> @insertelt_nxv16i8_imm(<vscale x 16 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv16i8_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,m2,tu,mu
+; CHECK-NEXT:    vslidedown.vi v26, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e8,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v26, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,m2,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v26, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i8> %v, i8 %elt, i32 3
+  ret <vscale x 16 x i8> %r
+}
+
+define <vscale x 16 x i8> @insertelt_nxv16i8_idx(<vscale x 16 x i8> %v, i8 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv16i8_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e8,m2,tu,mu
+; CHECK-NEXT:    vslidedown.vx v26, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e8,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v26, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,m2,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v26, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i8> %v, i8 %elt, i32 %idx
+  ret <vscale x 16 x i8> %r
+}
+
+define <vscale x 32 x i8> @insertelt_nxv32i8_0(<vscale x 32 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv32i8_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 32 x i8> %v, i8 %elt, i32 0
+  ret <vscale x 32 x i8> %r
+}
+
+define <vscale x 32 x i8> @insertelt_nxv32i8_imm(<vscale x 32 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv32i8_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,m4,tu,mu
+; CHECK-NEXT:    vslidedown.vi v28, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e8,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v28, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,m4,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v28, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 32 x i8> %v, i8 %elt, i32 3
+  ret <vscale x 32 x i8> %r
+}
+
+define <vscale x 32 x i8> @insertelt_nxv32i8_idx(<vscale x 32 x i8> %v, i8 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv32i8_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e8,m4,tu,mu
+; CHECK-NEXT:    vslidedown.vx v28, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e8,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v28, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,m4,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v28, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 32 x i8> %v, i8 %elt, i32 %idx
+  ret <vscale x 32 x i8> %r
+}
+
+define <vscale x 64 x i8> @insertelt_nxv64i8_0(<vscale x 64 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv64i8_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 64 x i8> %v, i8 %elt, i32 0
+  ret <vscale x 64 x i8> %r
+}
+
+define <vscale x 64 x i8> @insertelt_nxv64i8_imm(<vscale x 64 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv64i8_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,m8,tu,mu
+; CHECK-NEXT:    vslidedown.vi v8, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e8,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v8, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,m8,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v8, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 64 x i8> %v, i8 %elt, i32 3
+  ret <vscale x 64 x i8> %r
+}
+
+define <vscale x 64 x i8> @insertelt_nxv64i8_idx(<vscale x 64 x i8> %v, i8 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv64i8_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e8,m8,tu,mu
+; CHECK-NEXT:    vslidedown.vx v8, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e8,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v8, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,m8,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v8, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 64 x i8> %v, i8 %elt, i32 %idx
+  ret <vscale x 64 x i8> %r
+}
+
+define <vscale x 1 x i16> @insertelt_nxv1i16_0(<vscale x 1 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv1i16_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,mf4,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i16> %v, i16 %elt, i32 0
+  ret <vscale x 1 x i16> %r
+}
+
+define <vscale x 1 x i16> @insertelt_nxv1i16_imm(<vscale x 1 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv1i16_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,mf4,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e16,mf4,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,mf4,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i16> %v, i16 %elt, i32 3
+  ret <vscale x 1 x i16> %r
+}
+
+define <vscale x 1 x i16> @insertelt_nxv1i16_idx(<vscale x 1 x i16> %v, i16 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv1i16_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e16,mf4,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e16,mf4,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,mf4,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i16> %v, i16 %elt, i32 %idx
+  ret <vscale x 1 x i16> %r
+}
+
+define <vscale x 2 x i16> @insertelt_nxv2i16_0(<vscale x 2 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv2i16_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i16> %v, i16 %elt, i32 0
+  ret <vscale x 2 x i16> %r
+}
+
+define <vscale x 2 x i16> @insertelt_nxv2i16_imm(<vscale x 2 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv2i16_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,mf2,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e16,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,mf2,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i16> %v, i16 %elt, i32 3
+  ret <vscale x 2 x i16> %r
+}
+
+define <vscale x 2 x i16> @insertelt_nxv2i16_idx(<vscale x 2 x i16> %v, i16 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv2i16_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e16,mf2,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e16,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,mf2,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i16> %v, i16 %elt, i32 %idx
+  ret <vscale x 2 x i16> %r
+}
+
+define <vscale x 4 x i16> @insertelt_nxv4i16_0(<vscale x 4 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv4i16_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i16> %v, i16 %elt, i32 0
+  ret <vscale x 4 x i16> %r
+}
+
+define <vscale x 4 x i16> @insertelt_nxv4i16_imm(<vscale x 4 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv4i16_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,m1,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e16,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,m1,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i16> %v, i16 %elt, i32 3
+  ret <vscale x 4 x i16> %r
+}
+
+define <vscale x 4 x i16> @insertelt_nxv4i16_idx(<vscale x 4 x i16> %v, i16 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv4i16_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e16,m1,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e16,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,m1,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i16> %v, i16 %elt, i32 %idx
+  ret <vscale x 4 x i16> %r
+}
+
+define <vscale x 8 x i16> @insertelt_nxv8i16_0(<vscale x 8 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv8i16_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i16> %v, i16 %elt, i32 0
+  ret <vscale x 8 x i16> %r
+}
+
+define <vscale x 8 x i16> @insertelt_nxv8i16_imm(<vscale x 8 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv8i16_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,m2,tu,mu
+; CHECK-NEXT:    vslidedown.vi v26, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e16,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v26, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,m2,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v26, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i16> %v, i16 %elt, i32 3
+  ret <vscale x 8 x i16> %r
+}
+
+define <vscale x 8 x i16> @insertelt_nxv8i16_idx(<vscale x 8 x i16> %v, i16 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv8i16_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e16,m2,tu,mu
+; CHECK-NEXT:    vslidedown.vx v26, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e16,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v26, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,m2,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v26, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i16> %v, i16 %elt, i32 %idx
+  ret <vscale x 8 x i16> %r
+}
+
+define <vscale x 16 x i16> @insertelt_nxv16i16_0(<vscale x 16 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv16i16_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i16> %v, i16 %elt, i32 0
+  ret <vscale x 16 x i16> %r
+}
+
+define <vscale x 16 x i16> @insertelt_nxv16i16_imm(<vscale x 16 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv16i16_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,m4,tu,mu
+; CHECK-NEXT:    vslidedown.vi v28, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e16,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v28, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,m4,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v28, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i16> %v, i16 %elt, i32 3
+  ret <vscale x 16 x i16> %r
+}
+
+define <vscale x 16 x i16> @insertelt_nxv16i16_idx(<vscale x 16 x i16> %v, i16 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv16i16_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e16,m4,tu,mu
+; CHECK-NEXT:    vslidedown.vx v28, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e16,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v28, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,m4,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v28, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i16> %v, i16 %elt, i32 %idx
+  ret <vscale x 16 x i16> %r
+}
+
+define <vscale x 32 x i16> @insertelt_nxv32i16_0(<vscale x 32 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv32i16_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 32 x i16> %v, i16 %elt, i32 0
+  ret <vscale x 32 x i16> %r
+}
+
+define <vscale x 32 x i16> @insertelt_nxv32i16_imm(<vscale x 32 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv32i16_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,m8,tu,mu
+; CHECK-NEXT:    vslidedown.vi v8, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e16,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v8, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,m8,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v8, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 32 x i16> %v, i16 %elt, i32 3
+  ret <vscale x 32 x i16> %r
+}
+
+define <vscale x 32 x i16> @insertelt_nxv32i16_idx(<vscale x 32 x i16> %v, i16 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv32i16_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e16,m8,tu,mu
+; CHECK-NEXT:    vslidedown.vx v8, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e16,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v8, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,m8,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v8, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 32 x i16> %v, i16 %elt, i32 %idx
+  ret <vscale x 32 x i16> %r
+}
+
+define <vscale x 1 x i32> @insertelt_nxv1i32_0(<vscale x 1 x i32> %v, i32 %elt) {
+; CHECK-LABEL: insertelt_nxv1i32_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i32> %v, i32 %elt, i32 0
+  ret <vscale x 1 x i32> %r
+}
+
+define <vscale x 1 x i32> @insertelt_nxv1i32_imm(<vscale x 1 x i32> %v, i32 %elt) {
+; CHECK-LABEL: insertelt_nxv1i32_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,mf2,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e32,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,mf2,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i32> %v, i32 %elt, i32 3
+  ret <vscale x 1 x i32> %r
+}
+
+define <vscale x 1 x i32> @insertelt_nxv1i32_idx(<vscale x 1 x i32> %v, i32 %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv1i32_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e32,mf2,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e32,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,mf2,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i32> %v, i32 %elt, i32 %idx
+  ret <vscale x 1 x i32> %r
+}
+
+define <vscale x 2 x i32> @insertelt_nxv2i32_0(<vscale x 2 x i32> %v, i32 %elt) {
+; CHECK-LABEL: insertelt_nxv2i32_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i32> %v, i32 %elt, i32 0
+  ret <vscale x 2 x i32> %r
+}
+
+define <vscale x 2 x i32> @insertelt_nxv2i32_imm(<vscale x 2 x i32> %v, i32 %elt) {
+; CHECK-LABEL: insertelt_nxv2i32_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,m1,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e32,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,m1,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i32> %v, i32 %elt, i32 3
+  ret <vscale x 2 x i32> %r
+}
+
+define <vscale x 2 x i32> @insertelt_nxv2i32_idx(<vscale x 2 x i32> %v, i32 %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv2i32_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e32,m1,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e32,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,m1,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i32> %v, i32 %elt, i32 %idx
+  ret <vscale x 2 x i32> %r
+}
+
+define <vscale x 4 x i32> @insertelt_nxv4i32_0(<vscale x 4 x i32> %v, i32 %elt) {
+; CHECK-LABEL: insertelt_nxv4i32_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i32> %v, i32 %elt, i32 0
+  ret <vscale x 4 x i32> %r
+}
+
+define <vscale x 4 x i32> @insertelt_nxv4i32_imm(<vscale x 4 x i32> %v, i32 %elt) {
+; CHECK-LABEL: insertelt_nxv4i32_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,m2,tu,mu
+; CHECK-NEXT:    vslidedown.vi v26, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e32,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v26, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,m2,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v26, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i32> %v, i32 %elt, i32 3
+  ret <vscale x 4 x i32> %r
+}
+
+define <vscale x 4 x i32> @insertelt_nxv4i32_idx(<vscale x 4 x i32> %v, i32 %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv4i32_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e32,m2,tu,mu
+; CHECK-NEXT:    vslidedown.vx v26, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e32,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v26, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,m2,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v26, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i32> %v, i32 %elt, i32 %idx
+  ret <vscale x 4 x i32> %r
+}
+
+define <vscale x 8 x i32> @insertelt_nxv8i32_0(<vscale x 8 x i32> %v, i32 %elt) {
+; CHECK-LABEL: insertelt_nxv8i32_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i32> %v, i32 %elt, i32 0
+  ret <vscale x 8 x i32> %r
+}
+
+define <vscale x 8 x i32> @insertelt_nxv8i32_imm(<vscale x 8 x i32> %v, i32 %elt) {
+; CHECK-LABEL: insertelt_nxv8i32_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,m4,tu,mu
+; CHECK-NEXT:    vslidedown.vi v28, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e32,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v28, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,m4,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v28, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i32> %v, i32 %elt, i32 3
+  ret <vscale x 8 x i32> %r
+}
+
+define <vscale x 8 x i32> @insertelt_nxv8i32_idx(<vscale x 8 x i32> %v, i32 %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv8i32_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e32,m4,tu,mu
+; CHECK-NEXT:    vslidedown.vx v28, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e32,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v28, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,m4,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v28, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i32> %v, i32 %elt, i32 %idx
+  ret <vscale x 8 x i32> %r
+}
+
+define <vscale x 16 x i32> @insertelt_nxv16i32_0(<vscale x 16 x i32> %v, i32 %elt) {
+; CHECK-LABEL: insertelt_nxv16i32_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i32> %v, i32 %elt, i32 0
+  ret <vscale x 16 x i32> %r
+}
+
+define <vscale x 16 x i32> @insertelt_nxv16i32_imm(<vscale x 16 x i32> %v, i32 %elt) {
+; CHECK-LABEL: insertelt_nxv16i32_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,m8,tu,mu
+; CHECK-NEXT:    vslidedown.vi v8, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e32,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v8, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,m8,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v8, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i32> %v, i32 %elt, i32 3
+  ret <vscale x 16 x i32> %r
+}
+
+define <vscale x 16 x i32> @insertelt_nxv16i32_idx(<vscale x 16 x i32> %v, i32 %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv16i32_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e32,m8,tu,mu
+; CHECK-NEXT:    vslidedown.vx v8, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e32,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v8, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,m8,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v8, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i32> %v, i32 %elt, i32 %idx
+  ret <vscale x 16 x i32> %r
+}
+
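+; i64-element inserts on RV32 cannot use vmv.s.x since i64 is not a legal
+; scalar type there; the element is instead assembled from its two 32-bit
+; halves (vmv.v.x/vsll/vsrl/vor) and merged in under a vid/vmseq mask.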
+define <vscale x 1 x i64> @insertelt_nxv1i64_0(<vscale x 1 x i64> %v, i64 %elt) {
+; CHECK-LABEL: insertelt_nxv1i64_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e64,m1,ta,mu
+; CHECK-NEXT:    vmv.v.x v25, a1
+; CHECK-NEXT:    addi a1, zero, 32
+; CHECK-NEXT:    vsll.vx v25, v25, a1
+; CHECK-NEXT:    vmv.v.x v26, a0
+; CHECK-NEXT:    vsll.vx v26, v26, a1
+; CHECK-NEXT:    vsrl.vx v26, v26, a1
+; CHECK-NEXT:    vor.vv v25, v26, v25
+; CHECK-NEXT:    vid.v v26
+; CHECK-NEXT:    vmseq.vi v0, v26, 0
+; CHECK-NEXT:    vmerge.vvm v16, v16, v25, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i64> %v, i64 %elt, i32 0
+  ret <vscale x 1 x i64> %r
+}
+
+define <vscale x 1 x i64> @insertelt_nxv1i64_imm(<vscale x 1 x i64> %v, i64 %elt) {
+; CHECK-LABEL: insertelt_nxv1i64_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e64,m1,ta,mu
+; CHECK-NEXT:    vmv.v.x v25, a1
+; CHECK-NEXT:    addi a1, zero, 32
+; CHECK-NEXT:    vsll.vx v25, v25, a1
+; CHECK-NEXT:    vmv.v.x v26, a0
+; CHECK-NEXT:    vsll.vx v26, v26, a1
+; CHECK-NEXT:    vsrl.vx v26, v26, a1
+; CHECK-NEXT:    vor.vv v25, v26, v25
+; CHECK-NEXT:    vid.v v26
+; CHECK-NEXT:    vmseq.vi v0, v26, 3
+; CHECK-NEXT:    vmerge.vvm v16, v16, v25, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i64> %v, i64 %elt, i32 3
+  ret <vscale x 1 x i64> %r
+}
+
+define <vscale x 1 x i64> @insertelt_nxv1i64_idx(<vscale x 1 x i64> %v, i64 %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv1i64_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a3, zero, e64,m1,ta,mu
+; CHECK-NEXT:    vmv.v.x v25, a1
+; CHECK-NEXT:    addi a1, zero, 32
+; CHECK-NEXT:    vsll.vx v25, v25, a1
+; CHECK-NEXT:    vmv.v.x v26, a0
+; CHECK-NEXT:    vsll.vx v26, v26, a1
+; CHECK-NEXT:    vsrl.vx v26, v26, a1
+; CHECK-NEXT:    vor.vv v25, v26, v25
+; CHECK-NEXT:    vid.v v26
+; CHECK-NEXT:    vmseq.vx v0, v26, a2
+; CHECK-NEXT:    vmerge.vvm v16, v16, v25, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i64> %v, i64 %elt, i32 %idx
+  ret <vscale x 1 x i64> %r
+}
+
+define <vscale x 2 x i64> @insertelt_nxv2i64_0(<vscale x 2 x i64> %v, i64 %elt) {
+; CHECK-LABEL: insertelt_nxv2i64_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e64,m2,ta,mu
+; CHECK-NEXT:    vmv.v.x v26, a1
+; CHECK-NEXT:    addi a1, zero, 32
+; CHECK-NEXT:    vsll.vx v26, v26, a1
+; CHECK-NEXT:    vmv.v.x v28, a0
+; CHECK-NEXT:    vsll.vx v28, v28, a1
+; CHECK-NEXT:    vsrl.vx v28, v28, a1
+; CHECK-NEXT:    vor.vv v26, v28, v26
+; CHECK-NEXT:    vid.v v28
+; CHECK-NEXT:    vmseq.vi v0, v28, 0
+; CHECK-NEXT:    vmerge.vvm v16, v16, v26, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i64> %v, i64 %elt, i32 0
+  ret <vscale x 2 x i64> %r
+}
+
+define <vscale x 2 x i64> @insertelt_nxv2i64_imm(<vscale x 2 x i64> %v, i64 %elt) {
+; CHECK-LABEL: insertelt_nxv2i64_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e64,m2,ta,mu
+; CHECK-NEXT:    vmv.v.x v26, a1
+; CHECK-NEXT:    addi a1, zero, 32
+; CHECK-NEXT:    vsll.vx v26, v26, a1
+; CHECK-NEXT:    vmv.v.x v28, a0
+; CHECK-NEXT:    vsll.vx v28, v28, a1
+; CHECK-NEXT:    vsrl.vx v28, v28, a1
+; CHECK-NEXT:    vor.vv v26, v28, v26
+; CHECK-NEXT:    vid.v v28
+; CHECK-NEXT:    vmseq.vi v0, v28, 3
+; CHECK-NEXT:    vmerge.vvm v16, v16, v26, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i64> %v, i64 %elt, i32 3
+  ret <vscale x 2 x i64> %r
+}
+
+define <vscale x 2 x i64> @insertelt_nxv2i64_idx(<vscale x 2 x i64> %v, i64 %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv2i64_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a3, zero, e64,m2,ta,mu
+; CHECK-NEXT:    vmv.v.x v26, a1
+; CHECK-NEXT:    addi a1, zero, 32
+; CHECK-NEXT:    vsll.vx v26, v26, a1
+; CHECK-NEXT:    vmv.v.x v28, a0
+; CHECK-NEXT:    vsll.vx v28, v28, a1
+; CHECK-NEXT:    vsrl.vx v28, v28, a1
+; CHECK-NEXT:    vor.vv v26, v28, v26
+; CHECK-NEXT:    vid.v v28
+; CHECK-NEXT:    vmseq.vx v0, v28, a2
+; CHECK-NEXT:    vmerge.vvm v16, v16, v26, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i64> %v, i64 %elt, i32 %idx
+  ret <vscale x 2 x i64> %r
+}
+
+define <vscale x 4 x i64> @insertelt_nxv4i64_0(<vscale x 4 x i64> %v, i64 %elt) {
+; CHECK-LABEL: insertelt_nxv4i64_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e64,m4,ta,mu
+; CHECK-NEXT:    vmv.v.x v28, a1
+; CHECK-NEXT:    addi a1, zero, 32
+; CHECK-NEXT:    vsll.vx v28, v28, a1
+; CHECK-NEXT:    vmv.v.x v8, a0
+; CHECK-NEXT:    vsll.vx v8, v8, a1
+; CHECK-NEXT:    vsrl.vx v8, v8, a1
+; CHECK-NEXT:    vor.vv v28, v8, v28
+; CHECK-NEXT:    vid.v v8
+; CHECK-NEXT:    vmseq.vi v0, v8, 0
+; CHECK-NEXT:    vmerge.vvm v16, v16, v28, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i64> %v, i64 %elt, i32 0
+  ret <vscale x 4 x i64> %r
+}
+
+define <vscale x 4 x i64> @insertelt_nxv4i64_imm(<vscale x 4 x i64> %v, i64 %elt) {
+; CHECK-LABEL: insertelt_nxv4i64_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e64,m4,ta,mu
+; CHECK-NEXT:    vmv.v.x v28, a1
+; CHECK-NEXT:    addi a1, zero, 32
+; CHECK-NEXT:    vsll.vx v28, v28, a1
+; CHECK-NEXT:    vmv.v.x v8, a0
+; CHECK-NEXT:    vsll.vx v8, v8, a1
+; CHECK-NEXT:    vsrl.vx v8, v8, a1
+; CHECK-NEXT:    vor.vv v28, v8, v28
+; CHECK-NEXT:    vid.v v8
+; CHECK-NEXT:    vmseq.vi v0, v8, 3
+; CHECK-NEXT:    vmerge.vvm v16, v16, v28, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i64> %v, i64 %elt, i32 3
+  ret <vscale x 4 x i64> %r
+}
+
+define <vscale x 4 x i64> @insertelt_nxv4i64_idx(<vscale x 4 x i64> %v, i64 %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv4i64_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a3, zero, e64,m4,ta,mu
+; CHECK-NEXT:    vmv.v.x v28, a1
+; CHECK-NEXT:    addi a1, zero, 32
+; CHECK-NEXT:    vsll.vx v28, v28, a1
+; CHECK-NEXT:    vmv.v.x v8, a0
+; CHECK-NEXT:    vsll.vx v8, v8, a1
+; CHECK-NEXT:    vsrl.vx v8, v8, a1
+; CHECK-NEXT:    vor.vv v28, v8, v28
+; CHECK-NEXT:    vid.v v8
+; CHECK-NEXT:    vmseq.vx v0, v8, a2
+; CHECK-NEXT:    vmerge.vvm v16, v16, v28, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i64> %v, i64 %elt, i32 %idx
+  ret <vscale x 4 x i64> %r
+}
+
+define <vscale x 8 x i64> @insertelt_nxv8i64_0(<vscale x 8 x i64> %v, i64 %elt) {
+; CHECK-LABEL: insertelt_nxv8i64_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e64,m8,ta,mu
+; CHECK-NEXT:    vmv.v.x v8, a1
+; CHECK-NEXT:    addi a1, zero, 32
+; CHECK-NEXT:    vsll.vx v8, v8, a1
+; CHECK-NEXT:    vmv.v.x v24, a0
+; CHECK-NEXT:    vsll.vx v24, v24, a1
+; CHECK-NEXT:    vsrl.vx v24, v24, a1
+; CHECK-NEXT:    vor.vv v8, v24, v8
+; CHECK-NEXT:    vid.v v24
+; CHECK-NEXT:    vmseq.vi v0, v24, 0
+; CHECK-NEXT:    vmerge.vvm v16, v16, v8, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i64> %v, i64 %elt, i32 0
+  ret <vscale x 8 x i64> %r
+}
+
+define <vscale x 8 x i64> @insertelt_nxv8i64_imm(<vscale x 8 x i64> %v, i64 %elt) {
+; CHECK-LABEL: insertelt_nxv8i64_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e64,m8,ta,mu
+; CHECK-NEXT:    vmv.v.x v8, a1
+; CHECK-NEXT:    addi a1, zero, 32
+; CHECK-NEXT:    vsll.vx v8, v8, a1
+; CHECK-NEXT:    vmv.v.x v24, a0
+; CHECK-NEXT:    vsll.vx v24, v24, a1
+; CHECK-NEXT:    vsrl.vx v24, v24, a1
+; CHECK-NEXT:    vor.vv v8, v24, v8
+; CHECK-NEXT:    vid.v v24
+; CHECK-NEXT:    vmseq.vi v0, v24, 3
+; CHECK-NEXT:    vmerge.vvm v16, v16, v8, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i64> %v, i64 %elt, i32 3
+  ret <vscale x 8 x i64> %r
+}
+
+define <vscale x 8 x i64> @insertelt_nxv8i64_idx(<vscale x 8 x i64> %v, i64 %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv8i64_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a3, zero, e64,m8,ta,mu
+; CHECK-NEXT:    vmv.v.x v8, a1
+; CHECK-NEXT:    addi a1, zero, 32
+; CHECK-NEXT:    vsll.vx v8, v8, a1
+; CHECK-NEXT:    vmv.v.x v24, a0
+; CHECK-NEXT:    vsll.vx v24, v24, a1
+; CHECK-NEXT:    vsrl.vx v24, v24, a1
+; CHECK-NEXT:    vor.vv v8, v24, v8
+; CHECK-NEXT:    vid.v v24
+; CHECK-NEXT:    vmseq.vx v0, v24, a2
+; CHECK-NEXT:    vmerge.vvm v16, v16, v8, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i64> %v, i64 %elt, i32 %idx
+  ret <vscale x 8 x i64> %r
+}
+
+; Extra tests to check lowering of constant values
+define <vscale x 2 x i64> @insertelt_nxv2i64_0_c10(<vscale x 2 x i64> %v) {
+; CHECK-LABEL: insertelt_nxv2i64_0_c10:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a0, zero, e64,m2,ta,mu
+; CHECK-NEXT:    vid.v v26
+; CHECK-NEXT:    vmseq.vi v0, v26, 0
+; CHECK-NEXT:    vmerge.vim v16, v16, 10, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i64> %v, i64 10, i32 0
+  ret <vscale x 2 x i64> %r
+}
+
+define <vscale x 2 x i64> @insertelt_nxv2i64_imm_c10(<vscale x 2 x i64> %v) {
+; CHECK-LABEL: insertelt_nxv2i64_imm_c10:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a0, zero, e64,m2,ta,mu
+; CHECK-NEXT:    vid.v v26
+; CHECK-NEXT:    vmseq.vi v0, v26, 3
+; CHECK-NEXT:    vmerge.vim v16, v16, 10, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i64> %v, i64 10, i32 3
+  ret <vscale x 2 x i64> %r
+}
+
+define <vscale x 2 x i64> @insertelt_nxv2i64_idx_c10(<vscale x 2 x i64> %v, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv2i64_idx_c10:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e64,m2,ta,mu
+; CHECK-NEXT:    vid.v v26
+; CHECK-NEXT:    vmseq.vx v0, v26, a0
+; CHECK-NEXT:    vmerge.vim v16, v16, 10, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i64> %v, i64 10, i32 %idx
+  ret <vscale x 2 x i64> %r
+}
+
+define <vscale x 2 x i64> @insertelt_nxv2i64_0_cn1(<vscale x 2 x i64> %v) {
+; CHECK-LABEL: insertelt_nxv2i64_0_cn1:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a0, zero, e64,m2,ta,mu
+; CHECK-NEXT:    vid.v v26
+; CHECK-NEXT:    vmseq.vi v0, v26, 0
+; CHECK-NEXT:    vmerge.vim v16, v16, -1, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i64> %v, i64 -1, i32 0
+  ret <vscale x 2 x i64> %r
+}
+
+define <vscale x 2 x i64> @insertelt_nxv2i64_imm_cn1(<vscale x 2 x i64> %v) {
+; CHECK-LABEL: insertelt_nxv2i64_imm_cn1:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a0, zero, e64,m2,ta,mu
+; CHECK-NEXT:    vid.v v26
+; CHECK-NEXT:    vmseq.vi v0, v26, 3
+; CHECK-NEXT:    vmerge.vim v16, v16, -1, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i64> %v, i64 -1, i32 3
+  ret <vscale x 2 x i64> %r
+}
+
+define <vscale x 2 x i64> @insertelt_nxv2i64_idx_cn1(<vscale x 2 x i64> %v, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv2i64_idx_cn1:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e64,m2,ta,mu
+; CHECK-NEXT:    vid.v v26
+; CHECK-NEXT:    vmseq.vx v0, v26, a0
+; CHECK-NEXT:    vmerge.vim v16, v16, -1, v0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i64> %v, i64 -1, i32 %idx
+  ret <vscale x 2 x i64> %r
+}
diff --git a/llvm/test/CodeGen/RISCV/rvv/insertelt-int-rv64.ll b/llvm/test/CodeGen/RISCV/rvv/insertelt-int-rv64.ll
new file mode 100644
--- /dev/null
+++ b/llvm/test/CodeGen/RISCV/rvv/insertelt-int-rv64.ll
@@ -0,0 +1,844 @@
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc -mtriple=riscv64 -mattr=+d,+experimental-zfh,+experimental-v -target-abi=lp64d \
+; RUN:     -verify-machineinstrs < %s | FileCheck %s
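+
+; Note: these rv64 tests mirror the rv32 ones above; with XLEN=64, every
+; element type up to and including i64 can use the vmv.s.x-based sequence.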
+
+define <vscale x 1 x i8> @insertelt_nxv1i8_0(<vscale x 1 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv1i8_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf8,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i8> %v, i8 %elt, i32 0
+  ret <vscale x 1 x i8> %r
+}
+
+define <vscale x 1 x i8> @insertelt_nxv1i8_imm(<vscale x 1 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv1i8_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf8,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf8,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,mf8,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i8> %v, i8 %elt, i32 3
+  ret <vscale x 1 x i8> %r
+}
+
+define <vscale x 1 x i8> @insertelt_nxv1i8_idx(<vscale x 1 x i8> %v, i8 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv1i8_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e8,mf8,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e8,mf8,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,mf8,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i8> %v, i8 %elt, i32 %idx
+  ret <vscale x 1 x i8> %r
+}
+
+define <vscale x 2 x i8> @insertelt_nxv2i8_0(<vscale x 2 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv2i8_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf4,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i8> %v, i8 %elt, i32 0
+  ret <vscale x 2 x i8> %r
+}
+
+define <vscale x 2 x i8> @insertelt_nxv2i8_imm(<vscale x 2 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv2i8_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf4,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf4,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,mf4,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i8> %v, i8 %elt, i32 3
+  ret <vscale x 2 x i8> %r
+}
+
+define <vscale x 2 x i8> @insertelt_nxv2i8_idx(<vscale x 2 x i8> %v, i8 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv2i8_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e8,mf4,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e8,mf4,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,mf4,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i8> %v, i8 %elt, i32 %idx
+  ret <vscale x 2 x i8> %r
+}
+
+define <vscale x 4 x i8> @insertelt_nxv4i8_0(<vscale x 4 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv4i8_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i8> %v, i8 %elt, i32 0
+  ret <vscale x 4 x i8> %r
+}
+
+define <vscale x 4 x i8> @insertelt_nxv4i8_imm(<vscale x 4 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv4i8_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf2,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e8,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,mf2,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i8> %v, i8 %elt, i32 3
+  ret <vscale x 4 x i8> %r
+}
+
+define <vscale x 4 x i8> @insertelt_nxv4i8_idx(<vscale x 4 x i8> %v, i8 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv4i8_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e8,mf2,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e8,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,mf2,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i8> %v, i8 %elt, i32 %idx
+  ret <vscale x 4 x i8> %r
+}
+
+define <vscale x 8 x i8> @insertelt_nxv8i8_0(<vscale x 8 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv8i8_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i8> %v, i8 %elt, i32 0
+  ret <vscale x 8 x i8> %r
+}
+
+define <vscale x 8 x i8> @insertelt_nxv8i8_imm(<vscale x 8 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv8i8_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,m1,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e8,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,m1,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i8> %v, i8 %elt, i32 3
+  ret <vscale x 8 x i8> %r
+}
+
+define <vscale x 8 x i8> @insertelt_nxv8i8_idx(<vscale x 8 x i8> %v, i8 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv8i8_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e8,m1,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e8,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,m1,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i8> %v, i8 %elt, i32 %idx
+  ret <vscale x 8 x i8> %r
+}
+
+define <vscale x 16 x i8> @insertelt_nxv16i8_0(<vscale x 16 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv16i8_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i8> %v, i8 %elt, i32 0
+  ret <vscale x 16 x i8> %r
+}
+
+define <vscale x 16 x i8> @insertelt_nxv16i8_imm(<vscale x 16 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv16i8_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,m2,tu,mu
+; CHECK-NEXT:    vslidedown.vi v26, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e8,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v26, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,m2,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v26, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i8> %v, i8 %elt, i32 3
+  ret <vscale x 16 x i8> %r
+}
+
+define <vscale x 16 x i8> @insertelt_nxv16i8_idx(<vscale x 16 x i8> %v, i8 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv16i8_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e8,m2,tu,mu
+; CHECK-NEXT:    vslidedown.vx v26, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e8,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v26, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,m2,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v26, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i8> %v, i8 %elt, i32 %idx
+  ret <vscale x 16 x i8> %r
+}
+
+define <vscale x 32 x i8> @insertelt_nxv32i8_0(<vscale x 32 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv32i8_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 32 x i8> %v, i8 %elt, i32 0
+  ret <vscale x 32 x i8> %r
+}
+
+define <vscale x 32 x i8> @insertelt_nxv32i8_imm(<vscale x 32 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv32i8_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,m4,tu,mu
+; CHECK-NEXT:    vslidedown.vi v28, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e8,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v28, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,m4,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v28, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 32 x i8> %v, i8 %elt, i32 3
+  ret <vscale x 32 x i8> %r
+}
+
+define <vscale x 32 x i8> @insertelt_nxv32i8_idx(<vscale x 32 x i8> %v, i8 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv32i8_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e8,m4,tu,mu
+; CHECK-NEXT:    vslidedown.vx v28, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e8,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v28, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,m4,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v28, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 32 x i8> %v, i8 %elt, i32 %idx
+  ret <vscale x 32 x i8> %r
+}
+
+define <vscale x 64 x i8> @insertelt_nxv64i8_0(<vscale x 64 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv64i8_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 64 x i8> %v, i8 %elt, i32 0
+  ret <vscale x 64 x i8> %r
+}
+
+define <vscale x 64 x i8> @insertelt_nxv64i8_imm(<vscale x 64 x i8> %v, i8 signext %elt) {
+; CHECK-LABEL: insertelt_nxv64i8_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e8,m8,tu,mu
+; CHECK-NEXT:    vslidedown.vi v8, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e8,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v8, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,m8,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v8, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 64 x i8> %v, i8 %elt, i32 3
+  ret <vscale x 64 x i8> %r
+}
+
+define <vscale x 64 x i8> @insertelt_nxv64i8_idx(<vscale x 64 x i8> %v, i8 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv64i8_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e8,m8,tu,mu
+; CHECK-NEXT:    vslidedown.vx v8, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e8,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v8, a0
+; CHECK-NEXT:    vsetvli a0, zero, e8,m8,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v8, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 64 x i8> %v, i8 %elt, i32 %idx
+  ret <vscale x 64 x i8> %r
+}
+
+define <vscale x 1 x i16> @insertelt_nxv1i16_0(<vscale x 1 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv1i16_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,mf4,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i16> %v, i16 %elt, i32 0
+  ret <vscale x 1 x i16> %r
+}
+
+define <vscale x 1 x i16> @insertelt_nxv1i16_imm(<vscale x 1 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv1i16_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,mf4,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e16,mf4,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,mf4,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i16> %v, i16 %elt, i32 3
+  ret <vscale x 1 x i16> %r
+}
+
+define <vscale x 1 x i16> @insertelt_nxv1i16_idx(<vscale x 1 x i16> %v, i16 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv1i16_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e16,mf4,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e16,mf4,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,mf4,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i16> %v, i16 %elt, i32 %idx
+  ret <vscale x 1 x i16> %r
+}
+
+define <vscale x 2 x i16> @insertelt_nxv2i16_0(<vscale x 2 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv2i16_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i16> %v, i16 %elt, i32 0
+  ret <vscale x 2 x i16> %r
+}
+
+define <vscale x 2 x i16> @insertelt_nxv2i16_imm(<vscale x 2 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv2i16_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,mf2,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e16,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,mf2,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i16> %v, i16 %elt, i32 3
+  ret <vscale x 2 x i16> %r
+}
+
+define <vscale x 2 x i16> @insertelt_nxv2i16_idx(<vscale x 2 x i16> %v, i16 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv2i16_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e16,mf2,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e16,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,mf2,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i16> %v, i16 %elt, i32 %idx
+  ret <vscale x 2 x i16> %r
+}
+
+define <vscale x 4 x i16> @insertelt_nxv4i16_0(<vscale x 4 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv4i16_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i16> %v, i16 %elt, i32 0
+  ret <vscale x 4 x i16> %r
+}
+
+define <vscale x 4 x i16> @insertelt_nxv4i16_imm(<vscale x 4 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv4i16_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,m1,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e16,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,m1,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i16> %v, i16 %elt, i32 3
+  ret <vscale x 4 x i16> %r
+}
+
+define <vscale x 4 x i16> @insertelt_nxv4i16_idx(<vscale x 4 x i16> %v, i16 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv4i16_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e16,m1,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e16,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,m1,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i16> %v, i16 %elt, i32 %idx
+  ret <vscale x 4 x i16> %r
+}
+
+define <vscale x 8 x i16> @insertelt_nxv8i16_0(<vscale x 8 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv8i16_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i16> %v, i16 %elt, i32 0
+  ret <vscale x 8 x i16> %r
+}
+
+define <vscale x 8 x i16> @insertelt_nxv8i16_imm(<vscale x 8 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv8i16_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,m2,tu,mu
+; CHECK-NEXT:    vslidedown.vi v26, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e16,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v26, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,m2,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v26, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i16> %v, i16 %elt, i32 3
+  ret <vscale x 8 x i16> %r
+}
+
+define <vscale x 8 x i16> @insertelt_nxv8i16_idx(<vscale x 8 x i16> %v, i16 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv8i16_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e16,m2,tu,mu
+; CHECK-NEXT:    vslidedown.vx v26, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e16,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v26, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,m2,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v26, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i16> %v, i16 %elt, i32 %idx
+  ret <vscale x 8 x i16> %r
+}
+
+define <vscale x 16 x i16> @insertelt_nxv16i16_0(<vscale x 16 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv16i16_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i16> %v, i16 %elt, i32 0
+  ret <vscale x 16 x i16> %r
+}
+
+define <vscale x 16 x i16> @insertelt_nxv16i16_imm(<vscale x 16 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv16i16_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,m4,tu,mu
+; CHECK-NEXT:    vslidedown.vi v28, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e16,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v28, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,m4,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v28, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i16> %v, i16 %elt, i32 3
+  ret <vscale x 16 x i16> %r
+}
+
+define <vscale x 16 x i16> @insertelt_nxv16i16_idx(<vscale x 16 x i16> %v, i16 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv16i16_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e16,m4,tu,mu
+; CHECK-NEXT:    vslidedown.vx v28, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e16,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v28, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,m4,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v28, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i16> %v, i16 %elt, i32 %idx
+  ret <vscale x 16 x i16> %r
+}
+
+define <vscale x 32 x i16> @insertelt_nxv32i16_0(<vscale x 32 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv32i16_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 32 x i16> %v, i16 %elt, i32 0
+  ret <vscale x 32 x i16> %r
+}
+
+define <vscale x 32 x i16> @insertelt_nxv32i16_imm(<vscale x 32 x i16> %v, i16 signext %elt) {
+; CHECK-LABEL: insertelt_nxv32i16_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e16,m8,tu,mu
+; CHECK-NEXT:    vslidedown.vi v8, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e16,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v8, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,m8,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v8, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 32 x i16> %v, i16 %elt, i32 3
+  ret <vscale x 32 x i16> %r
+}
+
+define <vscale x 32 x i16> @insertelt_nxv32i16_idx(<vscale x 32 x i16> %v, i16 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv32i16_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e16,m8,tu,mu
+; CHECK-NEXT:    vslidedown.vx v8, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e16,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v8, a0
+; CHECK-NEXT:    vsetvli a0, zero, e16,m8,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v8, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 32 x i16> %v, i16 %elt, i32 %idx
+  ret <vscale x 32 x i16> %r
+}
+
+define <vscale x 1 x i32> @insertelt_nxv1i32_0(<vscale x 1 x i32> %v, i32 signext %elt) {
+; CHECK-LABEL: insertelt_nxv1i32_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i32> %v, i32 %elt, i32 0
+  ret <vscale x 1 x i32> %r
+}
+
+define <vscale x 1 x i32> @insertelt_nxv1i32_imm(<vscale x 1 x i32> %v, i32 signext %elt) {
+; CHECK-LABEL: insertelt_nxv1i32_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,mf2,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e32,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,mf2,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i32> %v, i32 %elt, i32 3
+  ret <vscale x 1 x i32> %r
+}
+
+define <vscale x 1 x i32> @insertelt_nxv1i32_idx(<vscale x 1 x i32> %v, i32 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv1i32_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e32,mf2,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e32,mf2,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,mf2,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i32> %v, i32 %elt, i32 %idx
+  ret <vscale x 1 x i32> %r
+}
+
+define <vscale x 2 x i32> @insertelt_nxv2i32_0(<vscale x 2 x i32> %v, i32 signext %elt) {
+; CHECK-LABEL: insertelt_nxv2i32_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i32> %v, i32 %elt, i32 0
+  ret <vscale x 2 x i32> %r
+}
+
+define <vscale x 2 x i32> @insertelt_nxv2i32_imm(<vscale x 2 x i32> %v, i32 signext %elt) {
+; CHECK-LABEL: insertelt_nxv2i32_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,m1,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e32,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,m1,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i32> %v, i32 %elt, i32 3
+  ret <vscale x 2 x i32> %r
+}
+
+define <vscale x 2 x i32> @insertelt_nxv2i32_idx(<vscale x 2 x i32> %v, i32 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv2i32_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e32,m1,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e32,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,m1,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i32> %v, i32 %elt, i32 %idx
+  ret <vscale x 2 x i32> %r
+}
+
+define <vscale x 4 x i32> @insertelt_nxv4i32_0(<vscale x 4 x i32> %v, i32 signext %elt) {
+; CHECK-LABEL: insertelt_nxv4i32_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i32> %v, i32 %elt, i32 0
+  ret <vscale x 4 x i32> %r
+}
+
+define <vscale x 4 x i32> @insertelt_nxv4i32_imm(<vscale x 4 x i32> %v, i32 signext %elt) {
+; CHECK-LABEL: insertelt_nxv4i32_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,m2,tu,mu
+; CHECK-NEXT:    vslidedown.vi v26, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e32,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v26, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,m2,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v26, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i32> %v, i32 %elt, i32 3
+  ret <vscale x 4 x i32> %r
+}
+
+define <vscale x 4 x i32> @insertelt_nxv4i32_idx(<vscale x 4 x i32> %v, i32 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv4i32_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e32,m2,tu,mu
+; CHECK-NEXT:    vslidedown.vx v26, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e32,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v26, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,m2,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v26, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i32> %v, i32 %elt, i32 %idx
+  ret <vscale x 4 x i32> %r
+}
+
+define <vscale x 8 x i32> @insertelt_nxv8i32_0(<vscale x 8 x i32> %v, i32 signext %elt) {
+; CHECK-LABEL: insertelt_nxv8i32_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i32> %v, i32 %elt, i32 0
+  ret <vscale x 8 x i32> %r
+}
+
+define <vscale x 8 x i32> @insertelt_nxv8i32_imm(<vscale x 8 x i32> %v, i32 signext %elt) {
+; CHECK-LABEL: insertelt_nxv8i32_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,m4,tu,mu
+; CHECK-NEXT:    vslidedown.vi v28, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e32,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v28, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,m4,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v28, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i32> %v, i32 %elt, i32 3
+  ret <vscale x 8 x i32> %r
+}
+
+define <vscale x 8 x i32> @insertelt_nxv8i32_idx(<vscale x 8 x i32> %v, i32 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv8i32_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e32,m4,tu,mu
+; CHECK-NEXT:    vslidedown.vx v28, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e32,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v28, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,m4,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v28, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i32> %v, i32 %elt, i32 %idx
+  ret <vscale x 8 x i32> %r
+}
+
+define <vscale x 16 x i32> @insertelt_nxv16i32_0(<vscale x 16 x i32> %v, i32 signext %elt) {
+; CHECK-LABEL: insertelt_nxv16i32_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i32> %v, i32 %elt, i32 0
+  ret <vscale x 16 x i32> %r
+}
+
+define <vscale x 16 x i32> @insertelt_nxv16i32_imm(<vscale x 16 x i32> %v, i32 signext %elt) {
+; CHECK-LABEL: insertelt_nxv16i32_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e32,m8,tu,mu
+; CHECK-NEXT:    vslidedown.vi v8, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e32,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v8, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,m8,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v8, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i32> %v, i32 %elt, i32 3
+  ret <vscale x 16 x i32> %r
+}
+
+define <vscale x 16 x i32> @insertelt_nxv16i32_idx(<vscale x 16 x i32> %v, i32 signext %elt, i32 signext %idx) {
+; CHECK-LABEL: insertelt_nxv16i32_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a2, zero, e32,m8,tu,mu
+; CHECK-NEXT:    vslidedown.vx v8, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e32,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v8, a0
+; CHECK-NEXT:    vsetvli a0, zero, e32,m8,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v8, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 16 x i32> %v, i32 %elt, i32 %idx
+  ret <vscale x 16 x i32> %r
+}
+
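+; With i64 legal as a scalar type on RV64, i64 inserts use the same sequence
+; as the narrower types; the sext.w in the _idx variants promotes the i32
+; %idx argument, which is not marked signext here.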
+define <vscale x 1 x i64> @insertelt_nxv1i64_0(<vscale x 1 x i64> %v, i64 %elt) {
+; CHECK-LABEL: insertelt_nxv1i64_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e64,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i64> %v, i64 %elt, i32 0
+  ret <vscale x 1 x i64> %r
+}
+
+define <vscale x 1 x i64> @insertelt_nxv1i64_imm(<vscale x 1 x i64> %v, i64 %elt) {
+; CHECK-LABEL: insertelt_nxv1i64_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e64,m1,tu,mu
+; CHECK-NEXT:    vslidedown.vi v25, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e64,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e64,m1,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v25, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i64> %v, i64 %elt, i32 3
+  ret <vscale x 1 x i64> %r
+}
+
+define <vscale x 1 x i64> @insertelt_nxv1i64_idx(<vscale x 1 x i64> %v, i64 %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv1i64_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    sext.w a1, a1
+; CHECK-NEXT:    vsetvli a2, zero, e64,m1,tu,mu
+; CHECK-NEXT:    vslidedown.vx v25, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e64,m1,ta,mu
+; CHECK-NEXT:    vmv.s.x v25, a0
+; CHECK-NEXT:    vsetvli a0, zero, e64,m1,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v25, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 1 x i64> %v, i64 %elt, i32 %idx
+  ret <vscale x 1 x i64> %r
+}
+
+define <vscale x 2 x i64> @insertelt_nxv2i64_0(<vscale x 2 x i64> %v, i64 %elt) {
+; CHECK-LABEL: insertelt_nxv2i64_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e64,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i64> %v, i64 %elt, i32 0
+  ret <vscale x 2 x i64> %r
+}
+
+define <vscale x 2 x i64> @insertelt_nxv2i64_imm(<vscale x 2 x i64> %v, i64 %elt) {
+; CHECK-LABEL: insertelt_nxv2i64_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e64,m2,tu,mu
+; CHECK-NEXT:    vslidedown.vi v26, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e64,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v26, a0
+; CHECK-NEXT:    vsetvli a0, zero, e64,m2,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v26, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i64> %v, i64 %elt, i32 3
+  ret <vscale x 2 x i64> %r
+}
+
+define <vscale x 2 x i64> @insertelt_nxv2i64_idx(<vscale x 2 x i64> %v, i64 %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv2i64_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    sext.w a1, a1
+; CHECK-NEXT:    vsetvli a2, zero, e64,m2,tu,mu
+; CHECK-NEXT:    vslidedown.vx v26, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e64,m2,ta,mu
+; CHECK-NEXT:    vmv.s.x v26, a0
+; CHECK-NEXT:    vsetvli a0, zero, e64,m2,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v26, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 2 x i64> %v, i64 %elt, i32 %idx
+  ret <vscale x 2 x i64> %r
+}
+
+define <vscale x 4 x i64> @insertelt_nxv4i64_0(<vscale x 4 x i64> %v, i64 %elt) {
+; CHECK-LABEL: insertelt_nxv4i64_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e64,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i64> %v, i64 %elt, i32 0
+  ret <vscale x 4 x i64> %r
+}
+
+define <vscale x 4 x i64> @insertelt_nxv4i64_imm(<vscale x 4 x i64> %v, i64 %elt) {
+; CHECK-LABEL: insertelt_nxv4i64_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e64,m4,tu,mu
+; CHECK-NEXT:    vslidedown.vi v28, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e64,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v28, a0
+; CHECK-NEXT:    vsetvli a0, zero, e64,m4,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v28, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i64> %v, i64 %elt, i32 3
+  ret <vscale x 4 x i64> %r
+}
+
+define <vscale x 4 x i64> @insertelt_nxv4i64_idx(<vscale x 4 x i64> %v, i64 %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv4i64_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    sext.w a1, a1
+; CHECK-NEXT:    vsetvli a2, zero, e64,m4,tu,mu
+; CHECK-NEXT:    vslidedown.vx v28, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e64,m4,ta,mu
+; CHECK-NEXT:    vmv.s.x v28, a0
+; CHECK-NEXT:    vsetvli a0, zero, e64,m4,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v28, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 4 x i64> %v, i64 %elt, i32 %idx
+  ret <vscale x 4 x i64> %r
+}
+
+define <vscale x 8 x i64> @insertelt_nxv8i64_0(<vscale x 8 x i64> %v, i64 %elt) {
+; CHECK-LABEL: insertelt_nxv8i64_0:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e64,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v16, a0
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i64> %v, i64 %elt, i32 0
+  ret <vscale x 8 x i64> %r
+}
+
+define <vscale x 8 x i64> @insertelt_nxv8i64_imm(<vscale x 8 x i64> %v, i64 %elt) {
+; CHECK-LABEL: insertelt_nxv8i64_imm:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    vsetvli a1, zero, e64,m8,tu,mu
+; CHECK-NEXT:    vslidedown.vi v8, v16, 3
+; CHECK-NEXT:    vsetvli a1, zero, e64,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v8, a0
+; CHECK-NEXT:    vsetvli a0, zero, e64,m8,tu,mu
+; CHECK-NEXT:    vslideup.vi v16, v8, 3
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i64> %v, i64 %elt, i32 3
+  ret <vscale x 8 x i64> %r
+}
+
+define <vscale x 8 x i64> @insertelt_nxv8i64_idx(<vscale x 8 x i64> %v, i64 %elt, i32 %idx) {
+; CHECK-LABEL: insertelt_nxv8i64_idx:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    sext.w a1, a1
+; CHECK-NEXT:    vsetvli a2, zero, e64,m8,tu,mu
+; CHECK-NEXT:    vslidedown.vx v8, v16, a1
+; CHECK-NEXT:    vsetvli a2, zero, e64,m8,ta,mu
+; CHECK-NEXT:    vmv.s.x v8, a0
+; CHECK-NEXT:    vsetvli a0, zero, e64,m8,tu,mu
+; CHECK-NEXT:    vslideup.vx v16, v8, a1
+; CHECK-NEXT:    ret
+  %r = insertelement <vscale x 8 x i64> %v, i64 %elt, i32 %idx
+  ret <vscale x 8 x i64> %r
+}