diff --git a/llvm/include/llvm/IR/IntrinsicsRISCV.td b/llvm/include/llvm/IR/IntrinsicsRISCV.td --- a/llvm/include/llvm/IR/IntrinsicsRISCV.td +++ b/llvm/include/llvm/IR/IntrinsicsRISCV.td @@ -375,6 +375,20 @@ [LLVMMatchType<0>, llvm_anyvector_ty, LLVMMatchType<0>, LLVMScalarOrSameVectorWidth<1, llvm_i1_ty>, llvm_anyint_ty], [IntrNoMem]>, RISCVVIntrinsic; + // For unary operations with scalar type output without mask + // Output: (scalar type) + // Input: (vector_in, vl) + class RISCVMaskUnarySOutNoMask + : Intrinsic<[llvm_anyint_ty], + [llvm_anyvector_ty, LLVMMatchType<0>], + [IntrNoMem]>, RISCVVIntrinsic; + // For unary operations with scalar type output with mask + // Output: (scalar type) + // Input: (vector_in, mask, vl) + class RISCVMaskUnarySOutMask + : Intrinsic<[llvm_anyint_ty], + [llvm_anyvector_ty, LLVMMatchType<1>, LLVMMatchType<0>], + [IntrNoMem]>, RISCVVIntrinsic; multiclass RISCVUSLoad { def "int_riscv_" # NAME : RISCVUSLoad; @@ -451,6 +465,10 @@ def "int_riscv_" # NAME : RISCVReductionNoMask; def "int_riscv_" # NAME # "_mask" : RISCVReductionMask; } + multiclass RISCVMaskUnarySOut { + def "int_riscv_" # NAME : RISCVMaskUnarySOutNoMask; + def "int_riscv_" # NAME # "_mask" : RISCVMaskUnarySOutMask; + } defm vle : RISCVUSLoad; defm vleff : RISCVUSLoad; @@ -658,4 +676,8 @@ def int_riscv_vmnor: RISCVBinaryAAANoMask; def int_riscv_vmornot: RISCVBinaryAAANoMask; def int_riscv_vmxnor: RISCVBinaryAAANoMask; + + defm vpopc : RISCVMaskUnarySOut; + defm vfirst : RISCVMaskUnarySOut; + } // TargetPrefix = "riscv" diff --git a/llvm/lib/Target/RISCV/RISCVInstrInfoVPseudos.td b/llvm/lib/Target/RISCV/RISCVInstrInfoVPseudos.td --- a/llvm/lib/Target/RISCV/RISCVInstrInfoVPseudos.td +++ b/llvm/lib/Target/RISCV/RISCVInstrInfoVPseudos.td @@ -188,23 +188,24 @@ VTypeInfo Vti = !cast(!subst("VF", "VI", !cast(vti))); } -class MTypeInfo { +class MTypeInfo { ValueType Mask = Mas; // {SEW, VLMul} values set a valid VType to deal with this mask type. // we assume SEW=8 and set corresponding LMUL. int SEW = 8; LMULInfo LMul = M; + string BX = Bx; // Appendix of mask operations. } defset list AllMasks = { // vbool_t, = SEW/LMUL, we assume SEW=8 and corresponding LMUL. - def : MTypeInfo; - def : MTypeInfo; - def : MTypeInfo; - def : MTypeInfo; - def : MTypeInfo; - def : MTypeInfo; - def : MTypeInfo; + def : MTypeInfo; + def : MTypeInfo; + def : MTypeInfo; + def : MTypeInfo; + def : MTypeInfo; + def : MTypeInfo; + def : MTypeInfo; } class VTypeInfoToWide @@ -294,8 +295,15 @@ !subst("_MF2", "", !subst("_MF4", "", !subst("_MF8", "", + !subst("_B1", "", + !subst("_B2", "", + !subst("_B4", "", + !subst("_B8", "", + !subst("_B16", "", + !subst("_B32", "", + !subst("_B64", "", !subst("_MASK", "", - !subst("Pseudo", "", PseudoInst))))))))); + !subst("Pseudo", "", PseudoInst)))))))))))))))); } // The destination vector register group for a masked vector instruction cannot @@ -499,6 +507,36 @@ let BaseInstr = !cast(PseudoToVInst.VInst); } +class VMaskPseudoUnarySOutNoMask: + Pseudo<(outs GPR:$rd), + (ins VR:$rs1, GPR:$vl, ixlenimm:$sew), []>, + RISCVVPseudo { + let mayLoad = 0; + let mayStore = 0; + let hasSideEffects = 0; + let usesCustomInserter = 1; + let Uses = [VL, VTYPE]; + let VLIndex = 2; + let SEWIndex = 3; + let HasDummyMask = 1; + let BaseInstr = !cast(PseudoToVInst.VInst); +} + +class VMaskPseudoUnarySOutMask: + Pseudo<(outs GPR:$rd), + (ins VR:$rs1, VMaskOp:$vm, GPR:$vl, ixlenimm:$sew), []>, + RISCVVPseudo { + let mayLoad = 0; + let mayStore = 0; + let hasSideEffects = 0; + let usesCustomInserter = 1; + let Uses = [VL, VTYPE]; + let VLIndex = 3; + let SEWIndex = 4; + let HasDummyMask = 1; + let BaseInstr = !cast(PseudoToVInst.VInst); +} + class VPseudoBinaryNoMask; } +multiclass VPatMaskUnarySOut +{ + foreach mti = AllMasks in { + def : Pat<(XLenVT (!cast(intrinsic_name) + (mti.Mask VR:$rs1), GPR:$vl)), + (!cast(inst#"_M_"#mti.BX) $rs1, + (NoX0 GPR:$vl), mti.SEW)>; + def : Pat<(XLenVT (!cast(intrinsic_name # "_mask") + (mti.Mask VR:$rs1), (mti.Mask V0), GPR:$vl)), + (!cast(inst#"_M_"#mti.BX#"_MASK") $rs1, + (mti.Mask V0), (NoX0 GPR:$vl), mti.SEW)>; + } +} + + multiclass VPatBinary; } // Predicates = [HasStdExtV] +//===----------------------------------------------------------------------===// +// 16.2. Vector mask population count vpopc +//===----------------------------------------------------------------------===// +let Predicates = [HasStdExtV] in { + defm "" : VPatMaskUnarySOut<"int_riscv_vpopc", "PseudoVPOPC">; +} // Predicates = [HasStdExtV] + +//===----------------------------------------------------------------------===// +// 16.3. vfirst find-first-set mask bit +//===----------------------------------------------------------------------===// +let Predicates = [HasStdExtV] in { + defm "" : VPatMaskUnarySOut<"int_riscv_vfirst", "PseudoVFIRST">; +} // Predicates = [HasStdExtV] + //===----------------------------------------------------------------------===// // 17. Vector Permutation Instructions //===----------------------------------------------------------------------===// diff --git a/llvm/test/CodeGen/RISCV/rvv/vfirst-rv32.ll b/llvm/test/CodeGen/RISCV/rvv/vfirst-rv32.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/RISCV/rvv/vfirst-rv32.ll @@ -0,0 +1,239 @@ +; RUN: llc -mtriple=riscv32 -mattr=+experimental-v,+f -verify-machineinstrs \ +; RUN: --riscv-no-aliases < %s | FileCheck %s +declare i32 @llvm.riscv.vfirst.i64.nxv1i1( + , + i32); + +define i32 @intrinsic_vfirst_m_i64_nxv1i1( %0, i32 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_m_i64_nxv1i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf8,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}} + %a = call i32 @llvm.riscv.vfirst.i64.nxv1i1( + %0, + i32 %1) + + ret i32 %a +} + +declare i32 @llvm.riscv.vfirst.mask.i64.nxv1i1( + , + , + i32); + +define i32 @intrinsic_vfirst_mask_m_i64_nxv1i1( %0, %1, i32 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_mask_m_i64_nxv1i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf8,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}}, v0.t + %a = call i32 @llvm.riscv.vfirst.mask.i64.nxv1i1( + %0, + %1, + i32 %2) + + ret i32 %a +} + +declare i32 @llvm.riscv.vfirst.i64.nxv2i1( + , + i32); + +define i32 @intrinsic_vfirst_m_i64_nxv2i1( %0, i32 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_m_i64_nxv2i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf4,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}} + %a = call i32 @llvm.riscv.vfirst.i64.nxv2i1( + %0, + i32 %1) + + ret i32 %a +} + +declare i32 @llvm.riscv.vfirst.mask.i64.nxv2i1( + , + , + i32); + +define i32 @intrinsic_vfirst_mask_m_i64_nxv2i1( %0, %1, i32 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_mask_m_i64_nxv2i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf4,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}}, v0.t + %a = call i32 @llvm.riscv.vfirst.mask.i64.nxv2i1( + %0, + %1, + i32 %2) + + ret i32 %a +} + +declare i32 @llvm.riscv.vfirst.i64.nxv4i1( + , + i32); + +define i32 @intrinsic_vfirst_m_i64_nxv4i1( %0, i32 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_m_i64_nxv4i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf2,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}} + %a = call i32 @llvm.riscv.vfirst.i64.nxv4i1( + %0, + i32 %1) + + ret i32 %a +} + +declare i32 @llvm.riscv.vfirst.mask.i64.nxv4i1( + , + , + i32); + +define i32 @intrinsic_vfirst_mask_m_i64_nxv4i1( %0, %1, i32 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_mask_m_i64_nxv4i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf2,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}}, v0.t + %a = call i32 @llvm.riscv.vfirst.mask.i64.nxv4i1( + %0, + %1, + i32 %2) + + ret i32 %a +} + +declare i32 @llvm.riscv.vfirst.i64.nxv8i1( + , + i32); + +define i32 @intrinsic_vfirst_m_i64_nxv8i1( %0, i32 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_m_i64_nxv8i1 +; CHECK: vsetvli {{.*}}, a0, e8,m1,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}} + %a = call i32 @llvm.riscv.vfirst.i64.nxv8i1( + %0, + i32 %1) + + ret i32 %a +} + +declare i32 @llvm.riscv.vfirst.mask.i64.nxv8i1( + , + , + i32); + +define i32 @intrinsic_vfirst_mask_m_i64_nxv8i1( %0, %1, i32 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_mask_m_i64_nxv8i1 +; CHECK: vsetvli {{.*}}, a0, e8,m1,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}}, v0.t + %a = call i32 @llvm.riscv.vfirst.mask.i64.nxv8i1( + %0, + %1, + i32 %2) + + ret i32 %a +} + +declare i32 @llvm.riscv.vfirst.i64.nxv16i1( + , + i32); + +define i32 @intrinsic_vfirst_m_i64_nxv16i1( %0, i32 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_m_i64_nxv16i1 +; CHECK: vsetvli {{.*}}, a0, e8,m2,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}} + %a = call i32 @llvm.riscv.vfirst.i64.nxv16i1( + %0, + i32 %1) + + ret i32 %a +} + +declare i32 @llvm.riscv.vfirst.mask.i64.nxv16i1( + , + , + i32); + +define i32 @intrinsic_vfirst_mask_m_i64_nxv16i1( %0, %1, i32 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_mask_m_i64_nxv16i1 +; CHECK: vsetvli {{.*}}, a0, e8,m2,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}}, v0.t + %a = call i32 @llvm.riscv.vfirst.mask.i64.nxv16i1( + %0, + %1, + i32 %2) + + ret i32 %a +} + +declare i32 @llvm.riscv.vfirst.i64.nxv32i1( + , + i32); + +define i32 @intrinsic_vfirst_m_i64_nxv32i1( %0, i32 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_m_i64_nxv32i1 +; CHECK: vsetvli {{.*}}, a0, e8,m4,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}} + %a = call i32 @llvm.riscv.vfirst.i64.nxv32i1( + %0, + i32 %1) + + ret i32 %a +} + +declare i32 @llvm.riscv.vfirst.mask.i64.nxv32i1( + , + , + i32); + +define i32 @intrinsic_vfirst_mask_m_i64_nxv32i1( %0, %1, i32 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_mask_m_i64_nxv32i1 +; CHECK: vsetvli {{.*}}, a0, e8,m4,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}}, v0.t + %a = call i32 @llvm.riscv.vfirst.mask.i64.nxv32i1( + %0, + %1, + i32 %2) + + ret i32 %a +} + +declare i32 @llvm.riscv.vfirst.i64.nxv64i1( + , + i32); + +define i32 @intrinsic_vfirst_m_i64_nxv64i1( %0, i32 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_m_i64_nxv64i1 +; CHECK: vsetvli {{.*}}, a0, e8,m8,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}} + %a = call i32 @llvm.riscv.vfirst.i64.nxv64i1( + %0, + i32 %1) + + ret i32 %a +} + +declare i32 @llvm.riscv.vfirst.mask.i64.nxv64i1( + , + , + i32); + +define i32 @intrinsic_vfirst_mask_m_i64_nxv64i1( %0, %1, i32 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_mask_m_i64_nxv64i1 +; CHECK: vsetvli {{.*}}, a0, e8,m8,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}}, v0.t + %a = call i32 @llvm.riscv.vfirst.mask.i64.nxv64i1( + %0, + %1, + i32 %2) + + ret i32 %a +} diff --git a/llvm/test/CodeGen/RISCV/rvv/vfirst-rv64.ll b/llvm/test/CodeGen/RISCV/rvv/vfirst-rv64.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/RISCV/rvv/vfirst-rv64.ll @@ -0,0 +1,239 @@ +; RUN: llc -mtriple=riscv64 -mattr=+experimental-v,+d -verify-machineinstrs \ +; RUN: --riscv-no-aliases < %s | FileCheck %s +declare i64 @llvm.riscv.vfirst.i64.nxv1i1( + , + i64); + +define i64 @intrinsic_vfirst_m_i64_nxv1i1( %0, i64 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_m_i64_nxv1i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf8,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}} + %a = call i64 @llvm.riscv.vfirst.i64.nxv1i1( + %0, + i64 %1) + + ret i64 %a +} + +declare i64 @llvm.riscv.vfirst.mask.i64.nxv1i1( + , + , + i64); + +define i64 @intrinsic_vfirst_mask_m_i64_nxv1i1( %0, %1, i64 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_mask_m_i64_nxv1i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf8,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}}, v0.t + %a = call i64 @llvm.riscv.vfirst.mask.i64.nxv1i1( + %0, + %1, + i64 %2) + + ret i64 %a +} + +declare i64 @llvm.riscv.vfirst.i64.nxv2i1( + , + i64); + +define i64 @intrinsic_vfirst_m_i64_nxv2i1( %0, i64 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_m_i64_nxv2i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf4,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}} + %a = call i64 @llvm.riscv.vfirst.i64.nxv2i1( + %0, + i64 %1) + + ret i64 %a +} + +declare i64 @llvm.riscv.vfirst.mask.i64.nxv2i1( + , + , + i64); + +define i64 @intrinsic_vfirst_mask_m_i64_nxv2i1( %0, %1, i64 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_mask_m_i64_nxv2i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf4,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}}, v0.t + %a = call i64 @llvm.riscv.vfirst.mask.i64.nxv2i1( + %0, + %1, + i64 %2) + + ret i64 %a +} + +declare i64 @llvm.riscv.vfirst.i64.nxv4i1( + , + i64); + +define i64 @intrinsic_vfirst_m_i64_nxv4i1( %0, i64 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_m_i64_nxv4i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf2,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}} + %a = call i64 @llvm.riscv.vfirst.i64.nxv4i1( + %0, + i64 %1) + + ret i64 %a +} + +declare i64 @llvm.riscv.vfirst.mask.i64.nxv4i1( + , + , + i64); + +define i64 @intrinsic_vfirst_mask_m_i64_nxv4i1( %0, %1, i64 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_mask_m_i64_nxv4i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf2,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}}, v0.t + %a = call i64 @llvm.riscv.vfirst.mask.i64.nxv4i1( + %0, + %1, + i64 %2) + + ret i64 %a +} + +declare i64 @llvm.riscv.vfirst.i64.nxv8i1( + , + i64); + +define i64 @intrinsic_vfirst_m_i64_nxv8i1( %0, i64 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_m_i64_nxv8i1 +; CHECK: vsetvli {{.*}}, a0, e8,m1,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}} + %a = call i64 @llvm.riscv.vfirst.i64.nxv8i1( + %0, + i64 %1) + + ret i64 %a +} + +declare i64 @llvm.riscv.vfirst.mask.i64.nxv8i1( + , + , + i64); + +define i64 @intrinsic_vfirst_mask_m_i64_nxv8i1( %0, %1, i64 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_mask_m_i64_nxv8i1 +; CHECK: vsetvli {{.*}}, a0, e8,m1,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}}, v0.t + %a = call i64 @llvm.riscv.vfirst.mask.i64.nxv8i1( + %0, + %1, + i64 %2) + + ret i64 %a +} + +declare i64 @llvm.riscv.vfirst.i64.nxv16i1( + , + i64); + +define i64 @intrinsic_vfirst_m_i64_nxv16i1( %0, i64 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_m_i64_nxv16i1 +; CHECK: vsetvli {{.*}}, a0, e8,m2,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}} + %a = call i64 @llvm.riscv.vfirst.i64.nxv16i1( + %0, + i64 %1) + + ret i64 %a +} + +declare i64 @llvm.riscv.vfirst.mask.i64.nxv16i1( + , + , + i64); + +define i64 @intrinsic_vfirst_mask_m_i64_nxv16i1( %0, %1, i64 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_mask_m_i64_nxv16i1 +; CHECK: vsetvli {{.*}}, a0, e8,m2,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}}, v0.t + %a = call i64 @llvm.riscv.vfirst.mask.i64.nxv16i1( + %0, + %1, + i64 %2) + + ret i64 %a +} + +declare i64 @llvm.riscv.vfirst.i64.nxv32i1( + , + i64); + +define i64 @intrinsic_vfirst_m_i64_nxv32i1( %0, i64 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_m_i64_nxv32i1 +; CHECK: vsetvli {{.*}}, a0, e8,m4,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}} + %a = call i64 @llvm.riscv.vfirst.i64.nxv32i1( + %0, + i64 %1) + + ret i64 %a +} + +declare i64 @llvm.riscv.vfirst.mask.i64.nxv32i1( + , + , + i64); + +define i64 @intrinsic_vfirst_mask_m_i64_nxv32i1( %0, %1, i64 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_mask_m_i64_nxv32i1 +; CHECK: vsetvli {{.*}}, a0, e8,m4,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}}, v0.t + %a = call i64 @llvm.riscv.vfirst.mask.i64.nxv32i1( + %0, + %1, + i64 %2) + + ret i64 %a +} + +declare i64 @llvm.riscv.vfirst.i64.nxv64i1( + , + i64); + +define i64 @intrinsic_vfirst_m_i64_nxv64i1( %0, i64 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_m_i64_nxv64i1 +; CHECK: vsetvli {{.*}}, a0, e8,m8,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}} + %a = call i64 @llvm.riscv.vfirst.i64.nxv64i1( + %0, + i64 %1) + + ret i64 %a +} + +declare i64 @llvm.riscv.vfirst.mask.i64.nxv64i1( + , + , + i64); + +define i64 @intrinsic_vfirst_mask_m_i64_nxv64i1( %0, %1, i64 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vfirst_mask_m_i64_nxv64i1 +; CHECK: vsetvli {{.*}}, a0, e8,m8,ta,mu +; CHECK: vfirst.m a0, {{v[0-9]+}}, v0.t + %a = call i64 @llvm.riscv.vfirst.mask.i64.nxv64i1( + %0, + %1, + i64 %2) + + ret i64 %a +} diff --git a/llvm/test/CodeGen/RISCV/rvv/vpopc-rv32.ll b/llvm/test/CodeGen/RISCV/rvv/vpopc-rv32.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/RISCV/rvv/vpopc-rv32.ll @@ -0,0 +1,239 @@ +; RUN: llc -mtriple=riscv32 -mattr=+experimental-v,+f -verify-machineinstrs \ +; RUN: --riscv-no-aliases < %s | FileCheck %s +declare i32 @llvm.riscv.vpopc.i64.nxv1i1( + , + i32); + +define i32 @intrinsic_vpopc_m_i64_nxv1i1( %0, i32 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_m_i64_nxv1i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf8,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}} + %a = call i32 @llvm.riscv.vpopc.i64.nxv1i1( + %0, + i32 %1) + + ret i32 %a +} + +declare i32 @llvm.riscv.vpopc.mask.i64.nxv1i1( + , + , + i32); + +define i32 @intrinsic_vpopc_mask_m_i64_nxv1i1( %0, %1, i32 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_mask_m_i64_nxv1i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf8,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}}, v0.t + %a = call i32 @llvm.riscv.vpopc.mask.i64.nxv1i1( + %0, + %1, + i32 %2) + + ret i32 %a +} + +declare i32 @llvm.riscv.vpopc.i64.nxv2i1( + , + i32); + +define i32 @intrinsic_vpopc_m_i64_nxv2i1( %0, i32 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_m_i64_nxv2i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf4,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}} + %a = call i32 @llvm.riscv.vpopc.i64.nxv2i1( + %0, + i32 %1) + + ret i32 %a +} + +declare i32 @llvm.riscv.vpopc.mask.i64.nxv2i1( + , + , + i32); + +define i32 @intrinsic_vpopc_mask_m_i64_nxv2i1( %0, %1, i32 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_mask_m_i64_nxv2i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf4,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}}, v0.t + %a = call i32 @llvm.riscv.vpopc.mask.i64.nxv2i1( + %0, + %1, + i32 %2) + + ret i32 %a +} + +declare i32 @llvm.riscv.vpopc.i64.nxv4i1( + , + i32); + +define i32 @intrinsic_vpopc_m_i64_nxv4i1( %0, i32 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_m_i64_nxv4i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf2,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}} + %a = call i32 @llvm.riscv.vpopc.i64.nxv4i1( + %0, + i32 %1) + + ret i32 %a +} + +declare i32 @llvm.riscv.vpopc.mask.i64.nxv4i1( + , + , + i32); + +define i32 @intrinsic_vpopc_mask_m_i64_nxv4i1( %0, %1, i32 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_mask_m_i64_nxv4i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf2,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}}, v0.t + %a = call i32 @llvm.riscv.vpopc.mask.i64.nxv4i1( + %0, + %1, + i32 %2) + + ret i32 %a +} + +declare i32 @llvm.riscv.vpopc.i64.nxv8i1( + , + i32); + +define i32 @intrinsic_vpopc_m_i64_nxv8i1( %0, i32 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_m_i64_nxv8i1 +; CHECK: vsetvli {{.*}}, a0, e8,m1,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}} + %a = call i32 @llvm.riscv.vpopc.i64.nxv8i1( + %0, + i32 %1) + + ret i32 %a +} + +declare i32 @llvm.riscv.vpopc.mask.i64.nxv8i1( + , + , + i32); + +define i32 @intrinsic_vpopc_mask_m_i64_nxv8i1( %0, %1, i32 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_mask_m_i64_nxv8i1 +; CHECK: vsetvli {{.*}}, a0, e8,m1,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}}, v0.t + %a = call i32 @llvm.riscv.vpopc.mask.i64.nxv8i1( + %0, + %1, + i32 %2) + + ret i32 %a +} + +declare i32 @llvm.riscv.vpopc.i64.nxv16i1( + , + i32); + +define i32 @intrinsic_vpopc_m_i64_nxv16i1( %0, i32 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_m_i64_nxv16i1 +; CHECK: vsetvli {{.*}}, a0, e8,m2,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}} + %a = call i32 @llvm.riscv.vpopc.i64.nxv16i1( + %0, + i32 %1) + + ret i32 %a +} + +declare i32 @llvm.riscv.vpopc.mask.i64.nxv16i1( + , + , + i32); + +define i32 @intrinsic_vpopc_mask_m_i64_nxv16i1( %0, %1, i32 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_mask_m_i64_nxv16i1 +; CHECK: vsetvli {{.*}}, a0, e8,m2,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}}, v0.t + %a = call i32 @llvm.riscv.vpopc.mask.i64.nxv16i1( + %0, + %1, + i32 %2) + + ret i32 %a +} + +declare i32 @llvm.riscv.vpopc.i64.nxv32i1( + , + i32); + +define i32 @intrinsic_vpopc_m_i64_nxv32i1( %0, i32 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_m_i64_nxv32i1 +; CHECK: vsetvli {{.*}}, a0, e8,m4,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}} + %a = call i32 @llvm.riscv.vpopc.i64.nxv32i1( + %0, + i32 %1) + + ret i32 %a +} + +declare i32 @llvm.riscv.vpopc.mask.i64.nxv32i1( + , + , + i32); + +define i32 @intrinsic_vpopc_mask_m_i64_nxv32i1( %0, %1, i32 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_mask_m_i64_nxv32i1 +; CHECK: vsetvli {{.*}}, a0, e8,m4,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}}, v0.t + %a = call i32 @llvm.riscv.vpopc.mask.i64.nxv32i1( + %0, + %1, + i32 %2) + + ret i32 %a +} + +declare i32 @llvm.riscv.vpopc.i64.nxv64i1( + , + i32); + +define i32 @intrinsic_vpopc_m_i64_nxv64i1( %0, i32 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_m_i64_nxv64i1 +; CHECK: vsetvli {{.*}}, a0, e8,m8,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}} + %a = call i32 @llvm.riscv.vpopc.i64.nxv64i1( + %0, + i32 %1) + + ret i32 %a +} + +declare i32 @llvm.riscv.vpopc.mask.i64.nxv64i1( + , + , + i32); + +define i32 @intrinsic_vpopc_mask_m_i64_nxv64i1( %0, %1, i32 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_mask_m_i64_nxv64i1 +; CHECK: vsetvli {{.*}}, a0, e8,m8,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}}, v0.t + %a = call i32 @llvm.riscv.vpopc.mask.i64.nxv64i1( + %0, + %1, + i32 %2) + + ret i32 %a +} diff --git a/llvm/test/CodeGen/RISCV/rvv/vpopc-rv64.ll b/llvm/test/CodeGen/RISCV/rvv/vpopc-rv64.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/RISCV/rvv/vpopc-rv64.ll @@ -0,0 +1,239 @@ +; RUN: llc -mtriple=riscv64 -mattr=+experimental-v,+d -verify-machineinstrs \ +; RUN: --riscv-no-aliases < %s | FileCheck %s +declare i64 @llvm.riscv.vpopc.i64.nxv1i1( + , + i64); + +define i64 @intrinsic_vpopc_m_i64_nxv1i1( %0, i64 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_m_i64_nxv1i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf8,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}} + %a = call i64 @llvm.riscv.vpopc.i64.nxv1i1( + %0, + i64 %1) + + ret i64 %a +} + +declare i64 @llvm.riscv.vpopc.mask.i64.nxv1i1( + , + , + i64); + +define i64 @intrinsic_vpopc_mask_m_i64_nxv1i1( %0, %1, i64 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_mask_m_i64_nxv1i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf8,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}}, v0.t + %a = call i64 @llvm.riscv.vpopc.mask.i64.nxv1i1( + %0, + %1, + i64 %2) + + ret i64 %a +} + +declare i64 @llvm.riscv.vpopc.i64.nxv2i1( + , + i64); + +define i64 @intrinsic_vpopc_m_i64_nxv2i1( %0, i64 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_m_i64_nxv2i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf4,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}} + %a = call i64 @llvm.riscv.vpopc.i64.nxv2i1( + %0, + i64 %1) + + ret i64 %a +} + +declare i64 @llvm.riscv.vpopc.mask.i64.nxv2i1( + , + , + i64); + +define i64 @intrinsic_vpopc_mask_m_i64_nxv2i1( %0, %1, i64 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_mask_m_i64_nxv2i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf4,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}}, v0.t + %a = call i64 @llvm.riscv.vpopc.mask.i64.nxv2i1( + %0, + %1, + i64 %2) + + ret i64 %a +} + +declare i64 @llvm.riscv.vpopc.i64.nxv4i1( + , + i64); + +define i64 @intrinsic_vpopc_m_i64_nxv4i1( %0, i64 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_m_i64_nxv4i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf2,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}} + %a = call i64 @llvm.riscv.vpopc.i64.nxv4i1( + %0, + i64 %1) + + ret i64 %a +} + +declare i64 @llvm.riscv.vpopc.mask.i64.nxv4i1( + , + , + i64); + +define i64 @intrinsic_vpopc_mask_m_i64_nxv4i1( %0, %1, i64 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_mask_m_i64_nxv4i1 +; CHECK: vsetvli {{.*}}, a0, e8,mf2,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}}, v0.t + %a = call i64 @llvm.riscv.vpopc.mask.i64.nxv4i1( + %0, + %1, + i64 %2) + + ret i64 %a +} + +declare i64 @llvm.riscv.vpopc.i64.nxv8i1( + , + i64); + +define i64 @intrinsic_vpopc_m_i64_nxv8i1( %0, i64 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_m_i64_nxv8i1 +; CHECK: vsetvli {{.*}}, a0, e8,m1,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}} + %a = call i64 @llvm.riscv.vpopc.i64.nxv8i1( + %0, + i64 %1) + + ret i64 %a +} + +declare i64 @llvm.riscv.vpopc.mask.i64.nxv8i1( + , + , + i64); + +define i64 @intrinsic_vpopc_mask_m_i64_nxv8i1( %0, %1, i64 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_mask_m_i64_nxv8i1 +; CHECK: vsetvli {{.*}}, a0, e8,m1,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}}, v0.t + %a = call i64 @llvm.riscv.vpopc.mask.i64.nxv8i1( + %0, + %1, + i64 %2) + + ret i64 %a +} + +declare i64 @llvm.riscv.vpopc.i64.nxv16i1( + , + i64); + +define i64 @intrinsic_vpopc_m_i64_nxv16i1( %0, i64 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_m_i64_nxv16i1 +; CHECK: vsetvli {{.*}}, a0, e8,m2,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}} + %a = call i64 @llvm.riscv.vpopc.i64.nxv16i1( + %0, + i64 %1) + + ret i64 %a +} + +declare i64 @llvm.riscv.vpopc.mask.i64.nxv16i1( + , + , + i64); + +define i64 @intrinsic_vpopc_mask_m_i64_nxv16i1( %0, %1, i64 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_mask_m_i64_nxv16i1 +; CHECK: vsetvli {{.*}}, a0, e8,m2,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}}, v0.t + %a = call i64 @llvm.riscv.vpopc.mask.i64.nxv16i1( + %0, + %1, + i64 %2) + + ret i64 %a +} + +declare i64 @llvm.riscv.vpopc.i64.nxv32i1( + , + i64); + +define i64 @intrinsic_vpopc_m_i64_nxv32i1( %0, i64 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_m_i64_nxv32i1 +; CHECK: vsetvli {{.*}}, a0, e8,m4,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}} + %a = call i64 @llvm.riscv.vpopc.i64.nxv32i1( + %0, + i64 %1) + + ret i64 %a +} + +declare i64 @llvm.riscv.vpopc.mask.i64.nxv32i1( + , + , + i64); + +define i64 @intrinsic_vpopc_mask_m_i64_nxv32i1( %0, %1, i64 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_mask_m_i64_nxv32i1 +; CHECK: vsetvli {{.*}}, a0, e8,m4,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}}, v0.t + %a = call i64 @llvm.riscv.vpopc.mask.i64.nxv32i1( + %0, + %1, + i64 %2) + + ret i64 %a +} + +declare i64 @llvm.riscv.vpopc.i64.nxv64i1( + , + i64); + +define i64 @intrinsic_vpopc_m_i64_nxv64i1( %0, i64 %1) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_m_i64_nxv64i1 +; CHECK: vsetvli {{.*}}, a0, e8,m8,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}} + %a = call i64 @llvm.riscv.vpopc.i64.nxv64i1( + %0, + i64 %1) + + ret i64 %a +} + +declare i64 @llvm.riscv.vpopc.mask.i64.nxv64i1( + , + , + i64); + +define i64 @intrinsic_vpopc_mask_m_i64_nxv64i1( %0, %1, i64 %2) nounwind { +entry: +; CHECK-LABEL: intrinsic_vpopc_mask_m_i64_nxv64i1 +; CHECK: vsetvli {{.*}}, a0, e8,m8,ta,mu +; CHECK: vpopc.m a0, {{v[0-9]+}}, v0.t + %a = call i64 @llvm.riscv.vpopc.mask.i64.nxv64i1( + %0, + %1, + i64 %2) + + ret i64 %a +}