diff --git a/llvm/lib/Target/RISCV/RISCVInstrInfoVPseudos.td b/llvm/lib/Target/RISCV/RISCVInstrInfoVPseudos.td --- a/llvm/lib/Target/RISCV/RISCVInstrInfoVPseudos.td +++ b/llvm/lib/Target/RISCV/RISCVInstrInfoVPseudos.td @@ -1598,16 +1598,14 @@ multiclass VPseudoBinaryW_WX { foreach m = MxList.m[0-5] in - defm "_WX" : VPseudoBinary; + defm "_WX" : VPseudoBinary; } multiclass VPseudoBinaryW_WF { foreach m = MxList.m[0-5] in foreach f = FPList.fpinfo[0-1] in defm "_W" # f.FX : VPseudoBinary; + f.fprclass, m>; } multiclass VPseudoBinaryV_WV { diff --git a/llvm/test/CodeGen/RISCV/rvv/vfwadd.w-rv32.ll b/llvm/test/CodeGen/RISCV/rvv/vfwadd.w-rv32.ll --- a/llvm/test/CodeGen/RISCV/rvv/vfwadd.w-rv32.ll +++ b/llvm/test/CodeGen/RISCV/rvv/vfwadd.w-rv32.ll @@ -418,8 +418,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,mf4,ta,mu -; CHECK-NEXT: vfwadd.wf v25, v8, ft0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv1f32.f16( @@ -465,8 +464,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,mf2,ta,mu -; CHECK-NEXT: vfwadd.wf v25, v8, ft0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv2f32.f16( @@ -512,8 +510,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,m1,ta,mu -; CHECK-NEXT: vfwadd.wf v26, v8, ft0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv4f32.f16( @@ -559,8 +556,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,m2,ta,mu -; CHECK-NEXT: vfwadd.wf v28, v8, ft0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv8f32.f16( @@ -606,8 +602,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,m4,ta,mu -; CHECK-NEXT: vfwadd.wf v16, v8, ft0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv16f32.f16( @@ -653,8 +648,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.w.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e32,mf2,ta,mu -; CHECK-NEXT: vfwadd.wf v25, v8, ft0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv1f64.f32( @@ -700,8 +694,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.w.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e32,m1,ta,mu -; CHECK-NEXT: vfwadd.wf v26, v8, ft0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv2f64.f32( @@ -747,8 +740,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.w.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e32,m2,ta,mu -; CHECK-NEXT: vfwadd.wf v28, v8, ft0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv4f64.f32( @@ -794,8 +786,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.w.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e32,m4,ta,mu -; CHECK-NEXT: vfwadd.wf v16, v8, ft0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv8f64.f32( diff --git a/llvm/test/CodeGen/RISCV/rvv/vfwadd.w-rv64.ll b/llvm/test/CodeGen/RISCV/rvv/vfwadd.w-rv64.ll --- a/llvm/test/CodeGen/RISCV/rvv/vfwadd.w-rv64.ll +++ b/llvm/test/CodeGen/RISCV/rvv/vfwadd.w-rv64.ll @@ -418,8 +418,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,mf4,ta,mu -; CHECK-NEXT: vfwadd.wf v25, v8, ft0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv1f32.f16( @@ -465,8 +464,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,mf2,ta,mu -; CHECK-NEXT: vfwadd.wf v25, v8, ft0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv2f32.f16( @@ -512,8 +510,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,m1,ta,mu -; CHECK-NEXT: vfwadd.wf v26, v8, ft0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv4f32.f16( @@ -559,8 +556,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,m2,ta,mu -; CHECK-NEXT: vfwadd.wf v28, v8, ft0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv8f32.f16( @@ -606,8 +602,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,m4,ta,mu -; CHECK-NEXT: vfwadd.wf v16, v8, ft0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv16f32.f16( @@ -653,8 +648,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.w.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e32,mf2,ta,mu -; CHECK-NEXT: vfwadd.wf v25, v8, ft0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv1f64.f32( @@ -700,8 +694,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.w.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e32,m1,ta,mu -; CHECK-NEXT: vfwadd.wf v26, v8, ft0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv2f64.f32( @@ -747,8 +740,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.w.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e32,m2,ta,mu -; CHECK-NEXT: vfwadd.wf v28, v8, ft0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv4f64.f32( @@ -794,8 +786,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.w.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e32,m4,ta,mu -; CHECK-NEXT: vfwadd.wf v16, v8, ft0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vfwadd.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwadd.w.nxv8f64.f32( diff --git a/llvm/test/CodeGen/RISCV/rvv/vfwsub.w-rv32.ll b/llvm/test/CodeGen/RISCV/rvv/vfwsub.w-rv32.ll --- a/llvm/test/CodeGen/RISCV/rvv/vfwsub.w-rv32.ll +++ b/llvm/test/CodeGen/RISCV/rvv/vfwsub.w-rv32.ll @@ -418,8 +418,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,mf4,ta,mu -; CHECK-NEXT: vfwsub.wf v25, v8, ft0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv1f32.f16( @@ -465,8 +464,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,mf2,ta,mu -; CHECK-NEXT: vfwsub.wf v25, v8, ft0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv2f32.f16( @@ -512,8 +510,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,m1,ta,mu -; CHECK-NEXT: vfwsub.wf v26, v8, ft0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv4f32.f16( @@ -559,8 +556,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,m2,ta,mu -; CHECK-NEXT: vfwsub.wf v28, v8, ft0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv8f32.f16( @@ -606,8 +602,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,m4,ta,mu -; CHECK-NEXT: vfwsub.wf v16, v8, ft0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv16f32.f16( @@ -653,8 +648,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.w.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e32,mf2,ta,mu -; CHECK-NEXT: vfwsub.wf v25, v8, ft0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv1f64.f32( @@ -700,8 +694,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.w.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e32,m1,ta,mu -; CHECK-NEXT: vfwsub.wf v26, v8, ft0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv2f64.f32( @@ -747,8 +740,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.w.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e32,m2,ta,mu -; CHECK-NEXT: vfwsub.wf v28, v8, ft0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv4f64.f32( @@ -794,8 +786,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.w.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e32,m4,ta,mu -; CHECK-NEXT: vfwsub.wf v16, v8, ft0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv8f64.f32( diff --git a/llvm/test/CodeGen/RISCV/rvv/vfwsub.w-rv64.ll b/llvm/test/CodeGen/RISCV/rvv/vfwsub.w-rv64.ll --- a/llvm/test/CodeGen/RISCV/rvv/vfwsub.w-rv64.ll +++ b/llvm/test/CodeGen/RISCV/rvv/vfwsub.w-rv64.ll @@ -418,8 +418,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,mf4,ta,mu -; CHECK-NEXT: vfwsub.wf v25, v8, ft0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv1f32.f16( @@ -465,8 +464,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,mf2,ta,mu -; CHECK-NEXT: vfwsub.wf v25, v8, ft0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv2f32.f16( @@ -512,8 +510,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,m1,ta,mu -; CHECK-NEXT: vfwsub.wf v26, v8, ft0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv4f32.f16( @@ -559,8 +556,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,m2,ta,mu -; CHECK-NEXT: vfwsub.wf v28, v8, ft0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv8f32.f16( @@ -606,8 +602,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.h.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e16,m4,ta,mu -; CHECK-NEXT: vfwsub.wf v16, v8, ft0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv16f32.f16( @@ -653,8 +648,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.w.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e32,mf2,ta,mu -; CHECK-NEXT: vfwsub.wf v25, v8, ft0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv1f64.f32( @@ -700,8 +694,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.w.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e32,m1,ta,mu -; CHECK-NEXT: vfwsub.wf v26, v8, ft0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv2f64.f32( @@ -747,8 +740,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.w.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e32,m2,ta,mu -; CHECK-NEXT: vfwsub.wf v28, v8, ft0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv4f64.f32( @@ -794,8 +786,7 @@ ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: fmv.w.x ft0, a0 ; CHECK-NEXT: vsetvli a0, a1, e32,m4,ta,mu -; CHECK-NEXT: vfwsub.wf v16, v8, ft0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vfwsub.wf v8, v8, ft0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vfwsub.w.nxv8f64.f32( diff --git a/llvm/test/CodeGen/RISCV/rvv/vwadd.w-rv32.ll b/llvm/test/CodeGen/RISCV/rvv/vwadd.w-rv32.ll --- a/llvm/test/CodeGen/RISCV/rvv/vwadd.w-rv32.ll +++ b/llvm/test/CodeGen/RISCV/rvv/vwadd.w-rv32.ll @@ -688,8 +688,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv1i16_nxv1i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf8,ta,mu -; CHECK-NEXT: vwadd.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv1i16.i8( @@ -733,8 +732,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv2i16_nxv2i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf4,ta,mu -; CHECK-NEXT: vwadd.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv2i16.i8( @@ -778,8 +776,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv4i16_nxv4i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf2,ta,mu -; CHECK-NEXT: vwadd.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv4i16.i8( @@ -823,8 +820,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv8i16_nxv8i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m1,ta,mu -; CHECK-NEXT: vwadd.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv8i16.i8( @@ -868,8 +864,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv16i16_nxv16i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m2,ta,mu -; CHECK-NEXT: vwadd.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv16i16.i8( @@ -913,8 +908,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv32i16_nxv32i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m4,ta,mu -; CHECK-NEXT: vwadd.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv32i16.i8( @@ -958,8 +952,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv1i32_nxv1i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,mf4,ta,mu -; CHECK-NEXT: vwadd.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv1i32.i16( @@ -1003,8 +996,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv2i32_nxv2i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,mf2,ta,mu -; CHECK-NEXT: vwadd.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv2i32.i16( @@ -1048,8 +1040,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv4i32_nxv4i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m1,ta,mu -; CHECK-NEXT: vwadd.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv4i32.i16( @@ -1093,8 +1084,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv8i32_nxv8i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m2,ta,mu -; CHECK-NEXT: vwadd.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv8i32.i16( @@ -1138,8 +1128,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv16i32_nxv16i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m4,ta,mu -; CHECK-NEXT: vwadd.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv16i32.i16( @@ -1183,8 +1172,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv1i64_nxv1i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,mf2,ta,mu -; CHECK-NEXT: vwadd.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv1i64.i32( @@ -1228,8 +1216,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv2i64_nxv2i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m1,ta,mu -; CHECK-NEXT: vwadd.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv2i64.i32( @@ -1273,8 +1260,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv4i64_nxv4i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m2,ta,mu -; CHECK-NEXT: vwadd.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv4i64.i32( @@ -1318,8 +1304,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv8i64_nxv8i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m4,ta,mu -; CHECK-NEXT: vwadd.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv8i64.i32( diff --git a/llvm/test/CodeGen/RISCV/rvv/vwadd.w-rv64.ll b/llvm/test/CodeGen/RISCV/rvv/vwadd.w-rv64.ll --- a/llvm/test/CodeGen/RISCV/rvv/vwadd.w-rv64.ll +++ b/llvm/test/CodeGen/RISCV/rvv/vwadd.w-rv64.ll @@ -688,8 +688,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv1i16_nxv1i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf8,ta,mu -; CHECK-NEXT: vwadd.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv1i16.i8( @@ -733,8 +732,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv2i16_nxv2i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf4,ta,mu -; CHECK-NEXT: vwadd.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv2i16.i8( @@ -778,8 +776,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv4i16_nxv4i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf2,ta,mu -; CHECK-NEXT: vwadd.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv4i16.i8( @@ -823,8 +820,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv8i16_nxv8i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m1,ta,mu -; CHECK-NEXT: vwadd.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv8i16.i8( @@ -868,8 +864,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv16i16_nxv16i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m2,ta,mu -; CHECK-NEXT: vwadd.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv16i16.i8( @@ -913,8 +908,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv32i16_nxv32i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m4,ta,mu -; CHECK-NEXT: vwadd.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv32i16.i8( @@ -958,8 +952,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv1i32_nxv1i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,mf4,ta,mu -; CHECK-NEXT: vwadd.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv1i32.i16( @@ -1003,8 +996,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv2i32_nxv2i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,mf2,ta,mu -; CHECK-NEXT: vwadd.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv2i32.i16( @@ -1048,8 +1040,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv4i32_nxv4i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m1,ta,mu -; CHECK-NEXT: vwadd.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv4i32.i16( @@ -1093,8 +1084,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv8i32_nxv8i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m2,ta,mu -; CHECK-NEXT: vwadd.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv8i32.i16( @@ -1138,8 +1128,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv16i32_nxv16i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m4,ta,mu -; CHECK-NEXT: vwadd.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv16i32.i16( @@ -1183,8 +1172,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv1i64_nxv1i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,mf2,ta,mu -; CHECK-NEXT: vwadd.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv1i64.i32( @@ -1228,8 +1216,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv2i64_nxv2i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m1,ta,mu -; CHECK-NEXT: vwadd.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv2i64.i32( @@ -1273,8 +1260,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv4i64_nxv4i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m2,ta,mu -; CHECK-NEXT: vwadd.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv4i64.i32( @@ -1318,8 +1304,7 @@ ; CHECK-LABEL: intrinsic_vwadd.w_wx_nxv8i64_nxv8i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m4,ta,mu -; CHECK-NEXT: vwadd.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwadd.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwadd.w.nxv8i64.i32( diff --git a/llvm/test/CodeGen/RISCV/rvv/vwaddu.w-rv32.ll b/llvm/test/CodeGen/RISCV/rvv/vwaddu.w-rv32.ll --- a/llvm/test/CodeGen/RISCV/rvv/vwaddu.w-rv32.ll +++ b/llvm/test/CodeGen/RISCV/rvv/vwaddu.w-rv32.ll @@ -688,8 +688,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv1i16_nxv1i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf8,ta,mu -; CHECK-NEXT: vwaddu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv1i16.i8( @@ -733,8 +732,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv2i16_nxv2i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf4,ta,mu -; CHECK-NEXT: vwaddu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv2i16.i8( @@ -778,8 +776,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv4i16_nxv4i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf2,ta,mu -; CHECK-NEXT: vwaddu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv4i16.i8( @@ -823,8 +820,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv8i16_nxv8i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m1,ta,mu -; CHECK-NEXT: vwaddu.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv8i16.i8( @@ -868,8 +864,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv16i16_nxv16i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m2,ta,mu -; CHECK-NEXT: vwaddu.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv16i16.i8( @@ -913,8 +908,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv32i16_nxv32i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m4,ta,mu -; CHECK-NEXT: vwaddu.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv32i16.i8( @@ -958,8 +952,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv1i32_nxv1i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,mf4,ta,mu -; CHECK-NEXT: vwaddu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv1i32.i16( @@ -1003,8 +996,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv2i32_nxv2i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,mf2,ta,mu -; CHECK-NEXT: vwaddu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv2i32.i16( @@ -1048,8 +1040,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv4i32_nxv4i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m1,ta,mu -; CHECK-NEXT: vwaddu.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv4i32.i16( @@ -1093,8 +1084,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv8i32_nxv8i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m2,ta,mu -; CHECK-NEXT: vwaddu.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv8i32.i16( @@ -1138,8 +1128,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv16i32_nxv16i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m4,ta,mu -; CHECK-NEXT: vwaddu.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv16i32.i16( @@ -1183,8 +1172,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv1i64_nxv1i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,mf2,ta,mu -; CHECK-NEXT: vwaddu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv1i64.i32( @@ -1228,8 +1216,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv2i64_nxv2i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m1,ta,mu -; CHECK-NEXT: vwaddu.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv2i64.i32( @@ -1273,8 +1260,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv4i64_nxv4i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m2,ta,mu -; CHECK-NEXT: vwaddu.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv4i64.i32( @@ -1318,8 +1304,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv8i64_nxv8i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m4,ta,mu -; CHECK-NEXT: vwaddu.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv8i64.i32( diff --git a/llvm/test/CodeGen/RISCV/rvv/vwaddu.w-rv64.ll b/llvm/test/CodeGen/RISCV/rvv/vwaddu.w-rv64.ll --- a/llvm/test/CodeGen/RISCV/rvv/vwaddu.w-rv64.ll +++ b/llvm/test/CodeGen/RISCV/rvv/vwaddu.w-rv64.ll @@ -688,8 +688,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv1i16_nxv1i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf8,ta,mu -; CHECK-NEXT: vwaddu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv1i16.i8( @@ -733,8 +732,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv2i16_nxv2i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf4,ta,mu -; CHECK-NEXT: vwaddu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv2i16.i8( @@ -778,8 +776,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv4i16_nxv4i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf2,ta,mu -; CHECK-NEXT: vwaddu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv4i16.i8( @@ -823,8 +820,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv8i16_nxv8i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m1,ta,mu -; CHECK-NEXT: vwaddu.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv8i16.i8( @@ -868,8 +864,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv16i16_nxv16i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m2,ta,mu -; CHECK-NEXT: vwaddu.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv16i16.i8( @@ -913,8 +908,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv32i16_nxv32i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m4,ta,mu -; CHECK-NEXT: vwaddu.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv32i16.i8( @@ -958,8 +952,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv1i32_nxv1i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,mf4,ta,mu -; CHECK-NEXT: vwaddu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv1i32.i16( @@ -1003,8 +996,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv2i32_nxv2i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,mf2,ta,mu -; CHECK-NEXT: vwaddu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv2i32.i16( @@ -1048,8 +1040,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv4i32_nxv4i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m1,ta,mu -; CHECK-NEXT: vwaddu.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv4i32.i16( @@ -1093,8 +1084,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv8i32_nxv8i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m2,ta,mu -; CHECK-NEXT: vwaddu.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv8i32.i16( @@ -1138,8 +1128,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv16i32_nxv16i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m4,ta,mu -; CHECK-NEXT: vwaddu.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv16i32.i16( @@ -1183,8 +1172,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv1i64_nxv1i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,mf2,ta,mu -; CHECK-NEXT: vwaddu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv1i64.i32( @@ -1228,8 +1216,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv2i64_nxv2i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m1,ta,mu -; CHECK-NEXT: vwaddu.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv2i64.i32( @@ -1273,8 +1260,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv4i64_nxv4i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m2,ta,mu -; CHECK-NEXT: vwaddu.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv4i64.i32( @@ -1318,8 +1304,7 @@ ; CHECK-LABEL: intrinsic_vwaddu.w_wx_nxv8i64_nxv8i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m4,ta,mu -; CHECK-NEXT: vwaddu.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwaddu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwaddu.w.nxv8i64.i32( diff --git a/llvm/test/CodeGen/RISCV/rvv/vwsub.w-rv32.ll b/llvm/test/CodeGen/RISCV/rvv/vwsub.w-rv32.ll --- a/llvm/test/CodeGen/RISCV/rvv/vwsub.w-rv32.ll +++ b/llvm/test/CodeGen/RISCV/rvv/vwsub.w-rv32.ll @@ -688,8 +688,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv1i16_nxv1i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf8,ta,mu -; CHECK-NEXT: vwsub.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv1i16.i8( @@ -733,8 +732,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv2i16_nxv2i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf4,ta,mu -; CHECK-NEXT: vwsub.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv2i16.i8( @@ -778,8 +776,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv4i16_nxv4i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf2,ta,mu -; CHECK-NEXT: vwsub.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv4i16.i8( @@ -823,8 +820,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv8i16_nxv8i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m1,ta,mu -; CHECK-NEXT: vwsub.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv8i16.i8( @@ -868,8 +864,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv16i16_nxv16i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m2,ta,mu -; CHECK-NEXT: vwsub.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv16i16.i8( @@ -913,8 +908,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv32i16_nxv32i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m4,ta,mu -; CHECK-NEXT: vwsub.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv32i16.i8( @@ -958,8 +952,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv1i32_nxv1i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,mf4,ta,mu -; CHECK-NEXT: vwsub.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv1i32.i16( @@ -1003,8 +996,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv2i32_nxv2i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,mf2,ta,mu -; CHECK-NEXT: vwsub.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv2i32.i16( @@ -1048,8 +1040,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv4i32_nxv4i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m1,ta,mu -; CHECK-NEXT: vwsub.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv4i32.i16( @@ -1093,8 +1084,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv8i32_nxv8i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m2,ta,mu -; CHECK-NEXT: vwsub.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv8i32.i16( @@ -1138,8 +1128,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv16i32_nxv16i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m4,ta,mu -; CHECK-NEXT: vwsub.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv16i32.i16( @@ -1183,8 +1172,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv1i64_nxv1i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,mf2,ta,mu -; CHECK-NEXT: vwsub.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv1i64.i32( @@ -1228,8 +1216,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv2i64_nxv2i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m1,ta,mu -; CHECK-NEXT: vwsub.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv2i64.i32( @@ -1273,8 +1260,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv4i64_nxv4i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m2,ta,mu -; CHECK-NEXT: vwsub.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv4i64.i32( @@ -1318,8 +1304,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv8i64_nxv8i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m4,ta,mu -; CHECK-NEXT: vwsub.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv8i64.i32( diff --git a/llvm/test/CodeGen/RISCV/rvv/vwsub.w-rv64.ll b/llvm/test/CodeGen/RISCV/rvv/vwsub.w-rv64.ll --- a/llvm/test/CodeGen/RISCV/rvv/vwsub.w-rv64.ll +++ b/llvm/test/CodeGen/RISCV/rvv/vwsub.w-rv64.ll @@ -688,8 +688,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv1i16_nxv1i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf8,ta,mu -; CHECK-NEXT: vwsub.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv1i16.i8( @@ -733,8 +732,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv2i16_nxv2i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf4,ta,mu -; CHECK-NEXT: vwsub.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv2i16.i8( @@ -778,8 +776,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv4i16_nxv4i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf2,ta,mu -; CHECK-NEXT: vwsub.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv4i16.i8( @@ -823,8 +820,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv8i16_nxv8i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m1,ta,mu -; CHECK-NEXT: vwsub.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv8i16.i8( @@ -868,8 +864,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv16i16_nxv16i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m2,ta,mu -; CHECK-NEXT: vwsub.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv16i16.i8( @@ -913,8 +908,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv32i16_nxv32i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m4,ta,mu -; CHECK-NEXT: vwsub.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv32i16.i8( @@ -958,8 +952,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv1i32_nxv1i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,mf4,ta,mu -; CHECK-NEXT: vwsub.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv1i32.i16( @@ -1003,8 +996,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv2i32_nxv2i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,mf2,ta,mu -; CHECK-NEXT: vwsub.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv2i32.i16( @@ -1048,8 +1040,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv4i32_nxv4i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m1,ta,mu -; CHECK-NEXT: vwsub.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv4i32.i16( @@ -1093,8 +1084,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv8i32_nxv8i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m2,ta,mu -; CHECK-NEXT: vwsub.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv8i32.i16( @@ -1138,8 +1128,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv16i32_nxv16i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m4,ta,mu -; CHECK-NEXT: vwsub.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv16i32.i16( @@ -1183,8 +1172,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv1i64_nxv1i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,mf2,ta,mu -; CHECK-NEXT: vwsub.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv1i64.i32( @@ -1228,8 +1216,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv2i64_nxv2i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m1,ta,mu -; CHECK-NEXT: vwsub.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv2i64.i32( @@ -1273,8 +1260,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv4i64_nxv4i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m2,ta,mu -; CHECK-NEXT: vwsub.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv4i64.i32( @@ -1318,8 +1304,7 @@ ; CHECK-LABEL: intrinsic_vwsub.w_wx_nxv8i64_nxv8i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m4,ta,mu -; CHECK-NEXT: vwsub.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwsub.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsub.w.nxv8i64.i32( diff --git a/llvm/test/CodeGen/RISCV/rvv/vwsubu.w-rv32.ll b/llvm/test/CodeGen/RISCV/rvv/vwsubu.w-rv32.ll --- a/llvm/test/CodeGen/RISCV/rvv/vwsubu.w-rv32.ll +++ b/llvm/test/CodeGen/RISCV/rvv/vwsubu.w-rv32.ll @@ -688,8 +688,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv1i16_nxv1i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf8,ta,mu -; CHECK-NEXT: vwsubu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv1i16.i8( @@ -733,8 +732,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv2i16_nxv2i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf4,ta,mu -; CHECK-NEXT: vwsubu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv2i16.i8( @@ -778,8 +776,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv4i16_nxv4i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf2,ta,mu -; CHECK-NEXT: vwsubu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv4i16.i8( @@ -823,8 +820,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv8i16_nxv8i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m1,ta,mu -; CHECK-NEXT: vwsubu.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv8i16.i8( @@ -868,8 +864,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv16i16_nxv16i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m2,ta,mu -; CHECK-NEXT: vwsubu.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv16i16.i8( @@ -913,8 +908,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv32i16_nxv32i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m4,ta,mu -; CHECK-NEXT: vwsubu.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv32i16.i8( @@ -958,8 +952,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv1i32_nxv1i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,mf4,ta,mu -; CHECK-NEXT: vwsubu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv1i32.i16( @@ -1003,8 +996,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv2i32_nxv2i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,mf2,ta,mu -; CHECK-NEXT: vwsubu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv2i32.i16( @@ -1048,8 +1040,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv4i32_nxv4i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m1,ta,mu -; CHECK-NEXT: vwsubu.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv4i32.i16( @@ -1093,8 +1084,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv8i32_nxv8i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m2,ta,mu -; CHECK-NEXT: vwsubu.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv8i32.i16( @@ -1138,8 +1128,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv16i32_nxv16i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m4,ta,mu -; CHECK-NEXT: vwsubu.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv16i32.i16( @@ -1183,8 +1172,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv1i64_nxv1i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,mf2,ta,mu -; CHECK-NEXT: vwsubu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv1i64.i32( @@ -1228,8 +1216,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv2i64_nxv2i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m1,ta,mu -; CHECK-NEXT: vwsubu.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv2i64.i32( @@ -1273,8 +1260,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv4i64_nxv4i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m2,ta,mu -; CHECK-NEXT: vwsubu.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv4i64.i32( @@ -1318,8 +1304,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv8i64_nxv8i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m4,ta,mu -; CHECK-NEXT: vwsubu.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv8i64.i32( diff --git a/llvm/test/CodeGen/RISCV/rvv/vwsubu.w-rv64.ll b/llvm/test/CodeGen/RISCV/rvv/vwsubu.w-rv64.ll --- a/llvm/test/CodeGen/RISCV/rvv/vwsubu.w-rv64.ll +++ b/llvm/test/CodeGen/RISCV/rvv/vwsubu.w-rv64.ll @@ -688,8 +688,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv1i16_nxv1i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf8,ta,mu -; CHECK-NEXT: vwsubu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv1i16.i8( @@ -733,8 +732,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv2i16_nxv2i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf4,ta,mu -; CHECK-NEXT: vwsubu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv2i16.i8( @@ -778,8 +776,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv4i16_nxv4i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,mf2,ta,mu -; CHECK-NEXT: vwsubu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv4i16.i8( @@ -823,8 +820,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv8i16_nxv8i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m1,ta,mu -; CHECK-NEXT: vwsubu.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv8i16.i8( @@ -868,8 +864,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv16i16_nxv16i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m2,ta,mu -; CHECK-NEXT: vwsubu.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv16i16.i8( @@ -913,8 +908,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv32i16_nxv32i16_i8: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e8,m4,ta,mu -; CHECK-NEXT: vwsubu.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv32i16.i8( @@ -958,8 +952,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv1i32_nxv1i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,mf4,ta,mu -; CHECK-NEXT: vwsubu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv1i32.i16( @@ -1003,8 +996,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv2i32_nxv2i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,mf2,ta,mu -; CHECK-NEXT: vwsubu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv2i32.i16( @@ -1048,8 +1040,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv4i32_nxv4i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m1,ta,mu -; CHECK-NEXT: vwsubu.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv4i32.i16( @@ -1093,8 +1084,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv8i32_nxv8i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m2,ta,mu -; CHECK-NEXT: vwsubu.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv8i32.i16( @@ -1138,8 +1128,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv16i32_nxv16i32_i16: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e16,m4,ta,mu -; CHECK-NEXT: vwsubu.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv16i32.i16( @@ -1183,8 +1172,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv1i64_nxv1i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,mf2,ta,mu -; CHECK-NEXT: vwsubu.wx v25, v8, a0 -; CHECK-NEXT: vmv1r.v v8, v25 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv1i64.i32( @@ -1228,8 +1216,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv2i64_nxv2i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m1,ta,mu -; CHECK-NEXT: vwsubu.wx v26, v8, a0 -; CHECK-NEXT: vmv2r.v v8, v26 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv2i64.i32( @@ -1273,8 +1260,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv4i64_nxv4i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m2,ta,mu -; CHECK-NEXT: vwsubu.wx v28, v8, a0 -; CHECK-NEXT: vmv4r.v v8, v28 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv4i64.i32( @@ -1318,8 +1304,7 @@ ; CHECK-LABEL: intrinsic_vwsubu.w_wx_nxv8i64_nxv8i64_i32: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: vsetvli a1, a1, e32,m4,ta,mu -; CHECK-NEXT: vwsubu.wx v16, v8, a0 -; CHECK-NEXT: vmv8r.v v8, v16 +; CHECK-NEXT: vwsubu.wx v8, v8, a0 ; CHECK-NEXT: jalr zero, 0(ra) entry: %a = call @llvm.riscv.vwsubu.w.nxv8i64.i32(