Index: llvm/lib/Target/PowerPC/PPCInstrVSX.td =================================================================== --- llvm/lib/Target/PowerPC/PPCInstrVSX.td +++ llvm/lib/Target/PowerPC/PPCInstrVSX.td @@ -1069,10 +1069,6 @@ // Stores. def : Pat<(int_ppc_vsx_stxvd2x v2f64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>; - def : Pat<(int_ppc_vsx_stxvd2x_be v2f64:$rS, xoaddr:$dst), - (STXVD2X $rS, xoaddr:$dst)>; - def : Pat<(int_ppc_vsx_stxvw4x_be v4i32:$rS, xoaddr:$dst), - (STXVW4X $rS, xoaddr:$dst)>; def : Pat<(PPCstxvd2x v2f64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>; } let Predicates = [IsBigEndian, HasVSX, HasOnlySwappingMemOps] in { @@ -1993,6 +1989,10 @@ def : Pat<(f64 (vector_extract v2f64:$S, i64:$Idx)), (f64 VectorExtractions.LE_VARIABLE_DOUBLE)>; +def : Pat<(int_ppc_vsx_stxvd2x_be v2f64:$rS, xoaddr:$dst), + (STXVD2X $rS, xoaddr:$dst)>; +def : Pat<(int_ppc_vsx_stxvw4x_be v4i32:$rS, xoaddr:$dst), + (STXVW4X $rS, xoaddr:$dst)>; def : Pat<(v4i32 (int_ppc_vsx_lxvw4x_be xoaddr:$src)), (LXVW4X xoaddr:$src)>; def : Pat<(v2f64 (int_ppc_vsx_lxvd2x_be xoaddr:$src)), (LXVD2X xoaddr:$src)>; Index: llvm/test/CodeGen/PowerPC/vsx.ll =================================================================== --- llvm/test/CodeGen/PowerPC/vsx.ll +++ llvm/test/CodeGen/PowerPC/vsx.ll @@ -1211,51 +1211,3 @@ ; CHECK-LE: xscmpudp cr0, f3, f4 ; CHECK-LE: beqlr cr0 } - -; Function Attrs: nounwind readnone -define <4 x i32> @test83(i8* %a) { - entry: - %0 = tail call <4 x i32> @llvm.ppc.vsx.lxvw4x.be(i8* %a) - ret <4 x i32> %0 -; CHECK-LABEL: test83 -; CHECK: lxvw4x v2, 0, r3 -; CHECK: blr -} -; Function Attrs: nounwind readnone -declare <4 x i32> @llvm.ppc.vsx.lxvw4x.be(i8*) - -; Function Attrs: nounwind readnone -define <2 x double> @test84(i8* %a) { - entry: - %0 = tail call <2 x double> @llvm.ppc.vsx.lxvd2x.be(i8* %a) - ret <2 x double> %0 -; CHECK-LABEL: test84 -; CHECK: lxvd2x v2, 0, r3 -; CHECK: blr -} -; Function Attrs: nounwind readnone -declare <2 x double> 
@llvm.ppc.vsx.lxvd2x.be(i8*) - -; Function Attrs: nounwind readnone -define void @test85(<4 x i32> %a, i8* %b) { - entry: - tail call void @llvm.ppc.vsx.stxvw4x.be(<4 x i32> %a, i8* %b) - ret void -; CHECK-LABEL: test85 -; CHECK: stxvw4x v2, 0, r5 -; CHECK: blr -} -; Function Attrs: nounwind readnone -declare void @llvm.ppc.vsx.stxvw4x.be(<4 x i32>, i8*) - -; Function Attrs: nounwind readnone -define void @test86(<2 x double> %a, i8* %b) { - entry: - tail call void @llvm.ppc.vsx.stxvd2x.be(<2 x double> %a, i8* %b) - ret void -; CHECK-LABEL: test86 -; CHECK: stxvd2x v2, 0, r5 -; CHECK: blr -} -; Function Attrs: nounwind readnone -declare void @llvm.ppc.vsx.stxvd2x.be(<2 x double>, i8*) Index: llvm/test/CodeGen/PowerPC/vsx_builtins.ll =================================================================== --- /dev/null +++ llvm/test/CodeGen/PowerPC/vsx_builtins.ll @@ -0,0 +1,51 @@ +; RUN: llc -relocation-model=static -verify-machineinstrs -mcpu=pwr9 \ +; RUN: -mtriple=powerpc64le-unknown-linux-gnu -mattr=+vsx \ +; RUN: -ppc-vsr-nums-as-vr -ppc-asm-full-reg-names < %s | FileCheck %s + +; Function Attrs: nounwind readonly +define <4 x i32> @test1(i8* %a) { + entry: + %0 = tail call <4 x i32> @llvm.ppc.vsx.lxvw4x.be(i8* %a) + ret <4 x i32> %0 +; CHECK-LABEL: test1 +; CHECK: lxvw4x v2, 0, r3 +; CHECK: blr +} +; Function Attrs: nounwind readonly +declare <4 x i32> @llvm.ppc.vsx.lxvw4x.be(i8*) + +; Function Attrs: nounwind readonly +define <2 x double> @test2(i8* %a) { + entry: + %0 = tail call <2 x double> @llvm.ppc.vsx.lxvd2x.be(i8* %a) + ret <2 x double> %0 +; CHECK-LABEL: test2 +; CHECK: lxvd2x v2, 0, r3 +; CHECK: blr +} +; Function Attrs: nounwind readonly +declare <2 x double> @llvm.ppc.vsx.lxvd2x.be(i8*) + +; Function Attrs: nounwind +define void @test3(<4 x i32> %a, i8* %b) { + entry: + tail call void @llvm.ppc.vsx.stxvw4x.be(<4 x i32> %a, i8* %b) + ret void +; CHECK-LABEL: test3 +; CHECK: stxvw4x v2, 0, r5 +; CHECK: blr +} +; Function Attrs: nounwind 
+declare void @llvm.ppc.vsx.stxvw4x.be(<4 x i32>, i8*) + +; Function Attrs: nounwind +define void @test4(<2 x double> %a, i8* %b) { + entry: + tail call void @llvm.ppc.vsx.stxvd2x.be(<2 x double> %a, i8* %b) + ret void +; CHECK-LABEL: test4 +; CHECK: stxvd2x v2, 0, r5 +; CHECK: blr +} +; Function Attrs: nounwind +declare void @llvm.ppc.vsx.stxvd2x.be(<2 x double>, i8*)