diff --git a/llvm/lib/Target/AArch64/AArch64ISelDAGToDAG.cpp b/llvm/lib/Target/AArch64/AArch64ISelDAGToDAG.cpp --- a/llvm/lib/Target/AArch64/AArch64ISelDAGToDAG.cpp +++ b/llvm/lib/Target/AArch64/AArch64ISelDAGToDAG.cpp @@ -435,6 +435,8 @@ bool trySelectCastFixedLengthToScalableVector(SDNode *N); bool trySelectCastScalableToFixedLengthVector(SDNode *N); + bool trySelectXAR(SDNode *N); + // Include the pieces autogenerated from the target description. #include "AArch64GenDAGISel.inc" @@ -4273,6 +4275,40 @@ return true; } +bool AArch64DAGToDAGISel::trySelectXAR(SDNode *N) { + assert(N->getOpcode() == ISD::OR && "Expected OR instruction"); + + SDValue N0 = N->getOperand(0); + SDValue N1 = N->getOperand(1); + + if (N0->getOpcode() != AArch64ISD::VSHL || + N1->getOpcode() != AArch64ISD::VLSHR) + return false; + + if (N0->getOperand(0)->getOpcode() != N1->getOperand(0)->getOpcode() || + N1->getOperand(0)->getOpcode() != ISD::XOR) + return false; + + SDValue XOR = N0.getOperand(0); + SDValue R1 = XOR.getOperand(0); + SDValue R2 = XOR.getOperand(1); + + unsigned HsAmt = N0.getConstantOperandVal(1); + unsigned ShAmt = N1.getConstantOperandVal(1); + + SDLoc DL = SDLoc(N0.getOperand(1)); + SDValue Imm = CurDAG->getTargetConstant( + ShAmt, DL, N0.getOperand(1).getValueType(), false); + + if (ShAmt + HsAmt != 64) + return false; + + SDValue Ops[] = {R1, R2, Imm}; + CurDAG->SelectNodeTo(N, AArch64::XAR, N0.getValueType(), Ops); + + return true; +} + void AArch64DAGToDAGISel::Select(SDNode *Node) { // If we have a custom node, we already have selected! if (Node->isMachineOpcode()) { @@ -4336,6 +4372,8 @@ case ISD::OR: if (tryBitfieldInsertOp(Node)) return; + if (Subtarget->hasSHA3() && trySelectXAR(Node)) + return; break; case ISD::EXTRACT_SUBVECTOR: { diff --git a/llvm/test/CodeGen/AArch64/xar.ll b/llvm/test/CodeGen/AArch64/xar.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/AArch64/xar.ll @@ -0,0 +1,23 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 4 +; RUN: llc -mtriple=aarch64-none-eabi -mattr=+sha3 < %s | FileCheck --check-prefix=SHA3 %s +; RUN: llc -mtriple=aarch64-none-eabi -mattr=-sha3 < %s | FileCheck --check-prefix=NOSHA3 %s + +define <2 x i64> @xar(<2 x i64> %x, <2 x i64> %y) { +; SHA3-LABEL: xar: +; SHA3: // %bb.0: +; SHA3-NEXT: xar v0.2d, v0.2d, v1.2d, #54 +; SHA3-NEXT: ret +; +; NOSHA3-LABEL: xar: +; NOSHA3: // %bb.0: +; NOSHA3-NEXT: eor v0.16b, v0.16b, v1.16b +; NOSHA3-NEXT: ushr v1.2d, v0.2d, #54 +; NOSHA3-NEXT: shl v0.2d, v0.2d, #10 +; NOSHA3-NEXT: orr v0.16b, v0.16b, v1.16b +; NOSHA3-NEXT: ret + %a = xor <2 x i64> %x, %y + %b = call <2 x i64> @llvm.fshl.v2i64(<2 x i64> %a, <2 x i64> %a, <2 x i64> ) + ret <2 x i64> %b +} + +declare <2 x i64> @llvm.fshl.v2i64(<2 x i64>, <2 x i64>, <2 x i64>)