diff --git a/llvm/lib/Target/AArch64/GISel/AArch64InstructionSelector.cpp b/llvm/lib/Target/AArch64/GISel/AArch64InstructionSelector.cpp --- a/llvm/lib/Target/AArch64/GISel/AArch64InstructionSelector.cpp +++ b/llvm/lib/Target/AArch64/GISel/AArch64InstructionSelector.cpp @@ -1640,20 +1640,19 @@ if (PtrTy.getAddressSpace() != 0) return false; - // Only do this for scalars for now. - if (PtrTy.isVector()) - return false; - MachineIRBuilder MIB(I); - const LLT s64 = LLT::scalar(64); - auto PtrToInt = MIB.buildPtrToInt(s64, AddOp1Reg); + const LLT CastPtrTy = PtrTy.isVector() ? LLT::vector(2, 64) : LLT::scalar(64); + auto PtrToInt = MIB.buildPtrToInt(CastPtrTy, AddOp1Reg); // Set regbanks on the registers. - MRI.setRegBank(PtrToInt.getReg(0), RBI.getRegBank(AArch64::GPRRegBankID)); + if (PtrTy.isVector()) + MRI.setRegBank(PtrToInt.getReg(0), RBI.getRegBank(AArch64::FPRRegBankID)); + else + MRI.setRegBank(PtrToInt.getReg(0), RBI.getRegBank(AArch64::GPRRegBankID)); // Now turn the %dst(p0) = G_PTR_ADD %base, off into: - // %dst(s64) = G_ADD %intbase, off + // %dst(intty) = G_ADD %intbase, off I.setDesc(TII.get(TargetOpcode::G_ADD)); - MRI.setType(DstReg, s64); + MRI.setType(DstReg, CastPtrTy); I.getOperand(1).setReg(PtrToInt.getReg(0)); if (!select(*PtrToInt)) { LLVM_DEBUG(dbgs() << "Failed to select G_PTRTOINT in convertPtrAddToAdd"); @@ -2506,6 +2505,13 @@ I.eraseFromParent(); return true; } + + // We might have a vector G_PTRTOINT, in which case just emit a COPY. + if (Opcode == TargetOpcode::G_PTRTOINT) { + assert(DstTy.isVector() && "Expected an FPR ptrtoint to be a vector"); + I.setDesc(TII.get(TargetOpcode::COPY)); + return true; + } } return false; diff --git a/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp b/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp --- a/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp +++ b/llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp @@ -108,7 +108,7 @@ .minScalarSameAs(1, 0); getActionDefinitionsBuilder(G_PTR_ADD) - .legalFor({{p0, s64}}) + .legalFor({{p0, s64}, {v2p0, v2s64}}) .clampScalar(1, s64, s64); getActionDefinitionsBuilder(G_PTRMASK).legalFor({{p0, s64}}); diff --git a/llvm/test/CodeGen/AArch64/GlobalISel/legalize-ptr-add.mir b/llvm/test/CodeGen/AArch64/GlobalISel/legalize-ptr-add.mir --- a/llvm/test/CodeGen/AArch64/GlobalISel/legalize-ptr-add.mir +++ b/llvm/test/CodeGen/AArch64/GlobalISel/legalize-ptr-add.mir @@ -1,18 +1,18 @@ # NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py # RUN: llc -march=aarch64 -run-pass=legalizer %s -o - | FileCheck %s --- -name: test_gep_small +name: test_ptr_add_small body: | bb.0.entry: - ; CHECK-LABEL: name: test_gep_small + ; CHECK-LABEL: name: test_ptr_add_small ; CHECK: [[COPY:%[0-9]+]]:_(p0) = COPY $x0 ; CHECK: [[COPY1:%[0-9]+]]:_(s64) = COPY $x1 ; CHECK: [[COPY2:%[0-9]+]]:_(s64) = COPY [[COPY1]](s64) ; CHECK: [[C:%[0-9]+]]:_(s64) = G_CONSTANT i64 56 ; CHECK: [[SHL:%[0-9]+]]:_(s64) = G_SHL [[COPY2]], [[C]](s64) ; CHECK: [[ASHR:%[0-9]+]]:_(s64) = G_ASHR [[SHL]], [[C]](s64) - ; CHECK: [[GEP:%[0-9]+]]:_(p0) = G_PTR_ADD [[COPY]], [[ASHR]](s64) - ; CHECK: $x0 = COPY [[GEP]](p0) + ; CHECK: [[PTR_ADD:%[0-9]+]]:_(p0) = G_PTR_ADD [[COPY]], [[ASHR]](s64) + ; CHECK: $x0 = COPY [[PTR_ADD]](p0) %0:_(p0) = COPY $x0 %1:_(s64) = COPY $x1 %2:_(s8) = G_TRUNC %1(s64) @@ -20,3 +20,18 @@ $x0 = COPY %3(p0) ... +--- +name: test_ptr_add_vec_p0 +body: | + bb.0.entry: + ; CHECK-LABEL: name: test_ptr_add_vec_p0 + ; CHECK: [[COPY:%[0-9]+]]:_(<2 x p0>) = COPY $q0 + ; CHECK: [[COPY1:%[0-9]+]]:_(<2 x s64>) = COPY $q1 + ; CHECK: [[PTR_ADD:%[0-9]+]]:_(<2 x p0>) = G_PTR_ADD [[COPY]], [[COPY1]](<2 x s64>) + ; CHECK: $q0 = COPY [[PTR_ADD]](<2 x p0>) + %0:_(<2 x p0>) = COPY $q0 + %1:_(<2 x s64>) = COPY $q1 + %3:_(<2 x p0>) = G_PTR_ADD %0, %1(<2 x s64>) + $q0 = COPY %3(<2 x p0>) + +... diff --git a/llvm/test/CodeGen/AArch64/GlobalISel/select-ptr-add.mir b/llvm/test/CodeGen/AArch64/GlobalISel/select-ptr-add.mir new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/AArch64/GlobalISel/select-ptr-add.mir @@ -0,0 +1,74 @@ +# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py +# RUN: llc -O0 -mtriple=aarch64-apple-ios -run-pass=instruction-select -verify-machineinstrs %s -o - | FileCheck %s -check-prefix=CHECK +--- +name: ptr_add +legalized: true +regBankSelected: true +body: | + bb.0: + liveins: $x0 + ; CHECK-LABEL: name: ptr_add + ; CHECK: [[COPY:%[0-9]+]]:gpr64 = COPY $x0 + ; CHECK: [[COPY1:%[0-9]+]]:gpr64common = COPY [[COPY]] + ; CHECK: [[ADDXri:%[0-9]+]]:gpr64sp = ADDXri [[COPY1]], 42, 0 + ; CHECK: $x0 = COPY [[ADDXri]] + %0:gpr(p0) = COPY $x0 + %1:gpr(s64) = G_CONSTANT i64 42 + %2:gpr(p0) = G_PTR_ADD %0, %1(s64) + $x0 = COPY %2(p0) +... + +--- +name: ptr_add_no_constant +legalized: true +regBankSelected: true +body: | + bb.0: + liveins: $x0, $x1 + ; CHECK-LABEL: name: ptr_add_no_constant + ; CHECK: [[COPY:%[0-9]+]]:gpr64 = COPY $x0 + ; CHECK: [[COPY1:%[0-9]+]]:gpr64 = COPY $x1 + ; CHECK: [[ADDXrr:%[0-9]+]]:gpr64 = ADDXrr [[COPY]], [[COPY1]] + ; CHECK: $x0 = COPY [[ADDXrr]] + %0:gpr(p0) = COPY $x0 + %1:gpr(s64) = COPY $x1 + %2:gpr(p0) = G_PTR_ADD %0, %1(s64) + $x0 = COPY %2(p0) +... + +--- +name: ptr_add_bad_imm +legalized: true +regBankSelected: true +body: | + bb.0: + liveins: $x0, $x1 + ; CHECK-LABEL: name: ptr_add_bad_imm + ; CHECK: [[COPY:%[0-9]+]]:gpr64 = COPY $x0 + ; CHECK: [[MOVi32imm:%[0-9]+]]:gpr32 = MOVi32imm 10000 + ; CHECK: [[SUBREG_TO_REG:%[0-9]+]]:gpr64 = SUBREG_TO_REG 0, [[MOVi32imm]], %subreg.sub_32 + ; CHECK: [[ADDXrr:%[0-9]+]]:gpr64 = ADDXrr [[COPY]], [[SUBREG_TO_REG]] + ; CHECK: $x0 = COPY [[ADDXrr]] + %0:gpr(p0) = COPY $x0 + %1:gpr(s64) = G_CONSTANT i64 10000 + %2:gpr(p0) = G_PTR_ADD %0, %1(s64) + $x0 = COPY %2(p0) +... + +--- +name: ptr_add_vec +legalized: true +regBankSelected: true +body: | + bb.0: + liveins: $q0, $q1 + ; CHECK-LABEL: name: ptr_add_vec + ; CHECK: [[COPY:%[0-9]+]]:fpr128 = COPY $q0 + ; CHECK: [[COPY1:%[0-9]+]]:fpr128 = COPY $q1 + ; CHECK: [[ADDv2i64_:%[0-9]+]]:fpr128 = ADDv2i64 [[COPY]], [[COPY1]] + ; CHECK: $q0 = COPY [[ADDv2i64_]] + %0:fpr(<2 x p0>) = COPY $q0 + %1:fpr(<2 x s64>) = COPY $q1 + %3:fpr(<2 x p0>) = G_PTR_ADD %0, %1(<2 x s64>) + $q0 = COPY %3(<2 x p0>) +... diff --git a/llvm/test/CodeGen/AArch64/GlobalISel/select.mir b/llvm/test/CodeGen/AArch64/GlobalISel/select.mir --- a/llvm/test/CodeGen/AArch64/GlobalISel/select.mir +++ b/llvm/test/CodeGen/AArch64/GlobalISel/select.mir @@ -10,10 +10,6 @@ ret void } - define i8* @ptr_add(i8* %in) { ret i8* undef } - define i8* @ptr_add_no_constant(i8* %in) { ret i8* undef } - define i8* @ptr_add_bad_imm(i8* %in) { ret i8* undef } - define i8* @ptr_mask(i8* %in) { ret i8* undef } @var_local = global i8 0 @@ -53,70 +49,6 @@ ... --- -# CHECK-LABEL: name: ptr_add -name: ptr_add -legalized: true -regBankSelected: true -registers: - - { id: 0, class: gpr } - - { id: 1, class: gpr } - - { id: 2, class: gpr } - -# CHECK: body: -# CHECK: %{{[0-9]+}}:gpr64sp = ADDXri %{{[0-9]+}}, 42, 0 -body: | - bb.0: - liveins: $x0 - %0(p0) = COPY $x0 - %1(s64) = G_CONSTANT i64 42 - %2(p0) = G_PTR_ADD %0, %1(s64) - $x0 = COPY %2(p0) -... - ---- -# CHECK-LABEL: name: ptr_add_no_constant -name: ptr_add_no_constant -legalized: true -regBankSelected: true -registers: - - { id: 0, class: gpr } - - { id: 1, class: gpr } - - { id: 2, class: gpr } - -# CHECK: body: -# CHECK: %{{[0-9]+}}:gpr64 = ADDXrr %{{[0-9]+}}, %{{[0-9]+}} -body: | - bb.0: - liveins: $x0, $x1 - %0(p0) = COPY $x0 - %1(s64) = COPY $x1 - %2(p0) = G_PTR_ADD %0, %1(s64) - $x0 = COPY %2(p0) -... - ---- -# CHECK-LABEL: name: ptr_add_bad_imm -name: ptr_add_bad_imm -legalized: true -regBankSelected: true -registers: - - { id: 0, class: gpr } - - { id: 1, class: gpr } - - { id: 2, class: gpr } - -# CHECK: body: -# CHECK: %0:gpr64 = COPY $x0 -# CHECK: %4:gpr32 = MOVi32imm 10000 -# CHECK: %1:gpr64 = SUBREG_TO_REG 0, %4, %subreg.sub_32 -# CHECK: %{{[0-9]+}}:gpr64 = ADDXrr %0, %1 -body: | - bb.0: - liveins: $x0, $x1 - %0(p0) = COPY $x0 - %1(s64) = G_CONSTANT i64 10000 - %2(p0) = G_PTR_ADD %0, %1(s64) - $x0 = COPY %2(p0) -... --- # CHECK-LABEL: name: ptr_mask