Diff 166498

lib/Target/ARM/ARMLoadStoreOptimizer.cpp

Show First 20 Lines • Show All 1,021 Lines • ▼ Show 20 Lines	do {
// deprecated; LDM to PC is fine but cannot happen here.		// deprecated; LDM to PC is fine but cannot happen here.
if (PReg == ARM::SP \|\| PReg == ARM::PC)		if (PReg == ARM::SP \|\| PReg == ARM::PC)
CanMergeToLSMulti = CanMergeToLSDouble = false;		CanMergeToLSMulti = CanMergeToLSDouble = false;

// Should we be conservative?		// Should we be conservative?
if (AssumeMisalignedLoadStores && !mayCombineMisaligned(STI, MI))		if (AssumeMisalignedLoadStores && !mayCombineMisaligned(STI, MI))
CanMergeToLSMulti = CanMergeToLSDouble = false;		CanMergeToLSMulti = CanMergeToLSDouble = false;

		// vldm / vstm limit are 32 for S variants, 16 for D variants.
		unsigned Limit;
		switch (Opcode) {
		default:
		Limit = UINT_MAX;
		break;
		case ARM::VLDRD:
		case ARM::VSTRD:
		Limit = 16;
		break;
		}

// Merge following instructions where possible.		// Merge following instructions where possible.
for (unsigned I = SIndex+1; I < EIndex; ++I, ++Count) {		for (unsigned I = SIndex+1; I < EIndex; ++I, ++Count) {
int NewOffset = MemOps[I].Offset;		int NewOffset = MemOps[I].Offset;
if (NewOffset != Offset + (int)Size)		if (NewOffset != Offset + (int)Size)
break;		break;
const MachineOperand &MO = getLoadStoreRegOp(*MemOps[I].MI);		const MachineOperand &MO = getLoadStoreRegOp(*MemOps[I].MI);
unsigned Reg = MO.getReg();		unsigned Reg = MO.getReg();
if (Reg == ARM::SP \|\| Reg == ARM::PC)		if (Reg == ARM::SP \|\| Reg == ARM::PC)
break;		break;
		if (Count == Limit)
		break;

// See if the current load/store may be part of a multi load/store.		// See if the current load/store may be part of a multi load/store.
		efriedma (Unsubmitted, Done): Instead of disabling merging, could we just do something like "if (Count == Limit) break;", so we merge the first 16 stores, then consider any remaining stores as a separate set?
		LukeCheeseman (Author, Unsubmitted, Not Done): Ah yes, that's a much better idea. Thanks.
unsigned RegNum = MO.isUndef() ? std::numeric_limits<unsigned>::max()		unsigned RegNum = MO.isUndef() ? std::numeric_limits<unsigned>::max()
: TRI->getEncodingValue(Reg);		: TRI->getEncodingValue(Reg);
bool PartOfLSMulti = CanMergeToLSMulti;		bool PartOfLSMulti = CanMergeToLSMulti;
if (PartOfLSMulti) {		if (PartOfLSMulti) {
// Register numbers must be in ascending order.		// Register numbers must be in ascending order.
if (RegNum <= PRegNum)		if (RegNum <= PRegNum)
PartOfLSMulti = false;		PartOfLSMulti = false;
// For VFP / NEON load/store multiples, the registers must be		// For VFP / NEON load/store multiples, the registers must be
Show All 23 Lines	do {

// Form a candidate from the Ops collected so far.		// Form a candidate from the Ops collected so far.
MergeCandidate *Candidate = new(Allocator.Allocate()) MergeCandidate;		MergeCandidate *Candidate = new(Allocator.Allocate()) MergeCandidate;
for (unsigned C = SIndex, CE = SIndex + Count; C < CE; ++C)		for (unsigned C = SIndex, CE = SIndex + Count; C < CE; ++C)
Candidate->Instrs.push_back(MemOps[C].MI);		Candidate->Instrs.push_back(MemOps[C].MI);
Candidate->LatestMIIdx = Latest - SIndex;		Candidate->LatestMIIdx = Latest - SIndex;
Candidate->EarliestMIIdx = Earliest - SIndex;		Candidate->EarliestMIIdx = Earliest - SIndex;
Candidate->InsertPos = MemOps[Latest].Position;		Candidate->InsertPos = MemOps[Latest].Position;
if (Count == 1)		if (Count == 1)
		efriedma (Unsubmitted, Done): This limit isn't actually useful...? There are only 32 float registers anyway.
CanMergeToLSMulti = CanMergeToLSDouble = false;		CanMergeToLSMulti = CanMergeToLSDouble = false;
Candidate->CanMergeToLSMulti = CanMergeToLSMulti;		Candidate->CanMergeToLSMulti = CanMergeToLSMulti;
Candidate->CanMergeToLSDouble = CanMergeToLSDouble;		Candidate->CanMergeToLSDouble = CanMergeToLSDouble;
Candidates.push_back(Candidate);		Candidates.push_back(Candidate);
// Continue after the chain.		// Continue after the chain.
SIndex += Count;		SIndex += Count;
} while (SIndex < EIndex);		} while (SIndex < EIndex);
}		}
▲ Show 20 Lines • Show All 762 Lines • ▼ Show 20 Lines	if (Candidate->CanMergeToLSMulti \|\| Candidate->CanMergeToLSDouble) {
MergeBaseUpdateLSMultiple(Merged);		MergeBaseUpdateLSMultiple(Merged);
} else {		} else {
for (MachineInstr *MI : Candidate->Instrs) {		for (MachineInstr *MI : Candidate->Instrs) {
if (MergeBaseUpdateLoadStore(MI))		if (MergeBaseUpdateLoadStore(MI))
Changed = true;		Changed = true;
}		}
}		}
} else {		} else {
assert(Candidate->Instrs.size() == 1);		assert(Candidate->Instrs.size() == 1);
efriedma (Unsubmitted, Not Done): How is this change related?
if (MergeBaseUpdateLoadStore(Candidate->Instrs.front()))		if (MergeBaseUpdateLoadStore(Candidate->Instrs.front()))
Changed = true;		Changed = true;
}		}
}		}
Candidates.clear();		Candidates.clear();
// Try to fold add/sub into the LDRD/STRD formed by ARMPreAllocLoadStoreOpt.		// Try to fold add/sub into the LDRD/STRD formed by ARMPreAllocLoadStoreOpt.
for (MachineInstr *MI : MergeBaseCandidates)		for (MachineInstr *MI : MergeBaseCandidates)
MergeBaseUpdateLSDouble(*MI);		MergeBaseUpdateLSDouble(*MI);
▲ Show 20 Lines • Show All 580 Lines • Show Last 20 Lines

test/CodeGen/ARM/load_store_opt_reg_limit.mir

This file was added.

				# RUN: llc -mtriple=thumbv7--linux-android -verify-machineinstrs -run-pass=arm-ldst-opt %s -o - \| FileCheck %s --check-prefix=CHECK-MERGE
				#CHECK-MERGE: foo
				name: foo
				# CHECK-MERGE: VSTMDIA $r4, 14, $noreg, $d15, $d16, $d17, $d18, $d19, $d20, $d21, $d22, $d23, $d24, $d25, $d26, $d27, $d28, $d29, $d30
				# CHECK-MERGE-NEXT: VSTRD $d31, $r4, 32, 14, $noreg :: (store 8)
				# CHECK-MERGE: VSTMDIA killed $r0, 14, $noreg, $d4, $d5, $d6, $d7, $d8, $d9, $d10, $d11, $d12, $d13, $d14
				body: \|
				bb.0:
				VSTRD $d15, $r4, 0, 14, $noreg :: (store 8)
				VSTRD $d16, $r4, 2, 14, $noreg :: (store 8)
				VSTRD $d17, $r4, 4, 14, $noreg :: (store 8)
				MatzeB (Unsubmitted, Done): You should be able to drop the whole IR block too, I think.
				VSTRD $d18, $r4, 6, 14, $noreg :: (store 8)
				VSTRD $d19, $r4, 8, 14, $noreg :: (store 8)
				MatzeB (Unsubmitted, Done): Better style: `# CHECK-LABEL: name: _Z2brR1lI1ME` (may also consider choosing a simpler function name).
				VSTRD $d20, $r4, 10, 14, $noreg :: (store 8)
				VSTRD $d21, $r4, 12, 14, $noreg :: (store 8)
				VSTRD $d22, $r4, 14, 14, $noreg :: (store 8)
				VSTRD $d23, $r4, 16, 14, $noreg :: (store 8)
				VSTRD $d24, $r4, 18, 14, $noreg :: (store 8)
				VSTRD $d25, $r4, 20, 14, $noreg :: (store 8)
				VSTRD $d26, $r4, 22, 14, $noreg :: (store 8)
				VSTRD $d27, $r4, 24, 14, $noreg :: (store 8)
				VSTRD $d28, $r4, 26, 14, $noreg :: (store 8)
				VSTRD $d29, $r4, 28, 14, $noreg :: (store 8)
				VSTRD $d30, $r4, 30, 14, $noreg :: (store 8)
				VSTRD $d31, $r4, 32, 14, $noreg :: (store 8)
				VSTRD $d0, $r4, 34, 14, $noreg :: (store 8)
				VSTRD $d1, $r4, 36, 14, $noreg :: (store 8)
				VSTRD $d3, $r4, 38, 14, $noreg :: (store 8)
				VSTRD $d2, $r4, 40, 14, $noreg :: (store 8)
				VSTRD $d4, $r4, 42, 14, $noreg :: (store 8)
				VSTRD $d5, $r4, 44, 14, $noreg :: (store 8)
				VSTRD $d6, $r4, 46, 14, $noreg :: (store 8)
				VSTRD $d7, $r4, 48, 14, $noreg :: (store 8)
				VSTRD $d8, $r4, 50, 14, $noreg :: (store 8)
				VSTRD $d9, $r4, 52, 14, $noreg :: (store 8)
				VSTRD $d10, $r4, 54, 14, $noreg :: (store 8)
				VSTRD $d11, $r4, 56, 14, $noreg :: (store 8)
				VSTRD $d12, $r4, 58, 14, $noreg :: (store 8)
				VSTRD $d13, $r4, 60, 14, $noreg :: (store 8)
				VSTRD $d14, $r4, 62, 14, $noreg :: (store 8)

This is an archive of the discontinued LLVM Phabricator instance.

[ARM][ARMLoadStoreOptimizer]
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 166498

lib/Target/ARM/ARMLoadStoreOptimizer.cpp

test/CodeGen/ARM/load_store_opt_reg_limit.mir

This is an archive of the discontinued LLVM Phabricator instance.

[ARM][ARMLoadStoreOptimizer]ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 166498

lib/Target/ARM/ARMLoadStoreOptimizer.cpp

test/CodeGen/ARM/load_store_opt_reg_limit.mir

[ARM][ARMLoadStoreOptimizer]
ClosedPublic