Diff 113378

lib/Target/Mips/MipsISelLowering.h

Context not available.
	MipsCCState &State) const;	MipsCCState &State) const;

	/// passByValArg - Pass a byval argument in registers or on stack.	/// passByValArg - Pass a byval argument in registers or on stack.
	void passByValArg(SDValue Chain, const SDLoc &DL,	SDValue passByValArg(SDValue Chain, const SDLoc &DL,
	std::deque<std::pair<unsigned, SDValue>> &RegsToPass,	std::deque<std::pair<unsigned, SDValue>> &RegsToPass,
	SmallVectorImpl<SDValue> &MemOpChains, SDValue StackPtr,	SmallVectorImpl<SDValue> &MemOpChains,
	MachineFrameInfo &MFI, SelectionDAG &DAG, SDValue Arg,	SDValue StackPtr, MachineFrameInfo &MFI,
	unsigned FirstReg, unsigned LastReg,	SelectionDAG &DAG, SDValue Arg, unsigned FirstReg,
	const ISD::ArgFlagsTy &Flags, bool isLittle,	unsigned LastReg, const ISD::ArgFlagsTy &Flags,
	const CCValAssign &VA) const;	bool isLittle, const CCValAssign &VA) const;

	/// writeVarArgRegs - Write variable function arguments passed in registers	/// writeVarArgRegs - Write variable function arguments passed in registers
	/// to the stack. Also create a stack frame object for the first variable	/// to the stack. Also create a stack frame object for the first variable
Context not available.

lib/Target/Mips/MipsISelLowering.cpp

Context not available.
	if (IsTailCall)	if (IsTailCall)
	++NumTailCalls;	++NumTailCalls;

	// Chain is the output chain of the last Load/Store or CopyToReg node.
	// ByValChain is the output chain of the last Memcpy node created for copying
	// byval arguments to the stack.
	unsigned StackAlignment = TFL->getStackAlignment();
	NextStackOffset = alignTo(NextStackOffset, StackAlignment);
	SDValue NextStackOffsetVal = DAG.getIntPtrConstant(NextStackOffset, DL, true);

	if (!IsTailCall)
	Chain = DAG.getCALLSEQ_START(Chain, NextStackOffset, 0, DL);

	SDValue StackPtr =	SDValue StackPtr =
	DAG.getCopyFromReg(Chain, DL, ABI.IsN64() ? Mips::SP_64 : Mips::SP,	DAG.getCopyFromReg(Chain, DL, ABI.IsN64() ? Mips::SP_64 : Mips::SP,
	getPointerTy(DAG.getDataLayout()));	getPointerTy(DAG.getDataLayout()));
Context not available.
	assert(ByValIdx < CCInfo.getInRegsParamsCount());	assert(ByValIdx < CCInfo.getInRegsParamsCount());
	assert(!IsTailCall &&	assert(!IsTailCall &&
	"Do not tail-call optimize if there is a byval argument.");	"Do not tail-call optimize if there is a byval argument.");
	passByValArg(Chain, DL, RegsToPass, MemOpChains, StackPtr, MFI, DAG, Arg,	Chain = passByValArg(Chain, DL, RegsToPass, MemOpChains, StackPtr, MFI,
	FirstByValReg, LastByValReg, Flags, Subtarget.isLittle(),	DAG, Arg, FirstByValReg, LastByValReg, Flags,
	VA);	Subtarget.isLittle(), VA);
	CCInfo.nextInRegsParam();	CCInfo.nextInRegsParam();
	continue;	continue;
	}	}
Context not available.
	EVT Ty = Callee.getValueType();	EVT Ty = Callee.getValueType();
	bool GlobalOrExternal = false, IsCallReloc = false;	bool GlobalOrExternal = false, IsCallReloc = false;

		// Chain is the output chain of the last Load/Store or CopyToReg node.
		// ByValChain is the output chain of the last Memcpy node created for copying
		// byval arguments to the stack.
		unsigned StackAlignment = TFL->getStackAlignment();
		NextStackOffset = alignTo(NextStackOffset, StackAlignment);
		SDValue NextStackOffsetVal = DAG.getIntPtrConstant(NextStackOffset, DL, true);

		if (!IsTailCall)
		Chain = DAG.getCALLSEQ_START(Chain, NextStackOffset, 0, DL);

	// The long-calls feature is ignored in case of PIC.	// The long-calls feature is ignored in case of PIC.
	// While we do not support -mshared / -mno-shared properly,	// While we do not support -mshared / -mno-shared properly,
	// ignore long-calls in case of -mabicalls too.	// ignore long-calls in case of -mabicalls too.
Context not available.
	}	}

	// Copy byVal arg to registers and stack.	// Copy byVal arg to registers and stack.
	void MipsTargetLowering::passByValArg(	SDValue MipsTargetLowering::passByValArg(
	SDValue Chain, const SDLoc &DL,	SDValue Chain, const SDLoc &DL,
	std::deque<std::pair<unsigned, SDValue>> &RegsToPass,	std::deque<std::pair<unsigned, SDValue>> &RegsToPass,
	SmallVectorImpl<SDValue> &MemOpChains, SDValue StackPtr,	SmallVectorImpl<SDValue> &MemOpChains, SDValue StackPtr,
Context not available.

	// Return if the struct has been fully copied.	// Return if the struct has been fully copied.
	if (ByValSizeInBytes == OffsetInBytes)	if (ByValSizeInBytes == OffsetInBytes)
	return;	return Chain;

	// Copy the remainder of the byval argument with sub-word loads and shifts.	// Copy the remainder of the byval argument with sub-word loads and shifts.
	if (LeftoverBytes) {	if (LeftoverBytes) {
Context not available.

	unsigned ArgReg = ArgRegs[FirstReg + I];	unsigned ArgReg = ArgRegs[FirstReg + I];
	RegsToPass.push_back(std::make_pair(ArgReg, Val));	RegsToPass.push_back(std::make_pair(ArgReg, Val));
	return;	return Chain;
	}	}
	}	}

Context not available.
	DAG.getConstant(OffsetInBytes, DL, PtrTy));	DAG.getConstant(OffsetInBytes, DL, PtrTy));
	SDValue Dst = DAG.getNode(ISD::ADD, DL, PtrTy, StackPtr,	SDValue Dst = DAG.getNode(ISD::ADD, DL, PtrTy, StackPtr,
	DAG.getIntPtrConstant(VA.getLocMemOffset(), DL));	DAG.getIntPtrConstant(VA.getLocMemOffset(), DL));
	Chain = DAG.getMemcpy(Chain, DL, Dst, Src,	Chain = DAG.getMemcpy(
	DAG.getConstant(MemCpySize, DL, PtrTy),	Chain, DL, Dst, Src, DAG.getConstant(MemCpySize, DL, PtrTy), Alignment,
	Alignment, /isVolatile=/false, /AlwaysInline=/false,	/isVolatile=/false, /AlwaysInline=/false,
	/isTailCall=/false,	/isTailCall=/false, MachinePointerInfo(), MachinePointerInfo());
	MachinePointerInfo(), MachinePointerInfo());
	MemOpChains.push_back(Chain);	MemOpChains.push_back(Chain);

		return Chain;
	}	}

	void MipsTargetLowering::writeVarArgRegs(std::vector<SDValue> &OutChains,	void MipsTargetLowering::writeVarArgRegs(std::vector<SDValue> &OutChains,
Context not available.

test/CodeGen/Mips/callseq_order.ll

This file was added.

				; RUN: llc -mtriple=mipsel-linux-gnu -mcpu=mips32 -o /dev/null \
				; RUN: --debug %s 2>&1 \| FileCheck %s
				sdardis [Unsubmitted, Done]: You can drop the CPU specification portion of the llc invocations here; the defaults of 32r2 and 64r2 should be sufficient to test the logic that has been changed.
				; RUN: llc -mtriple=mips64el-linux-gnu -mcpu=mips64 -o /dev/null \
				; RUN: --debug %s 2>&1 \| FileCheck %s
				; RUN: llc -mtriple=mips-linux-gnu -mcpu=mips32 -o /dev/null \
				; RUN: --debug %s 2>&1 \| FileCheck %s
				; RUN: llc -mtriple=mips64-linux-gnu -mcpu=mips64 -o /dev/null \
				; RUN: --debug %s 2>&1 \| FileCheck %s

				sdardisUnsubmitted Done Reply Inline Actions Add -verify-machineinstrs to these llc commands. sdardis: Add -verify-machineinstrs to these llc commands.
				sdardisUnsubmitted Done Reply Inline Actions These can have -stop-before=expand-isel-pseudos to terminate llc early. sdardis: These can have -stop-before=expand-isel-pseudos to terminate llc early.

				%struct.Str1 = type { [64 x i32] }

				@s1 = common global %struct.Str1 zeroinitializer, align 4

				; Function Attrs: noinline nounwind optnone
				define void @foo1() #0 {
				sdardisUnsubmitted Done Reply Inline Actions This and the one below can be removed. sdardis: This and the one below can be removed.
				entry:
				sdardisUnsubmitted Done Reply Inline Actions The #0 and the #1s below can be removed. sdardis: The #0 and the #1s below can be removed.
				call void @bar1(%struct.Str1* byval align 4 @s1)
				ret void
				; CHECK-LABEL: Optimized legalized selection DAG: BB#0 'foo1:entry'
				; CHECK: t[[T0:[0-9]+]]: ch,glue = callseq_start
				; CHECK: t[[T1:[0-9]+]]: ch,glue = MipsISD::JmpLink t[[T0]]
				; CHECK: t[[T2:[0-9]+]]: ch,glue = callseq_end t[[T1]]
				; CHECK: t[[T3:[0-9]+]]: i{{(32\|64)}},ch,glue = CopyFromReg t[[T2]]
				; CHECK: t[[T4:[0-9]+]]: ch = TokenFactor {{(t[0-9]+:1, )+}}t[[T3]]:1
				; CHECK: t[[T5:[0-9]+]]: ch,glue = callseq_start t[[T4]]
				; CHECK: t[[T6:[0-9]+]]: ch,glue = MipsISD::JmpLink t[[T5]]
				; CHECK: callseq_end t[[T6]]
				; CHECK-LABEL: Instruction selection begins: BB#0 'entry'
				}

				declare void @bar1(%struct.Str1* byval align 4) #1

				; Function Attrs: noinline nounwind optnone
				define void @foo2() #0 {
				entry:
				call void @bar2(%struct.Str1* byval align 4 @s1, %struct.Str1* byval align 4 @s1)
				ret void
				; CHECK-LABEL: Optimized legalized selection DAG: BB#0 'foo2:entry'
				; CHECK: t[[T0:[0-9]+]]: ch,glue = callseq_start
				; CHECK: t[[T1:[0-9]+]]: ch,glue = MipsISD::JmpLink t[[T0]]
				; CHECK: t[[T2:[0-9]+]]: ch,glue = callseq_end t[[T1]]
				; CHECK: t[[T3:[0-9]+]]: i{{(32\|64)}},ch,glue = CopyFromReg t[[T2]]
				; CHECK: t[[T4:[0-9]+]]: ch,glue = callseq_start t[[T3]]
				; CHECK: t[[T5:[0-9]+]]: ch,glue = MipsISD::JmpLink t[[T4]]
				; CHECK: t[[T6:[0-9]+]]: ch,glue = callseq_end t[[T5]]
				; CHECK: t[[T7:[0-9]+]]: i{{(32\|64)}},ch,glue = CopyFromReg t[[T6]]
				; CHECK: t[[T8:[0-9]+]]: ch = TokenFactor {{(t[0-9]+:1, )+}}t[[T3]]:1, t[[T7]]:1
				; CHECK: t[[T9:[0-9]+]]: ch,glue = callseq_start t[[T8]]
				; CHECK: t[[T10:[0-9]+]]: ch,glue = MipsISD::JmpLink t[[T9]]
				; CHECK: callseq_end t[[T10]]
				; CHECK-LABEL: Instruction selection begins: BB#0 'entry'
				sdardis [Unsubmitted, Done]: Rather than matching SelectionDAG's output, can you instead match the end output of -debug-only=isel and ensure that the output is a sequence of ADJCALLSTACKDOWN, ADJCALLSTACKUP which are not nested and match the memcpy calls where they occur?
				}

				declare void @bar2(%struct.Str1* byval align 4, %struct.Str1* byval align 4) #1

test/CodeGen/Mips/llvm-ir/mul.ll

Context not available.
	; MM64R6: daddu $2, $[[T1]], $[[T0]]	; MM64R6: daddu $2, $[[T1]], $[[T0]]
	; MM64R6-DAG: dmul $3, $5, $7	; MM64R6-DAG: dmul $3, $5, $7

	; MM32: lw $25, %call16(__multi3)($16)	; MM32: lw $25, %call16(__multi3)($[[T0:[0-9]+]])
		sdardis [Unsubmitted, Done]: You don't need to bind the register number to a FileCheck variable in this case, as it's unused afterwards. Either match it with {{[0-9a-z]+}} or drop the register portion, as we're interested in matching the "lw $25, %call16(__multi3)" part of the instruction. This applies to the following test changes as well.

	%r = mul i128 %a, %b	%r = mul i128 %a, %b
	ret i128 %r	ret i128 %r
Context not available.

test/CodeGen/Mips/llvm-ir/sdiv.ll

Context not available.
	; GP64-NOT-R6: ld $25, %call16(__divti3)($gp)	; GP64-NOT-R6: ld $25, %call16(__divti3)($gp)
	; 64R6: ld $25, %call16(__divti3)($gp)	; 64R6: ld $25, %call16(__divti3)($gp)

	; MM32: lw $25, %call16(__divti3)($16)	; MM32: lw $25, %call16(__divti3)($[[T0:[0-9]+]])

	; MM64: ld $25, %call16(__divti3)($2)	; MM64: ld $25, %call16(__divti3)($2)

Context not available.

test/CodeGen/Mips/llvm-ir/srem.ll

Context not available.
	; GP64-NOT-R6: ld $25, %call16(__modti3)($gp)	; GP64-NOT-R6: ld $25, %call16(__modti3)($gp)
	; 64R6: ld $25, %call16(__modti3)($gp)	; 64R6: ld $25, %call16(__modti3)($gp)

	; MM32: lw $25, %call16(__modti3)($16)	; MM32: lw $25, %call16(__modti3)($[[T0:[0-9]+]])

	; MM64: ld $25, %call16(__modti3)($2)	; MM64: ld $25, %call16(__modti3)($2)

Context not available.

test/CodeGen/Mips/llvm-ir/udiv.ll

Context not available.
	; GP64-NOT-R6: ld $25, %call16(__udivti3)($gp)	; GP64-NOT-R6: ld $25, %call16(__udivti3)($gp)
	; 64-R6: ld $25, %call16(__udivti3)($gp)	; 64-R6: ld $25, %call16(__udivti3)($gp)

	; MM32: lw $25, %call16(__udivti3)($16)	; MM32: lw $25, %call16(__udivti3)($[[T0:[0-9]+]])

	; MM64: ld $25, %call16(__udivti3)($2)	; MM64: ld $25, %call16(__udivti3)($2)

Context not available.

test/CodeGen/Mips/llvm-ir/urem.ll

Context not available.
	; GP64-NOT-R6: ld $25, %call16(__umodti3)($gp)	; GP64-NOT-R6: ld $25, %call16(__umodti3)($gp)
	; 64R6: ld $25, %call16(__umodti3)($gp)	; 64R6: ld $25, %call16(__umodti3)($gp)

	; MM32: lw $25, %call16(__umodti3)($16)	; MM32: lw $25, %call16(__umodti3)($[[T0:[0-9]+]])

	; MM64: ld $25, %call16(__umodti3)($2)	; MM64: ld $25, %call16(__umodti3)($2)

Context not available.

This is an archive of the discontinued LLVM Phabricator instance.

[mips] Reordering callseq* nodes to be linear
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 113378

lib/Target/Mips/MipsISelLowering.h

lib/Target/Mips/MipsISelLowering.cpp

test/CodeGen/Mips/callseq_order.ll

test/CodeGen/Mips/llvm-ir/mul.ll

test/CodeGen/Mips/llvm-ir/sdiv.ll

test/CodeGen/Mips/llvm-ir/srem.ll

test/CodeGen/Mips/llvm-ir/udiv.ll

test/CodeGen/Mips/llvm-ir/urem.ll

This is an archive of the discontinued LLVM Phabricator instance.

[mips] Reordering callseq* nodes to be linear
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 113378

lib/Target/Mips/MipsISelLowering.h

lib/Target/Mips/MipsISelLowering.cpp

test/CodeGen/Mips/callseq_order.ll

test/CodeGen/Mips/llvm-ir/mul.ll

test/CodeGen/Mips/llvm-ir/sdiv.ll

test/CodeGen/Mips/llvm-ir/srem.ll

test/CodeGen/Mips/llvm-ir/udiv.ll

test/CodeGen/Mips/llvm-ir/urem.ll

[mips] Reordering callseq* nodes to be linear
ClosedPublic