This is an archive of the discontinued LLVM Phabricator instance.

lib/CodeGen/GlobalISel/LegalizerHelper.cpp
756	Hi Matt @arsenm, Looks like adding `widenScalarDst` call for type index 0 is not enough to adjust the widening to the new type constraints in full. All the code below it that now would handle type index 1 widening appears to be written under the assumption that destination and source types are the same, and it widens both, source and the destination. It was perfectly fine an assumption before, but not anymore. If the source needs to be widened, it generates incorrect code. Here's a unit test that reproduces one of the possible issues (thanks Aditya @aditya_nandakumar for coming up with it!): diff --git a/unittests/CodeGen/GlobalISel/LegalizerHelperTest.cpp b/unittests/CodeGen/GlobalISel/LegalizerHelperTest.cpp index 815f1e3d321..a5798693c08 100644 --- a/unittests/CodeGen/GlobalISel/LegalizerHelperTest.cpp +++ b/unittests/CodeGen/GlobalISel/LegalizerHelperTest.cpp @@ -341,6 +341,31 @@ TEST_F(GISelMITest, WidenBitCountingCTPOP) { EXPECT_TRUE(CheckMachineFunction(MF, CheckStr)) << MF; } +// CTPOP widening. +TEST_F(GISelMITest, WidenBitCountingCTPOP1) { + if (!TM) + return; + + // Declare your legalization info + DefineLegalizerInfo(A, { + getActionDefinitionsBuilder(G_CTPOP).legalFor({{s16, s16}}); + }); + // Build + // Trunc it to s8. + LLT s8{LLT::scalar(8)}; + LLT s16{LLT::scalar(16)}; + auto MIBTrunc = B.buildTrunc(s8, Copies[0]); + auto MIBCTPOP = B.buildInstr(TargetOpcode::G_CTPOP, {s16}, {MIBTrunc}); + AInfo Info(MF->getSubtarget()); + DummyGISelObserver Observer; + LegalizerHelper Helper(MF, Info, Observer, B); + EXPECT_TRUE(Helper.widenScalar(MIBCTPOP, 1, s16) == + LegalizerHelper::LegalizeResult::Legalized); + + + MF->dump(); +} + // CTTZ_ZERO_UNDEF widening. TEST_F(GISelMITest, WidenBitCountingCTTZ_ZERO_UNDEF) { if (!TM) Could you please take a look at this?
test/CodeGen/AMDGPU/GlobalISel/legalize-ctlz.mir
78	Is this really legal?
unittests/CodeGen/GlobalISel/LegalizerHelperTest.cpp
338	Another example of the behavior - isn't widening for type index 1 supposed to widen only the source? But as can be seen here, it ends up widening both the source and the destination. The resulting code isn't broken largely because the source and destination types of the input instruction are the same.

These are all bugs hidden by not calling the observer when doing the index 0 legalization

unittests/CodeGen/GlobalISel/LegalizerHelperTest.cpp
338	Yes, for these the source and dest can be separately legalized

arsenm marked an inline comment as done.Feb 4 2019, 2:26 PM

arsenm added inline comments.

lib/CodeGen/GlobalISel/LegalizerHelper.cpp
756	Try r353102

rtereshin added a subscriber: qcolombet.Feb 4 2019, 3:48 PM

rtereshin added inline comments.

lib/CodeGen/GlobalISel/LegalizerHelper.cpp

756

Hi Matt,

That's much better, thank you!

I feel a little bit divided though about the fact that in some cases widening one type index ends up changing the type of the other type index.

For instance, in this case widening type index 1 ends up also widening type index 0:

// CTLZ widening.
TEST_F(GISelMITest, WidenBitCountingCTLZ) {
  if (!TM)
    return;

  // Declare your legalization info
  DefineLegalizerInfo(A, {
    getActionDefinitionsBuilder(G_CTLZ).legalFor({{s16, s16}});
  });
  // Build
  // Trunc it to s8.
  LLT s8{LLT::scalar(8)};
  LLT s16{LLT::scalar(16)};
  auto MIBTrunc = B.buildTrunc(s8, Copies[0]);
  auto MIBCTLZ = B.buildInstr(TargetOpcode::G_CTLZ, {s8}, {MIBTrunc}); // We start with the type signature {s8, s8}
  AInfo Info(MF->getSubtarget());
  DummyGISelObserver Observer;
  LegalizerHelper Helper(*MF, Info, Observer, B);
  EXPECT_TRUE(Helper.widenScalar(*MIBCTLZ, 1, s16) ==  // We ask the API to widen type index 1 to s16, probably expecting type signature {s8, s16} as a result
              LegalizerHelper::LegalizeResult::Legalized);

  auto CheckStr = R"(
  CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC
  CHECK: [[Zext:%[0-9]+]]:_(s16) = G_ZEXT [[Trunc]]
  CHECK: [[Ctlz:%[0-9]+]]:_(s16) = G_CTLZ [[Zext]]  # The API ends up widening not just type index 1, but also type index 0 with the resulting {s16, s16} type signature
  CHECK: [[Cst8:%[0-9]+]]:_(s16) = G_CONSTANT i16 8
  CHECK: [[Sub:%[0-9]+]]:_(s16) = G_SUB [[Ctlz]]:_, [[Cst8]]:_
  CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC [[Sub]]
  )";

  // Check
  EXPECT_TRUE(CheckMachineFunction(*MF, CheckStr)) << *MF;
}

In this other case widening type index 1 ends up also narrowing type index 0:

// Test a strange case where the result is wider than the source
TEST_F(GISelMITest, WidenBitCountingCTPOP2) {
  if (!TM)
    return;

  // Declare your legalization info
  DefineLegalizerInfo(A, {
      getActionDefinitionsBuilder(G_CTPOP).legalFor({{s32, s16}});
    });

  // Build
  // Trunc it to s8.
  LLT s8{LLT::scalar(8)};
  LLT s16{LLT::scalar(16)};
  LLT s32{LLT::scalar(32)};
  auto MIBTrunc = B.buildTrunc(s8, Copies[0]);
  auto MIBCTPOP = B.buildInstr(TargetOpcode::G_CTPOP, {s32}, {MIBTrunc}); // We start with type signature {s32, s8}
  AInfo Info(MF->getSubtarget());
  DummyGISelObserver Observer;
  LegalizerHelper Helper(*MF, Info, Observer, B);
  EXPECT_EQ(LegalizerHelper::LegalizeResult::Legalized,  // We ask the API to widen type index 1 to s16, probably expecting {s32, s16} as a result
            Helper.widenScalar(*MIBCTPOP, 1, s16));

  auto CheckStr = R"(
  CHECK: [[TRUNC:%[0-9]+]]:_(s8) = G_TRUNC %0:_(s64)
  CHECK: [[ZEXT:%[0-9]+]]:_(s16) = G_ZEXT [[TRUNC]]:_(s8)
  CHECK: [[CTPOP:%[0-9]+]]:_(s16) = G_CTPOP [[ZEXT]]  # API ends up narrowing the type index 0 in the process with {s16, s16} type signature as a result.
  CHECK: [[COPY:%[0-9]+]]:_(s32) = G_ZEXT [[CTPOP]]:_(s16)
  )";

  EXPECT_TRUE(CheckMachineFunction(*MF, CheckStr)) << *MF;
}

I talked to @aditya_nandakumar, @volkan, and @qcolombet offline and it appears that we don't have any contract about what pre-defined operations like widenScalar, narrowScalar etc. are allowed to do with the type indices not included in the request, but I think it may be worth introducing such a contract. Specifically the one that would state that it's guaranteed that these generic, pre-defined operations aren't allowed to change the types of the type indices except the one(s) explicitly included in the request.

I think not having these operations following such a contract makes their behavior quite unexpected for anyone who focuses on writing legalization rules for their target w/o having an extensive knowledge about what exactly the implementation of the pre-defined API-provided operations looks like. In particular, I think it might make it easier for the users to accidentally introduce loops in legalization rules, and harder for them to understand where they are coming from.

Please let me know what you think!

Thanks,
Roman

arsenm marked an inline comment as done.Feb 4 2019, 3:58 PM

arsenm added inline comments.

lib/CodeGen/GlobalISel/LegalizerHelper.cpp
756	I don't think it's possible in general to avoid changing other type indexes. For example, FewerElements for a select's condition type requires doing the same FewerElements for the select type. The same applies for any vector cast. The two type indexes won't match, but they still need to have the same number of elements. I don't think these examples actually show this though. Note in these examples, these aren't producing the fully legalized operation. They're only doing one step, but need at least one more to legalize the operation

arsenm marked an inline comment as done.Feb 4 2019, 4:08 PM

arsenm added inline comments.

lib/CodeGen/GlobalISel/LegalizerHelper.cpp
756	A bigger problem I have is that the order of legalization steps matters. The intermediate operations will be done in a different type if you specify the legalize actions for type index 1 before 0 vs. the other way around. You wouldn't see the new operation with the narrower type if you legalized in the other order

rtereshin added inline comments.Feb 4 2019, 4:13 PM

lib/CodeGen/GlobalISel/LegalizerHelper.cpp
756	A bigger problem I have is the order of legalization steps matters. The intermediate operations will be done in a different type if you specify the legalize actions for type index 1 before 0 vs. the other way around. You wouldn't see the new operation with the narrower type if you legalized in the other order That's a very good point!

dsanders added inline comments.Feb 4 2019, 4:16 PM

lib/CodeGen/GlobalISel/LegalizerHelper.cpp
756	I generally agree that the types should generally be modified independently. Not following that makes it fairly easy to get into infinite loops where one type is too big and one is too small. However... There are some difficulties with such a rule though (at least with the current definitions of operations). Suppose you have: %dst:(s4) = G_EXTRACT %src:(s16), %idx:s32 and the legalizer is told to widen %dst to s32. G_EXTRACT currently expects all the result bits to originate from the input which isn't possible if the input stays fixed at s16. Arguably, G_EXTRACT should have a size operand anyway at which point we can treat the excess bits as an any-extension. There are also some performance costs to such a rule as it increases the number of hops needed to get from illegal to legal. I generally think targets should be allowed to leap directly to the right answer whenever possible. From that point of view, the limitation that we can only specify one index and type as the target for a legalization step is a bit of a nuisance. Personally, I'd like to replace the LegalizationAction with a function pointer that just performs the desired change and have a standard library of actions that can be called for the common changes. This also has the nice side-benefit of removing the Custom action and the limitations that has (the opcode must always be changed to something that is Legal rather than Custom).

qcolombet added inline comments.Feb 5 2019, 9:53 AM

lib/CodeGen/GlobalISel/LegalizerHelper.cpp
756	For example, FewerElements for a select's condition type requires doing the same FewerElements for the select type. The same applies for any vector cast. The two type indexes won't match, but they still need to have the same number of elements. That's a good example, but that doesn't mean we shouldn't come up with some kind of contract. The thing I am after is a way to tell if we are creating loops in our legalization rules. I haven't thought about whether this is practical, but we could imagine that the contract is that we don't change the element type of the other operands. The number of elements can change but in a reasonable way (at least for the generic code, custom legalization does what it wants). What do you think?

Personally, I'd like to replace the LegalizationAction with a function pointer that just performs the desired change and have a standard library of actions that can be called for the common changes.

@dsanders didn't we try something like that for ISel and the performance was terrible?

Should we revert this change to have the conversation going or am I the only one unhappy with the absence of guarantees for the other operands?

In D57243#1385507, @qcolombet wrote:

Personally, I'd like to replace the LegalizationAction with a function pointer that just performs the desired change and have a standard library of actions that can be called for the common changes.

@dsanders didn't we try something like that for ISel and the performance was terrible?

You're thinking of the hundreds-thousands of single-use lambdas that were generated. It was the ugly temporary code that was used to inject multiple statements inside an if-statement condition and looked like this:

if ([&](...) {
    if (!...) return false;
    if (!...) return false;
    if (!...) return false;
    if (!...) return false;
    return true;
    }(Arg1, Arg2)) {
      ...
}

The legalizer is already done the way I'm talking about on the rule matching side and performance was marginally better on average than the old setAction() interface.

arsenm marked an inline comment as done.Feb 5 2019, 10:11 AM

arsenm added inline comments.

lib/CodeGen/GlobalISel/LegalizerHelper.cpp
756	I guess it depends what you mean by changing the other types. In this case with these, this is really expanding the operation which happens to involve a new instance of the same operation in the requested narrowed type. Other operations really have type constraints not expressed in the simple, independent type index list (like build_vector requiring the input scalars to match the output vector element type). If you want to widen the scalars, you have to widen the result as well. I agree legalizations should try to avoid changing the other types if possible, but for most operations I don't think it's avoidable. I was thinking we should maybe enforce this in these sorts of linked cases by only allowing one of the type indexes to be specified in a mutation. I've found it kind of annoying to have to figure out what the other type index needs to do in either case, and it would simplify code to only have to worry about one of them.

For the shift amount type, and bit count result type, I still think these are more of an "ask the target for what it wants to use" situation rather than a type index which should be subject to legalization

The legalizer is already done the way I'm talking about on the rule matching side and performance was marginally better on average than the old setAction() interface.

Got it.
That said, to me the legalizer is no different than ISel or a sort of InstCombine, thus I would expect we eventually use the same engine/automaton for selecting/lowering what goes through. The same goes with the way we represent them, although admittedly legalization is a bit more complicated because we have to come up with a way of representing the constraints on the unbound input types.

lib/CodeGen/GlobalISel/LegalizerHelper.cpp
756	I agree legalizations should try to avoid changing the other types if possible, but for most operations I don't think it's avoidable. I agree this is unavoidable in some cases. What I have in mind is that we should somehow document this effect in the API, so that we can detect cycles and run verifier. I understand that doing all this manually is painful and we may not want to tackle that for now, however, long term, I believe we should TableGen most of the legalization transformation and generate checks along the way.

In D57243#1385543, @qcolombet wrote:

The legalizer is already done the way I'm talking about on the rule matching side and performance was marginally better on average than the old setAction() interface.

Got it.
That said, to me the legalizer is no different than ISel or a sort of InstCombine, thus I would expect we eventually use the same engine/automaton for selecting/lowering what goes through. The same goes with the way we represent them, although admittedly legalization is a bit more complicated because we have to come up with a way of representing the constraints on the unbound input types.

I'd agree with that. Though it's worth pointing out that none of those currently build a description of what it wants to do like the legalizer currently does, they just make the change straightaway when the rules match. Removing LegalizationAction in favour of just making the change brings the legalizer closer to the others.

In D57243#1385511, @qcolombet wrote:

Should we revert this change to have the conversation going or am I the only one unhappy with the absence of guarantees for the other operands?

I'm not happy with the current state either!

Though, maybe reverting is a bit of a hassle, there is already a follow-up committed later that fixes functional bugs in here (https://reviews.llvm.org/rL353102), it'll have to be reverted too. Maybe a follow up commit instead?

In general, I think we can continue figuring out what the contract needs to be, and adopt "don't change type indices that aren't explicitly requested to be changed unless it's impossible to do so w/o introducing broken MIR" as a guideline right away.

Also, it's just a gut feeling, so it could be complete nonsense as I didn't give it much thought, but I feel especially bad about the version that widens one type index and narrows the other one. At least just widening more than asked to strictly increases the entire type tuple (as in partial order). Skewing the type tuple like so on the other hand might be more loop-prone, I think.

Though it's worth pointing out that none of those currently build a description of what it wants to do like the legalizer currently does, they just make the change straightaway when the rules match. Removing LegalizationAction in favour of just making the change brings the legalizer closer to the others.

Agree. This kind of mode would only be used for debug purposes anyway (like with expensive_checks).

The type used in this case for the result has more to do with the type required for the operations that follow as part of the legalization. The G_SUB can be done in either width, but the narrower sub seems like a more preferable canonical form.

In D57243#1385704, @arsenm wrote:

The type used in this case for the result has more to do with the type required for the operations that follow as part of the legalization. The G_SUB can be done in either width, but the narrower sub seems like a more preferable canonical form.

That's a very good point. On the other hand, I think it's a general and expected behavior of the Legalizer to use truncates and extends to bridge the types. So it's possible to keep the result of the bit op itself as it is, truncate it if it's safe (due to the original narrow type of the source), and do the G_SUB of the truncated type.

Subsequent steps of the legalization, if they narrow the destination of the bit op itself, will eliminate that truncate as a legalization artifact. At the same time, having G_SUB of a narrow type generated in the process of widening something isn't much of a problem contract-wise or introducing-loops-wise because AFAIK the legalizer in general legalizes one instruction at a time based on the properties of that instruction only, so that G_SUB will be legalized later on just like any other G_SUB with no interference from the surrounding ops. That latter argument is not true when it's different operands (or type indices) of the same opcode specifically because of what we're discussing here.

Revision Contents

Path

Size

include/

llvm/

CodeGen/

GlobalISel/

LegalizerHelper.h

6 lines

Target/

GenericOpcodes.td

10 lines

lib/

CodeGen/

GlobalISel/

LegalizerHelper.cpp

31 lines

Target/

AMDGPU/

AMDGPULegalizerInfo.cpp

15 lines

ARM/

ARMLegalizerInfo.cpp

12 lines

test/

CodeGen/

AArch64/

GlobalISel/

legalizer-info-validation.mir

10 lines

AMDGPU/

GlobalISel/

legalize-ctlz-zero-undef.mir

88 lines

legalize-ctlz.mir

88 lines

legalize-ctpop.mir

88 lines

legalize-cttz-zero-undef.mir

88 lines

legalize-cttz.mir

88 lines

unittests/

CodeGen/

GlobalISel/

LegalizerHelperTest.cpp

80 lines

Diff 183554

include/llvm/CodeGen/GlobalISel/LegalizerHelper.h

Show First 20 Lines • Show All 108 Lines • ▼ Show 20 Lines	private:
void narrowScalarSrc(MachineInstr &MI, LLT NarrowTy, unsigned OpIdx);		void narrowScalarSrc(MachineInstr &MI, LLT NarrowTy, unsigned OpIdx);

/// Legalize a single operand \p OpIdx of the machine instruction \p MI as a		/// Legalize a single operand \p OpIdx of the machine instruction \p MI as a
/// Def by extending the operand's type to \p WideTy and truncating it back		/// Def by extending the operand's type to \p WideTy and truncating it back
/// with the \p TruncOpcode, and replacing the vreg of the operand in place.		/// with the \p TruncOpcode, and replacing the vreg of the operand in place.
void widenScalarDst(MachineInstr &MI, LLT WideTy, unsigned OpIdx = 0,		void widenScalarDst(MachineInstr &MI, LLT WideTy, unsigned OpIdx = 0,
unsigned TruncOpcode = TargetOpcode::G_TRUNC);		unsigned TruncOpcode = TargetOpcode::G_TRUNC);

		// Legalize a single operand \p OpIdx of the machine instruction \p MI as a
		// Def by truncating the operand's type to \p NarrowTy, replacing in place and
		// extending back with \p ExtOpcode.
		void narrowScalarDst(MachineInstr &MI, LLT NarrowTy, unsigned OpIdx,
		unsigned ExtOpcode);

/// Helper function to split a wide generic register into bitwise blocks with		/// Helper function to split a wide generic register into bitwise blocks with
/// the given Type (which implies the number of blocks needed). The generic		/// the given Type (which implies the number of blocks needed). The generic
/// registers created are appended to Ops, starting at bit 0 of Reg.		/// registers created are appended to Ops, starting at bit 0 of Reg.
void extractParts(unsigned Reg, LLT Ty, int NumParts,		void extractParts(unsigned Reg, LLT Ty, int NumParts,
SmallVectorImpl<unsigned> &VRegs);		SmallVectorImpl<unsigned> &VRegs);

LegalizeResult fewerElementsVectorCasts(MachineInstr &MI, unsigned TypeIdx,		LegalizeResult fewerElementsVectorCasts(MachineInstr &MI, unsigned TypeIdx,
LLT NarrowTy);		LLT NarrowTy);
Show All 20 Lines

include/llvm/Target/GenericOpcodes.td

Show First 20 Lines • Show All 117 Lines • ▼ Show 20 Lines	def G_VAARG : GenericInstruction {
let InOperandList = (ins type1:$list, unknown:$align);		let InOperandList = (ins type1:$list, unknown:$align);
let hasSideEffects = 0;		let hasSideEffects = 0;
let mayLoad = 1;		let mayLoad = 1;
let mayStore = 1;		let mayStore = 1;
}		}

def G_CTLZ : GenericInstruction {		def G_CTLZ : GenericInstruction {
let OutOperandList = (outs type0:$dst);		let OutOperandList = (outs type0:$dst);
let InOperandList = (ins type0:$src);		let InOperandList = (ins type1:$src);
let hasSideEffects = 0;		let hasSideEffects = 0;
}		}

def G_CTLZ_ZERO_UNDEF : GenericInstruction {		def G_CTLZ_ZERO_UNDEF : GenericInstruction {
let OutOperandList = (outs type0:$dst);		let OutOperandList = (outs type0:$dst);
let InOperandList = (ins type0:$src);		let InOperandList = (ins type1:$src);
let hasSideEffects = 0;		let hasSideEffects = 0;
}		}

def G_CTTZ : GenericInstruction {		def G_CTTZ : GenericInstruction {
let OutOperandList = (outs type0:$dst);		let OutOperandList = (outs type0:$dst);
let InOperandList = (ins type0:$src);		let InOperandList = (ins type1:$src);
let hasSideEffects = 0;		let hasSideEffects = 0;
}		}

def G_CTTZ_ZERO_UNDEF : GenericInstruction {		def G_CTTZ_ZERO_UNDEF : GenericInstruction {
let OutOperandList = (outs type0:$dst);		let OutOperandList = (outs type0:$dst);
let InOperandList = (ins type0:$src);		let InOperandList = (ins type1:$src);
let hasSideEffects = 0;		let hasSideEffects = 0;
}		}

def G_CTPOP : GenericInstruction {		def G_CTPOP : GenericInstruction {
let OutOperandList = (outs type0:$dst);		let OutOperandList = (outs type0:$dst);
let InOperandList = (ins type0:$src);		let InOperandList = (ins type1:$src);
let hasSideEffects = 0;		let hasSideEffects = 0;
}		}

def G_BSWAP : GenericInstruction {		def G_BSWAP : GenericInstruction {
let OutOperandList = (outs type0:$dst);		let OutOperandList = (outs type0:$dst);
let InOperandList = (ins type0:$src);		let InOperandList = (ins type0:$src);
let hasSideEffects = 0;		let hasSideEffects = 0;
}		}
▲ Show 20 Lines • Show All 632 Lines • Show Last 20 Lines

lib/CodeGen/GlobalISel/LegalizerHelper.cpp

Show First 20 Lines • Show All 661 Lines • ▼ Show 20 Lines	LegalizerHelper::LegalizeResult LegalizerHelper::narrowScalar(MachineInstr &MI,
case TargetOpcode::G_SHL:		case TargetOpcode::G_SHL:
case TargetOpcode::G_LSHR:		case TargetOpcode::G_LSHR:
case TargetOpcode::G_ASHR: {		case TargetOpcode::G_ASHR: {
if (TypeIdx != 1)		if (TypeIdx != 1)
return UnableToLegalize; // TODO		return UnableToLegalize; // TODO
narrowScalarSrc(MI, NarrowTy, 2);		narrowScalarSrc(MI, NarrowTy, 2);
return Legalized;		return Legalized;
}		}
		case TargetOpcode::G_CTLZ:
		case TargetOpcode::G_CTLZ_ZERO_UNDEF:
		case TargetOpcode::G_CTTZ:
		case TargetOpcode::G_CTTZ_ZERO_UNDEF:
		case TargetOpcode::G_CTPOP:
		if (TypeIdx != 0)
		return UnableToLegalize; // TODO
		narrowScalarDst(MI, NarrowTy, 0, TargetOpcode::G_ZEXT);
		return Legalized;
}		}
}		}

void LegalizerHelper::widenScalarSrc(MachineInstr &MI, LLT WideTy,		void LegalizerHelper::widenScalarSrc(MachineInstr &MI, LLT WideTy,
unsigned OpIdx, unsigned ExtOpcode) {		unsigned OpIdx, unsigned ExtOpcode) {
MachineOperand &MO = MI.getOperand(OpIdx);		MachineOperand &MO = MI.getOperand(OpIdx);
auto ExtB = MIRBuilder.buildInstr(ExtOpcode, {WideTy}, {MO.getReg()});		auto ExtB = MIRBuilder.buildInstr(ExtOpcode, {WideTy}, {MO.getReg()});
MO.setReg(ExtB->getOperand(0).getReg());		MO.setReg(ExtB->getOperand(0).getReg());
Show All 11 Lines	void LegalizerHelper::widenScalarDst(MachineInstr &MI, LLT WideTy,
unsigned OpIdx, unsigned TruncOpcode) {		unsigned OpIdx, unsigned TruncOpcode) {
MachineOperand &MO = MI.getOperand(OpIdx);		MachineOperand &MO = MI.getOperand(OpIdx);
unsigned DstExt = MRI.createGenericVirtualRegister(WideTy);		unsigned DstExt = MRI.createGenericVirtualRegister(WideTy);
MIRBuilder.setInsertPt(MIRBuilder.getMBB(), ++MIRBuilder.getInsertPt());		MIRBuilder.setInsertPt(MIRBuilder.getMBB(), ++MIRBuilder.getInsertPt());
MIRBuilder.buildInstr(TruncOpcode, {MO.getReg()}, {DstExt});		MIRBuilder.buildInstr(TruncOpcode, {MO.getReg()}, {DstExt});
MO.setReg(DstExt);		MO.setReg(DstExt);
}		}

		void LegalizerHelper::narrowScalarDst(MachineInstr &MI, LLT NarrowTy,
		unsigned OpIdx, unsigned ExtOpcode) {
		MachineOperand &MO = MI.getOperand(OpIdx);
		unsigned DstTrunc = MRI.createGenericVirtualRegister(NarrowTy);
		MIRBuilder.setInsertPt(MIRBuilder.getMBB(), ++MIRBuilder.getInsertPt());
		MIRBuilder.buildInstr(ExtOpcode, {MO.getReg()}, {DstTrunc});
		MO.setReg(DstTrunc);
		}

LegalizerHelper::LegalizeResult		LegalizerHelper::LegalizeResult
LegalizerHelper::widenScalar(MachineInstr &MI, unsigned TypeIdx, LLT WideTy) {		LegalizerHelper::widenScalar(MachineInstr &MI, unsigned TypeIdx, LLT WideTy) {
MIRBuilder.setInstr(MI);		MIRBuilder.setInstr(MI);

switch (MI.getOpcode()) {		switch (MI.getOpcode()) {
default:		default:
return UnableToLegalize;		return UnableToLegalize;
case TargetOpcode::G_UADDO:		case TargetOpcode::G_UADDO:
Show All 22 Lines	case TargetOpcode::G_USUBO: {
MI.eraseFromParent();		MI.eraseFromParent();
return Legalized;		return Legalized;
}		}
case TargetOpcode::G_CTTZ:		case TargetOpcode::G_CTTZ:
case TargetOpcode::G_CTTZ_ZERO_UNDEF:		case TargetOpcode::G_CTTZ_ZERO_UNDEF:
case TargetOpcode::G_CTLZ:		case TargetOpcode::G_CTLZ:
case TargetOpcode::G_CTLZ_ZERO_UNDEF:		case TargetOpcode::G_CTLZ_ZERO_UNDEF:
case TargetOpcode::G_CTPOP: {		case TargetOpcode::G_CTPOP: {
		if (TypeIdx == 0) {
		widenScalarDst(MI, WideTy, 0);
		return Legalized;
		}
		rtereshinUnsubmitted Not Done Reply Inline Actions Hi Matt @arsenm, Looks like adding `widenScalarDst` call for type index 0 is not enough to adjust the widening to the new type constraints in full. All the code below it that now would handle type index 1 widening appears to be written under the assumption that destination and source types are the same, and it widens both, source and the destination. It was perfectly fine an assumption before, but not anymore. If the source needs to be widened, it generates incorrect code. Here's a unit test that reproduces one of the possible issues (thanks Aditya @aditya_nandakumar for coming up with it!): diff --git a/unittests/CodeGen/GlobalISel/LegalizerHelperTest.cpp b/unittests/CodeGen/GlobalISel/LegalizerHelperTest.cpp index 815f1e3d321..a5798693c08 100644 --- a/unittests/CodeGen/GlobalISel/LegalizerHelperTest.cpp +++ b/unittests/CodeGen/GlobalISel/LegalizerHelperTest.cpp @@ -341,6 +341,31 @@ TEST_F(GISelMITest, WidenBitCountingCTPOP) { EXPECT_TRUE(CheckMachineFunction(MF, CheckStr)) << MF; } +// CTPOP widening. +TEST_F(GISelMITest, WidenBitCountingCTPOP1) { + if (!TM) + return; + + // Declare your legalization info + DefineLegalizerInfo(A, { + getActionDefinitionsBuilder(G_CTPOP).legalFor({{s16, s16}}); + }); + // Build + // Trunc it to s8. + LLT s8{LLT::scalar(8)}; + LLT s16{LLT::scalar(16)}; + auto MIBTrunc = B.buildTrunc(s8, Copies[0]); + auto MIBCTPOP = B.buildInstr(TargetOpcode::G_CTPOP, {s16}, {MIBTrunc}); + AInfo Info(MF->getSubtarget()); + DummyGISelObserver Observer; + LegalizerHelper Helper(MF, Info, Observer, B); + EXPECT_TRUE(Helper.widenScalar(MIBCTPOP, 1, s16) == + LegalizerHelper::LegalizeResult::Legalized); + + + MF->dump(); +} + // CTTZ_ZERO_UNDEF widening. TEST_F(GISelMITest, WidenBitCountingCTTZ_ZERO_UNDEF) { if (!TM) Could you please take a look at this? rtereshin: Hi Matt @arsenm, Looks like adding `widenScalarDst` call for type index 0 is not enough to…
		arsenmAuthorUnsubmitted Done Reply Inline Actions Try r353102 arsenm: Try r353102
		rtereshinUnsubmitted Not Done Reply Inline Actions Hi Matt, That's much better, thank you! I feel a little bit divided though about the fact that in some cases widening one type index ends up changing the type of the other type index. For instance, in this case widening type index 1 ends up also widening type index 0: // CTLZ widening. TEST_F(GISelMITest, WidenBitCountingCTLZ) { if (!TM) return; // Declare your legalization info DefineLegalizerInfo(A, { getActionDefinitionsBuilder(G_CTLZ).legalFor({{s16, s16}}); }); // Build // Trunc it to s8. LLT s8{LLT::scalar(8)}; LLT s16{LLT::scalar(16)}; auto MIBTrunc = B.buildTrunc(s8, Copies[0]); auto MIBCTLZ = B.buildInstr(TargetOpcode::G_CTLZ, {s8}, {MIBTrunc}); // We start with the type signature {s8, s8} AInfo Info(MF->getSubtarget()); DummyGISelObserver Observer; LegalizerHelper Helper(MF, Info, Observer, B); EXPECT_TRUE(Helper.widenScalar(MIBCTLZ, 1, s16) == // We ask the API to widen type index 1 to s16, probably expecting type signature {s8, s16} as a result LegalizerHelper::LegalizeResult::Legalized); auto CheckStr = R"( CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC CHECK: [[Zext:%[0-9]+]]:_(s16) = G_ZEXT [[Trunc]] CHECK: [[Ctlz:%[0-9]+]]:_(s16) = G_CTLZ [[Zext]] # The API ends up widening not just type index 1, but also type index 0 with the resulting {s16, s16} type signature CHECK: [[Cst8:%[0-9]+]]:_(s16) = G_CONSTANT i16 8 CHECK: [[Sub:%[0-9]+]]:_(s16) = G_SUB [[Ctlz]]:_, [[Cst8]]:_ CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC [[Sub]] )"; // Check EXPECT_TRUE(CheckMachineFunction(MF, CheckStr)) << MF; } In this other case widening type index 1 ends up also narrowing type index 0: // Test a strange case where the result is wider than the source TEST_F(GISelMITest, WidenBitCountingCTPOP2) { if (!TM) return; // Declare your legalization info DefineLegalizerInfo(A, { getActionDefinitionsBuilder(G_CTPOP).legalFor({{s32, s16}}); }); // Build // Trunc it to s8. 
LLT s8{LLT::scalar(8)}; LLT s16{LLT::scalar(16)}; LLT s32{LLT::scalar(32)}; auto MIBTrunc = B.buildTrunc(s8, Copies[0]); auto MIBCTPOP = B.buildInstr(TargetOpcode::G_CTPOP, {s32}, {MIBTrunc}); // We start with type signature {s32, s8} AInfo Info(MF->getSubtarget()); DummyGISelObserver Observer; LegalizerHelper Helper(MF, Info, Observer, B); EXPECT_EQ(LegalizerHelper::LegalizeResult::Legalized, // We ask the API to widen type index 1 to s16, probably expecting {s32, s16} as a result Helper.widenScalar(MIBCTPOP, 1, s16)); auto CheckStr = R"( CHECK: [[TRUNC:%[0-9]+]]:_(s8) = G_TRUNC %0:_(s64) CHECK: [[ZEXT:%[0-9]+]]:_(s16) = G_ZEXT [[TRUNC]]:_(s8) CHECK: [[CTPOP:%[0-9]+]]:_(s16) = G_CTPOP [[ZEXT]] # API ends up narrowing the type index 0 in the process with {s16, s16} type signature as a result. CHECK: [[COPY:%[0-9]+]]:_(s32) = G_ZEXT [[CTPOP]]:_(s16) )"; EXPECT_TRUE(CheckMachineFunction(MF, CheckStr)) << MF; } I talked to @aditya_nandakumar, @volkan, and @qcolombet offline and it appears that we don't have any contract about what pre-defined operations like widenScalar, narrowScalar etc. are allowed to do with the type indices not included in the request, but I think it maybe worth introducing such a contract. Specifically the one that would state that it's guaranteed that these generic, pre-defined operations aren't allowed to change the types of the type indices except the one(s) explicitly included in the request. I think not having these operations following such a contract makes their behavior quite unexpected for anyone who focuses on writing legalizations rules for their target w/o having an extensive knowledge about how exactly the implementation of the pre-defined API-provided operations looks like. In particular, I think it might make it easier for the users to accidentally introduce loops in legalization rules, and harder for them to understand where they are coming from. Please let me know what do you think! 
Thanks, Roman rtereshin: Hi Matt, That's much better, thank you! I feel a little bit divided though about the fact…
		arsenmAuthorUnsubmitted Done Reply Inline Actions In general I don't think it's possible to avoid changing other type indexes. For example, FewerElements for a select's condition type requires doing the same FewerElements for the select type. The same applies for any vector cast. The two type indexes won't match, but they still need to have the same number of elements. I don't think these examples actually show this though. Note that these examples aren't producing the fully legalized operation. They're only doing one step, but need at least one more to legalize the operation. arsenm: In general I don't think it's possible to avoid changing other type indexes. For…
		arsenmAuthorUnsubmitted Done Reply Inline Actions A bigger problem I have is that the order of legalization steps matters. The intermediate operations will be done in a different type if you specify the legalize actions for type index 1 before 0 vs. the other way around. You wouldn't see the new operation with the narrower type if you legalized in the other order. arsenm: A bigger problem I have is that the order of legalization steps matters. The intermediate operations…
		rtereshinUnsubmitted Not Done Reply Inline Actions A bigger problem I have is the order of legalization steps matters. The intermediate operations will be done in a different type if you specify the legalize actions for type index 1 before 0 vs. the other wya around. You wouldn't see the new operation with the narrower type if you legalized in the other order That's a very good point! rtereshin: > A bigger problem I have is the order of legalization steps matters. The intermediate…
		qcolombetUnsubmitted Not Done Reply Inline Actions For example, FewerElements for a select's condition type requires doing the same FewerElements for the select type. The same applies for any vector cast. The two type indexes won't match, but they still need to have the same number of elements. That's a good example, but that doesn't mean we shouldn't come up with some kind of contract. The thing I am after is a way to tell if we are creating loops in our legalization rules. I haven't thought about whether this is practical, but we could imagine that the contract is that we don't change the element type of the other operands. The number of elements can change but in a reasonable way (at least for the generic code, custom legalization does what it wants). What do you think? qcolombet: > For example, FewerElements for a select's condition type requires doing the same…
		arsenmAuthorUnsubmitted Done Reply Inline Actions I guess it depends what you mean by changing the other types. In this case with these, this is really expanding the operation which happens to involve a new instance of the same operation in the requested narrowed type. Other operations really have type constraints not expressed in the simple, independent type index list (like build_vector requiring the input scalars to match the output vector element type). If you want to widen the scalars, you have to widen the result as well. I agree legalizations should try to avoid changing the other types if possible, but for most operations I don't think it's avoidable. I was thinking we should maybe enforce this in these sorts of linked cases by only allowing one of the type indexes to be specified in a mutation. I've found it kind of annoying to have to figure out what the other type index needs to do in either case, and it would simplify code to only have to worry about one of them. arsenm: I guess it depends what you mean by changing the other types. In this case with these, this is…
		qcolombetUnsubmitted Not Done Reply Inline Actions I agree legalizations should try to avoid changing the other types if possible, but for most operations I don't think it's avoidable. I agree this is unavoidable in some cases. What I have in mind is that we should somehow document this effect in the API, so that we can detect cycles and run the verifier. I understand that doing all this manually is painful and we may not want to tackle that for now; however, long term, I believe we should TableGen most of the legalization transformations and generate checks along the way. qcolombet: > I agree legalizations should try to avoid changing the other types if possible, but for most…
		dsandersUnsubmitted Not Done Reply Inline Actions I agree that the types should generally be modified independently. Not following that makes it fairly easy to get into infinite loops where one type is too big and one is too small. However... There are some difficulties with such a rule though (at least with the current definitions of operations). Suppose you have: %dst:(s4) = G_EXTRACT %src:(s16), %idx:s32 and the legalizer is told to widen %dst to s32. G_EXTRACT currently expects all the result bits to originate from the input which isn't possible if the input stays fixed at s16. Arguably, G_EXTRACT should have a size operand anyway at which point we can treat the excess bits as an any-extension. There are also some performance costs to such a rule as it increases the number of hops needed to get from illegal to legal. I generally think targets should be allowed to leap directly to the right answer whenever possible. From that point of view, the limitation that we can only specify one index and type as the target for a legalization step is a bit of a nuisance. Personally, I'd like to replace the LegalizationAction with a function pointer that just performs the desired change and have a standard library of actions that can be called for the common changes. This also has the nice side-benefit of removing the Custom action and the limitations that it has (the opcode must always be changed to something that is Legal rather than Custom). dsanders: I agree that the types should generally be modified independently. Not following that…

// First ZEXT the input.		// First ZEXT the input.
auto MIBSrc = MIRBuilder.buildZExt(WideTy, MI.getOperand(1).getReg());		auto MIBSrc = MIRBuilder.buildZExt(WideTy, MI.getOperand(1).getReg());
LLT CurTy = MRI.getType(MI.getOperand(0).getReg());		LLT CurTy = MRI.getType(MI.getOperand(0).getReg());
if (MI.getOpcode() == TargetOpcode::G_CTTZ) {		if (MI.getOpcode() == TargetOpcode::G_CTTZ) {
// The count is the same in the larger type except if the original		// The count is the same in the larger type except if the original
// value was zero. This can be handled by setting the bit just off		// value was zero. This can be handled by setting the bit just off
// the top of the original type.		// the top of the original type.
auto TopBit =		auto TopBit =
▲ Show 20 Lines • Show All 794 Lines • ▼ Show 20 Lines	case TargetOpcode::G_CTLZ_ZERO_UNDEF: {
Observer.changingInstr(MI);		Observer.changingInstr(MI);
MI.setDesc(TII.get(TargetOpcode::G_CTLZ));		MI.setDesc(TII.get(TargetOpcode::G_CTLZ));
Observer.changedInstr(MI);		Observer.changedInstr(MI);
return Legalized;		return Legalized;
}		}
case TargetOpcode::G_CTLZ: {		case TargetOpcode::G_CTLZ: {
unsigned SrcReg = MI.getOperand(1).getReg();		unsigned SrcReg = MI.getOperand(1).getReg();
unsigned Len = Ty.getSizeInBits();		unsigned Len = Ty.getSizeInBits();
if (isSupported({TargetOpcode::G_CTLZ_ZERO_UNDEF, {Ty}})) {		if (isSupported({TargetOpcode::G_CTLZ_ZERO_UNDEF, {Ty, Ty}})) {
// If CTLZ_ZERO_UNDEF is supported, emit that and a select for zero.		// If CTLZ_ZERO_UNDEF is supported, emit that and a select for zero.
auto MIBCtlzZU = MIRBuilder.buildInstr(TargetOpcode::G_CTLZ_ZERO_UNDEF,		auto MIBCtlzZU = MIRBuilder.buildInstr(TargetOpcode::G_CTLZ_ZERO_UNDEF,
{Ty}, {SrcReg});		{Ty}, {SrcReg});
auto MIBZero = MIRBuilder.buildConstant(Ty, 0);		auto MIBZero = MIRBuilder.buildConstant(Ty, 0);
auto MIBLen = MIRBuilder.buildConstant(Ty, Len);		auto MIBLen = MIRBuilder.buildConstant(Ty, Len);
auto MIBICmp = MIRBuilder.buildICmp(CmpInst::ICMP_EQ, LLT::scalar(1),		auto MIBICmp = MIRBuilder.buildICmp(CmpInst::ICMP_EQ, LLT::scalar(1),
SrcReg, MIBZero);		SrcReg, MIBZero);
MIRBuilder.buildSelect(MI.getOperand(0).getReg(), MIBICmp, MIBLen,		MIRBuilder.buildSelect(MI.getOperand(0).getReg(), MIBICmp, MIBLen,
Show All 33 Lines	case TargetOpcode::G_CTTZ_ZERO_UNDEF: {
Observer.changingInstr(MI);		Observer.changingInstr(MI);
MI.setDesc(TII.get(TargetOpcode::G_CTTZ));		MI.setDesc(TII.get(TargetOpcode::G_CTTZ));
Observer.changedInstr(MI);		Observer.changedInstr(MI);
return Legalized;		return Legalized;
}		}
case TargetOpcode::G_CTTZ: {		case TargetOpcode::G_CTTZ: {
unsigned SrcReg = MI.getOperand(1).getReg();		unsigned SrcReg = MI.getOperand(1).getReg();
unsigned Len = Ty.getSizeInBits();		unsigned Len = Ty.getSizeInBits();
if (isSupported({TargetOpcode::G_CTTZ_ZERO_UNDEF, {Ty}})) {		if (isSupported({TargetOpcode::G_CTTZ_ZERO_UNDEF, {Ty, Ty}})) {
// If CTTZ_ZERO_UNDEF is legal or custom, emit that and a select with		// If CTTZ_ZERO_UNDEF is legal or custom, emit that and a select with
// zero.		// zero.
auto MIBCttzZU = MIRBuilder.buildInstr(TargetOpcode::G_CTTZ_ZERO_UNDEF,		auto MIBCttzZU = MIRBuilder.buildInstr(TargetOpcode::G_CTTZ_ZERO_UNDEF,
{Ty}, {SrcReg});		{Ty}, {SrcReg});
auto MIBZero = MIRBuilder.buildConstant(Ty, 0);		auto MIBZero = MIRBuilder.buildConstant(Ty, 0);
auto MIBLen = MIRBuilder.buildConstant(Ty, Len);		auto MIBLen = MIRBuilder.buildConstant(Ty, Len);
auto MIBICmp = MIRBuilder.buildICmp(CmpInst::ICMP_EQ, LLT::scalar(1),		auto MIBICmp = MIRBuilder.buildICmp(CmpInst::ICMP_EQ, LLT::scalar(1),
SrcReg, MIBZero);		SrcReg, MIBZero);
MIRBuilder.buildSelect(MI.getOperand(0).getReg(), MIBICmp, MIBLen,		MIRBuilder.buildSelect(MI.getOperand(0).getReg(), MIBICmp, MIBLen,
MIBCttzZU);		MIBCttzZU);
MI.eraseFromParent();		MI.eraseFromParent();
return Legalized;		return Legalized;
}		}
// for now, we use: { return popcount(~x & (x - 1)); }		// for now, we use: { return popcount(~x & (x - 1)); }
// unless the target has ctlz but not ctpop, in which case we use:		// unless the target has ctlz but not ctpop, in which case we use:
// { return 32 - nlz(~x & (x-1)); }		// { return 32 - nlz(~x & (x-1)); }
// Ref: "Hacker's Delight" by Henry Warren		// Ref: "Hacker's Delight" by Henry Warren
auto MIBCstNeg1 = MIRBuilder.buildConstant(Ty, -1);		auto MIBCstNeg1 = MIRBuilder.buildConstant(Ty, -1);
auto MIBNot =		auto MIBNot =
MIRBuilder.buildInstr(TargetOpcode::G_XOR, {Ty}, {SrcReg, MIBCstNeg1});		MIRBuilder.buildInstr(TargetOpcode::G_XOR, {Ty}, {SrcReg, MIBCstNeg1});
auto MIBTmp = MIRBuilder.buildInstr(		auto MIBTmp = MIRBuilder.buildInstr(
TargetOpcode::G_AND, {Ty},		TargetOpcode::G_AND, {Ty},
{MIBNot, MIRBuilder.buildInstr(TargetOpcode::G_ADD, {Ty},		{MIBNot, MIRBuilder.buildInstr(TargetOpcode::G_ADD, {Ty},
{SrcReg, MIBCstNeg1})});		{SrcReg, MIBCstNeg1})});
if (!isSupported({TargetOpcode::G_CTPOP, {Ty}}) &&		if (!isSupported({TargetOpcode::G_CTPOP, {Ty, Ty}}) &&
isSupported({TargetOpcode::G_CTLZ, {Ty}})) {		isSupported({TargetOpcode::G_CTLZ, {Ty, Ty}})) {
auto MIBCstLen = MIRBuilder.buildConstant(Ty, Len);		auto MIBCstLen = MIRBuilder.buildConstant(Ty, Len);
MIRBuilder.buildInstr(		MIRBuilder.buildInstr(
TargetOpcode::G_SUB, {MI.getOperand(0).getReg()},		TargetOpcode::G_SUB, {MI.getOperand(0).getReg()},
{MIBCstLen,		{MIBCstLen,
MIRBuilder.buildInstr(TargetOpcode::G_CTLZ, {Ty}, {MIBTmp})});		MIRBuilder.buildInstr(TargetOpcode::G_CTLZ, {Ty}, {MIBTmp})});
MI.eraseFromParent();		MI.eraseFromParent();
return Legalized;		return Legalized;
}		}
MI.setDesc(TII.get(TargetOpcode::G_CTPOP));		MI.setDesc(TII.get(TargetOpcode::G_CTPOP));
MI.getOperand(1).setReg(MIBTmp->getOperand(0).getReg());		MI.getOperand(1).setReg(MIBTmp->getOperand(0).getReg());
return Legalized;		return Legalized;
}		}
}		}
}		}

lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp

Show First 20 Lines • Show All 200 Lines • ▼ Show 20 Lines	getActionDefinitionsBuilder({G_ICMP, G_FCMP})
.clampMaxNumElements(1, S32, 1);		.clampMaxNumElements(1, S32, 1);

// FIXME: fexp, flog2, flog10 needs to be custom lowered.		// FIXME: fexp, flog2, flog10 needs to be custom lowered.
getActionDefinitionsBuilder({G_FPOW, G_FEXP, G_FEXP2,		getActionDefinitionsBuilder({G_FPOW, G_FEXP, G_FEXP2,
G_FLOG, G_FLOG2, G_FLOG10})		G_FLOG, G_FLOG2, G_FLOG10})
.legalFor({S32})		.legalFor({S32})
.scalarize(0);		.scalarize(0);

setAction({G_CTLZ, S32}, Legal);		// The 64-bit versions produce 32-bit results, but only on the SALU.
setAction({G_CTLZ_ZERO_UNDEF, S32}, Legal);		getActionDefinitionsBuilder({G_CTLZ, G_CTLZ_ZERO_UNDEF,
setAction({G_CTTZ, S32}, Legal);		G_CTTZ, G_CTTZ_ZERO_UNDEF,
setAction({G_CTTZ_ZERO_UNDEF, S32}, Legal);		G_CTPOP})
		.legalFor({{S32, S32}, {S32, S64}})
		.clampScalar(0, S32, S32)
		.clampScalar(1, S32, S64);
		// TODO: Scalarize


setAction({G_BSWAP, S32}, Legal);		setAction({G_BSWAP, S32}, Legal);
setAction({G_CTPOP, S32}, Legal);

getActionDefinitionsBuilder(G_INTTOPTR)		getActionDefinitionsBuilder(G_INTTOPTR)
.legalIf([](const LegalityQuery &Query) {		.legalIf([](const LegalityQuery &Query) {
return true;		return true;
});		});

getActionDefinitionsBuilder(G_PTRTOINT)		getActionDefinitionsBuilder(G_PTRTOINT)
.legalIf([](const LegalityQuery &Query) {		.legalIf([](const LegalityQuery &Query) {
▲ Show 20 Lines • Show All 198 Lines • Show Last 20 Lines

lib/Target/ARM/ARMLegalizerInfo.cpp

Show First 20 Lines • Show All 138 Lines • ▼ Show 20 Lines	ARMLegalizerInfo::ARMLegalizerInfo(const ARMSubtarget &ST) {
getActionDefinitionsBuilder(G_PTRTOINT).legalFor({{s32, p0}});		getActionDefinitionsBuilder(G_PTRTOINT).legalFor({{s32, p0}});

getActionDefinitionsBuilder({G_ASHR, G_LSHR, G_SHL})		getActionDefinitionsBuilder({G_ASHR, G_LSHR, G_SHL})
.legalFor({{s32, s32}})		.legalFor({{s32, s32}})
.clampScalar(1, s32, s32);		.clampScalar(1, s32, s32);

if (ST.hasV5TOps()) {		if (ST.hasV5TOps()) {
getActionDefinitionsBuilder(G_CTLZ)		getActionDefinitionsBuilder(G_CTLZ)
.legalFor({s32})		.legalFor({s32, s32})
		.clampScalar(1, s32, s32)
.clampScalar(0, s32, s32);		.clampScalar(0, s32, s32);
getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF)		getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF)
.lowerFor({s32})		.lowerFor({s32, s32})
		.clampScalar(1, s32, s32)
.clampScalar(0, s32, s32);		.clampScalar(0, s32, s32);
} else {		} else {
getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF)		getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF)
.libcallFor({s32})		.libcallFor({s32, s32})
		.clampScalar(1, s32, s32)
.clampScalar(0, s32, s32);		.clampScalar(0, s32, s32);
getActionDefinitionsBuilder(G_CTLZ)		getActionDefinitionsBuilder(G_CTLZ)
.lowerFor({s32})		.lowerFor({s32, s32})
		.clampScalar(1, s32, s32)
.clampScalar(0, s32, s32);		.clampScalar(0, s32, s32);
}		}

getActionDefinitionsBuilder(G_GEP).legalFor({{p0, s32}});		getActionDefinitionsBuilder(G_GEP).legalFor({{p0, s32}});

getActionDefinitionsBuilder(G_SELECT).legalForCartesianProduct({s32, p0},		getActionDefinitionsBuilder(G_SELECT).legalForCartesianProduct({s32, p0},
{s1});		{s1});

▲ Show 20 Lines • Show All 299 Lines • Show Last 20 Lines

test/CodeGen/AArch64/GlobalISel/legalizer-info-validation.mir

	Show First 20 Lines • Show All 306 Lines • ▼ Show 20 Lines
	# DEBUG: .. type index coverage check SKIPPED: no rules defined			# DEBUG: .. type index coverage check SKIPPED: no rules defined
	#			#
	# DEBUG-NEXT: G_EXTRACT_VECTOR_ELT (opcode {{[0-9]+}}): 3 type indices			# DEBUG-NEXT: G_EXTRACT_VECTOR_ELT (opcode {{[0-9]+}}): 3 type indices
	# DEBUG: .. type index coverage check SKIPPED: user-defined predicate detected			# DEBUG: .. type index coverage check SKIPPED: user-defined predicate detected
	#			#
	# DEBUG-NEXT: G_SHUFFLE_VECTOR (opcode {{[0-9]+}}): 3 type indices			# DEBUG-NEXT: G_SHUFFLE_VECTOR (opcode {{[0-9]+}}): 3 type indices
	# DEBUG: .. type index coverage check SKIPPED: no rules defined			# DEBUG: .. type index coverage check SKIPPED: no rules defined
	#			#
	# DEBUG-NEXT: G_CTTZ (opcode {{[0-9]+}}): 1 type index			# DEBUG-NEXT: G_CTTZ (opcode {{[0-9]+}}): 2 type indices
	# DEBUG: .. type index coverage check SKIPPED: no rules defined			# DEBUG: .. type index coverage check SKIPPED: no rules defined
	#			#
	# DEBUG-NEXT: G_CTTZ_ZERO_UNDEF (opcode {{[0-9]+}}): 1 type index			# DEBUG-NEXT: G_CTTZ_ZERO_UNDEF (opcode {{[0-9]+}}): 2 type indices
	# DEBUG: .. type index coverage check SKIPPED: no rules defined			# DEBUG: .. type index coverage check SKIPPED: no rules defined
	#			#
	# DEBUG-NEXT: G_CTLZ (opcode {{[0-9]+}}): 1 type index			# DEBUG-NEXT: G_CTLZ (opcode {{[0-9]+}}): 2 type indices
	# DEBUG: .. type index coverage check SKIPPED: no rules defined			# DEBUG: .. type index coverage check SKIPPED: no rules defined
	#			#
	# DEBUG-NEXT: G_CTLZ_ZERO_UNDEF (opcode {{[0-9]+}}): 1 type index			# DEBUG-NEXT: G_CTLZ_ZERO_UNDEF (opcode {{[0-9]+}}): 2 type indices
	# DEBUG: .. type index coverage check SKIPPED: no rules defined			# DEBUG: .. type index coverage check SKIPPED: no rules defined
	#			#
	# DEBUG-NEXT: G_CTPOP (opcode {{[0-9]+}}): 1 type index			# DEBUG-NEXT: G_CTPOP (opcode {{[0-9]+}}): 2 type indices
	# DEBUG: .. type index coverage check SKIPPED: no rules defined			# DEBUG: .. type index coverage check SKIPPED: no rules defined
	#			#
	# DEBUG-NEXT: G_BSWAP (opcode {{[0-9]+}}): 1 type index			# DEBUG-NEXT: G_BSWAP (opcode {{[0-9]+}}): 1 type index
	# DEBUG: .. the first uncovered type index: 1, OK			# DEBUG: .. the first uncovered type index: 1, OK
	#			#
	# DEBUG-NEXT: G_FCEIL (opcode {{[0-9]+}}): 1 type index			# DEBUG-NEXT: G_FCEIL (opcode {{[0-9]+}}): 1 type index
	# DEBUG: .. the first uncovered type index: 1, OK			# DEBUG: .. the first uncovered type index: 1, OK

	# CHECK-NOT: ill-defined			# CHECK-NOT: ill-defined

	---			---
	name: dummy			name: dummy
	body: \|			body: \|
	bb.0:			bb.0:
	...			...

test/CodeGen/AMDGPU/GlobalISel/legalize-ctlz-zero-undef.mir

This file was added.

				# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
				# RUN: llc -mtriple=amdgcn-mesa-mesa3d -mcpu=fiji -O0 -run-pass=legalizer %s -o - \| FileCheck %s

				---
				name: ctlz_zero_undef_s32_s32

				body: \|
				bb.0:
				liveins: $vgpr0
				; CHECK-LABEL: name: ctlz_zero_undef_s32_s32
				; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
				; CHECK: [[CTLZ_ZERO_UNDEF:%[0-9]+]]:_(s32) = G_CTLZ_ZERO_UNDEF [[COPY]](s32)
				; CHECK: $vgpr0 = COPY [[CTLZ_ZERO_UNDEF]](s32)
				%0:_(s32) = COPY $vgpr0
				%1:_(s32) = G_CTLZ_ZERO_UNDEF %0
				$vgpr0 = COPY %1
				...

				---
				name: ctlz_zero_undef_s32_s64

				body: \|
				bb.0:
				liveins: $vgpr0_vgpr1
				; CHECK-LABEL: name: ctlz_zero_undef_s32_s64
				; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $vgpr0_vgpr1
				; CHECK: [[CTLZ_ZERO_UNDEF:%[0-9]+]]:_(s32) = G_CTLZ_ZERO_UNDEF [[COPY]](s64)
				; CHECK: $vgpr0 = COPY [[CTLZ_ZERO_UNDEF]](s32)
				%0:_(s64) = COPY $vgpr0_vgpr1
				%1:_(s32) = G_CTLZ_ZERO_UNDEF %0
				$vgpr0 = COPY %1
				...

				---
				name: ctlz_zero_undef_s64_s64

				body: \|
				bb.0:
				liveins: $vgpr0_vgpr1
				; CHECK-LABEL: name: ctlz_zero_undef_s64_s64
				; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $vgpr0_vgpr1
				; CHECK: [[CTLZ_ZERO_UNDEF:%[0-9]+]]:_(s32) = G_CTLZ_ZERO_UNDEF [[COPY]](s64)
				; CHECK: [[ZEXT:%[0-9]+]]:_(s64) = G_ZEXT [[CTLZ_ZERO_UNDEF]](s32)
				; CHECK: $vgpr0_vgpr1 = COPY [[ZEXT]](s64)
				%0:_(s64) = COPY $vgpr0_vgpr1
				%1:_(s64) = G_CTLZ_ZERO_UNDEF %0
				$vgpr0_vgpr1 = COPY %1
				...

				---
				name: ctlz_zero_undef_s16_s32

				body: \|
				bb.0:
				liveins: $vgpr0
				; CHECK-LABEL: name: ctlz_zero_undef_s16_s32
				; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
				; CHECK: [[CTLZ_ZERO_UNDEF:%[0-9]+]]:_(s32) = G_CTLZ_ZERO_UNDEF [[COPY]](s32)
				; CHECK: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 65535
				; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[CTLZ_ZERO_UNDEF]](s32)
				; CHECK: [[AND:%[0-9]+]]:_(s32) = G_AND [[COPY1]], [[C]]
				; CHECK: $vgpr0 = COPY [[AND]](s32)
				%0:_(s32) = COPY $vgpr0
				%1:_(s16) = G_CTLZ_ZERO_UNDEF %0
				%2:_(s32) = G_ZEXT %1
				$vgpr0 = COPY %2
				...

				---
				name: ctlz_zero_undef_s16_s16

				body: \|
				bb.0:
				liveins: $vgpr0
				; CHECK-LABEL: name: ctlz_zero_undef_s16_s16
				; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
				; CHECK: [[TRUNC:%[0-9]+]]:_(s16) = G_TRUNC [[COPY]](s32)
				; CHECK: [[CTLZ_ZERO_UNDEF:%[0-9]+]]:_(s32) = G_CTLZ_ZERO_UNDEF [[TRUNC]](s16)
				; CHECK: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 65535
				; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[CTLZ_ZERO_UNDEF]](s32)
				; CHECK: [[AND:%[0-9]+]]:_(s32) = G_AND [[COPY1]], [[C]]
				; CHECK: $vgpr0 = COPY [[AND]](s32)
				%0:_(s32) = COPY $vgpr0
				%1:_(s16) = G_TRUNC %0
				%2:_(s16) = G_CTLZ_ZERO_UNDEF %1
				%3:_(s32) = G_ZEXT %2
				$vgpr0 = COPY %3
				...

test/CodeGen/AMDGPU/GlobalISel/legalize-ctlz.mir

This file was added.

				# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
				# RUN: llc -mtriple=amdgcn-mesa-mesa3d -mcpu=fiji -O0 -run-pass=legalizer %s -o - \| FileCheck %s

				---
				name: ctlz_s32_s32

				body: \|
				bb.0:
				liveins: $vgpr0
				; CHECK-LABEL: name: ctlz_s32_s32
				; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
				; CHECK: [[CTLZ:%[0-9]+]]:_(s32) = G_CTLZ [[COPY]](s32)
				; CHECK: $vgpr0 = COPY [[CTLZ]](s32)
				%0:_(s32) = COPY $vgpr0
				%1:_(s32) = G_CTLZ %0
				$vgpr0 = COPY %1
				...

				---
				name: ctlz_s32_s64

				body: \|
				bb.0:
				liveins: $vgpr0_vgpr1
				; CHECK-LABEL: name: ctlz_s32_s64
				; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $vgpr0_vgpr1
				; CHECK: [[CTLZ:%[0-9]+]]:_(s32) = G_CTLZ [[COPY]](s64)
				; CHECK: $vgpr0 = COPY [[CTLZ]](s32)
				%0:_(s64) = COPY $vgpr0_vgpr1
				%1:_(s32) = G_CTLZ %0
				$vgpr0 = COPY %1
				...

				---
				name: ctlz_s64_s64

				body: \|
				bb.0:
				liveins: $vgpr0_vgpr1
				; CHECK-LABEL: name: ctlz_s64_s64
				; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $vgpr0_vgpr1
				; CHECK: [[CTLZ:%[0-9]+]]:_(s32) = G_CTLZ [[COPY]](s64)
				; CHECK: [[ZEXT:%[0-9]+]]:_(s64) = G_ZEXT [[CTLZ]](s32)
				; CHECK: $vgpr0_vgpr1 = COPY [[ZEXT]](s64)
				%0:_(s64) = COPY $vgpr0_vgpr1
				%1:_(s64) = G_CTLZ %0
				$vgpr0_vgpr1 = COPY %1
				...

				---
				name: ctlz_s16_s32

				body: \|
				bb.0:
				liveins: $vgpr0
				; CHECK-LABEL: name: ctlz_s16_s32
				; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
				; CHECK: [[CTLZ:%[0-9]+]]:_(s32) = G_CTLZ [[COPY]](s32)
				; CHECK: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 65535
				; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[CTLZ]](s32)
				; CHECK: [[AND:%[0-9]+]]:_(s32) = G_AND [[COPY1]], [[C]]
				; CHECK: $vgpr0 = COPY [[AND]](s32)
				%0:_(s32) = COPY $vgpr0
				%1:_(s16) = G_CTLZ %0
				%2:_(s32) = G_ZEXT %1
				$vgpr0 = COPY %2
				...

				---
				name: ctlz_s16_s16

				body: \|
				bb.0:
				liveins: $vgpr0
				; CHECK-LABEL: name: ctlz_s16_s16
				; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
				; CHECK: [[TRUNC:%[0-9]+]]:_(s16) = G_TRUNC [[COPY]](s32)
				; CHECK: [[CTLZ:%[0-9]+]]:_(s32) = G_CTLZ [[TRUNC]](s16)
				rtereshinUnsubmitted Not Done Reply Inline Actions Is this really legal? rtereshin: Is this really legal?
				; CHECK: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 65535
				; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[CTLZ]](s32)
				; CHECK: [[AND:%[0-9]+]]:_(s32) = G_AND [[COPY1]], [[C]]
				; CHECK: $vgpr0 = COPY [[AND]](s32)
				%0:_(s32) = COPY $vgpr0
				%1:_(s16) = G_TRUNC %0
				%2:_(s16) = G_CTLZ %1
				%3:_(s32) = G_ZEXT %2
				$vgpr0 = COPY %3
				...

test/CodeGen/AMDGPU/GlobalISel/legalize-ctpop.mir

This file was added.

				# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
				# RUN: llc -mtriple=amdgcn-mesa-mesa3d -mcpu=fiji -O0 -run-pass=legalizer %s -o - \| FileCheck %s

				---
				name: ctpop_s32_s32

				body: \|
				bb.0:
				liveins: $vgpr0
				; CHECK-LABEL: name: ctpop_s32_s32
				; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
				; CHECK: [[CTPOP:%[0-9]+]]:_(s32) = G_CTPOP [[COPY]](s32)
				; CHECK: $vgpr0 = COPY [[CTPOP]](s32)
				%0:_(s32) = COPY $vgpr0
				%1:_(s32) = G_CTPOP %0
				$vgpr0 = COPY %1
				...

				---
				name: ctpop_s32_s64

				body: \|
				bb.0:
				liveins: $vgpr0_vgpr1
				; CHECK-LABEL: name: ctpop_s32_s64
				; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $vgpr0_vgpr1
				; CHECK: [[CTPOP:%[0-9]+]]:_(s32) = G_CTPOP [[COPY]](s64)
				; CHECK: $vgpr0 = COPY [[CTPOP]](s32)
				%0:_(s64) = COPY $vgpr0_vgpr1
				%1:_(s32) = G_CTPOP %0
				$vgpr0 = COPY %1
				...

				---
				name: ctpop_s64_s64

				body: \|
				bb.0:
				liveins: $vgpr0_vgpr1
				; CHECK-LABEL: name: ctpop_s64_s64
				; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $vgpr0_vgpr1
				; CHECK: [[CTPOP:%[0-9]+]]:_(s32) = G_CTPOP [[COPY]](s64)
				; CHECK: [[ZEXT:%[0-9]+]]:_(s64) = G_ZEXT [[CTPOP]](s32)
				; CHECK: $vgpr0_vgpr1 = COPY [[ZEXT]](s64)
				%0:_(s64) = COPY $vgpr0_vgpr1
				%1:_(s64) = G_CTPOP %0
				$vgpr0_vgpr1 = COPY %1
				...

				---
				name: ctpop_s16_s32

				body: \|
				bb.0:
				liveins: $vgpr0
				; CHECK-LABEL: name: ctpop_s16_s32
				; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
				; CHECK: [[CTPOP:%[0-9]+]]:_(s32) = G_CTPOP [[COPY]](s32)
				; CHECK: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 65535
				; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[CTPOP]](s32)
				; CHECK: [[AND:%[0-9]+]]:_(s32) = G_AND [[COPY1]], [[C]]
				; CHECK: $vgpr0 = COPY [[AND]](s32)
				%0:_(s32) = COPY $vgpr0
				%1:_(s16) = G_CTPOP %0
				%2:_(s32) = G_ZEXT %1
				$vgpr0 = COPY %2
				...

				---
				name: ctpop_s16_s16

				body: \|
				bb.0:
				liveins: $vgpr0
				; CHECK-LABEL: name: ctpop_s16_s16
				; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
				; CHECK: [[TRUNC:%[0-9]+]]:_(s16) = G_TRUNC [[COPY]](s32)
				; CHECK: [[CTPOP:%[0-9]+]]:_(s32) = G_CTPOP [[TRUNC]](s16)
				; CHECK: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 65535
				; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[CTPOP]](s32)
				; CHECK: [[AND:%[0-9]+]]:_(s32) = G_AND [[COPY1]], [[C]]
				; CHECK: $vgpr0 = COPY [[AND]](s32)
				%0:_(s32) = COPY $vgpr0
				%1:_(s16) = G_TRUNC %0
				%2:_(s16) = G_CTPOP %1
				%3:_(s32) = G_ZEXT %2
				$vgpr0 = COPY %3
				...

test/CodeGen/AMDGPU/GlobalISel/legalize-cttz-zero-undef.mir

This file was added.

				# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
				# RUN: llc -mtriple=amdgcn-mesa-mesa3d -mcpu=fiji -O0 -run-pass=legalizer %s -o - \| FileCheck %s

				---
				name: cttz_zero_undef_s32_s32

				body: \|
				bb.0:
				liveins: $vgpr0
				; CHECK-LABEL: name: cttz_zero_undef_s32_s32
				; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
				; CHECK: [[CTTZ_ZERO_UNDEF:%[0-9]+]]:_(s32) = G_CTTZ_ZERO_UNDEF [[COPY]](s32)
				; CHECK: $vgpr0 = COPY [[CTTZ_ZERO_UNDEF]](s32)
				%0:_(s32) = COPY $vgpr0
				%1:_(s32) = G_CTTZ_ZERO_UNDEF %0
				$vgpr0 = COPY %1
				...

				---
				name: cttz_zero_undef_s32_s64

				body: \|
				bb.0:
				liveins: $vgpr0_vgpr1
				; CHECK-LABEL: name: cttz_zero_undef_s32_s64
				; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $vgpr0_vgpr1
				; CHECK: [[CTTZ_ZERO_UNDEF:%[0-9]+]]:_(s32) = G_CTTZ_ZERO_UNDEF [[COPY]](s64)
				; CHECK: $vgpr0 = COPY [[CTTZ_ZERO_UNDEF]](s32)
				%0:_(s64) = COPY $vgpr0_vgpr1
				%1:_(s32) = G_CTTZ_ZERO_UNDEF %0
				$vgpr0 = COPY %1
				...

				---
				name: cttz_zero_undef_s64_s64

				body: \|
				bb.0:
				liveins: $vgpr0_vgpr1
				; CHECK-LABEL: name: cttz_zero_undef_s64_s64
				; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $vgpr0_vgpr1
				; CHECK: [[CTTZ_ZERO_UNDEF:%[0-9]+]]:_(s32) = G_CTTZ_ZERO_UNDEF [[COPY]](s64)
				; CHECK: [[ZEXT:%[0-9]+]]:_(s64) = G_ZEXT [[CTTZ_ZERO_UNDEF]](s32)
				; CHECK: $vgpr0_vgpr1 = COPY [[ZEXT]](s64)
				%0:_(s64) = COPY $vgpr0_vgpr1
				%1:_(s64) = G_CTTZ_ZERO_UNDEF %0
				$vgpr0_vgpr1 = COPY %1
				...

				---
				name: cttz_zero_undef_s16_s32

				body: \|
				bb.0:
				liveins: $vgpr0
				; CHECK-LABEL: name: cttz_zero_undef_s16_s32
				; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
				; CHECK: [[CTTZ_ZERO_UNDEF:%[0-9]+]]:_(s32) = G_CTTZ_ZERO_UNDEF [[COPY]](s32)
				; CHECK: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 65535
				; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[CTTZ_ZERO_UNDEF]](s32)
				; CHECK: [[AND:%[0-9]+]]:_(s32) = G_AND [[COPY1]], [[C]]
				; CHECK: $vgpr0 = COPY [[AND]](s32)
				%0:_(s32) = COPY $vgpr0
				%1:_(s16) = G_CTTZ_ZERO_UNDEF %0
				%2:_(s32) = G_ZEXT %1
				$vgpr0 = COPY %2
				...

				---
				name: cttz_zero_undef_s16_s16

				body: \|
				bb.0:
				liveins: $vgpr0
				; CHECK-LABEL: name: cttz_zero_undef_s16_s16
				; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
				; CHECK: [[TRUNC:%[0-9]+]]:_(s16) = G_TRUNC [[COPY]](s32)
				; CHECK: [[CTTZ_ZERO_UNDEF:%[0-9]+]]:_(s32) = G_CTTZ_ZERO_UNDEF [[TRUNC]](s16)
				; CHECK: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 65535
				; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[CTTZ_ZERO_UNDEF]](s32)
				; CHECK: [[AND:%[0-9]+]]:_(s32) = G_AND [[COPY1]], [[C]]
				; CHECK: $vgpr0 = COPY [[AND]](s32)
				%0:_(s32) = COPY $vgpr0
				%1:_(s16) = G_TRUNC %0
				%2:_(s16) = G_CTTZ_ZERO_UNDEF %1
				%3:_(s32) = G_ZEXT %2
				$vgpr0 = COPY %3
				...

test/CodeGen/AMDGPU/GlobalISel/legalize-cttz.mir

This file was added.

				# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
				# RUN: llc -mtriple=amdgcn-mesa-mesa3d -mcpu=fiji -O0 -run-pass=legalizer %s -o - \| FileCheck %s

				---
				name: cttz_s32_s32

				body: \|
				bb.0:
				liveins: $vgpr0
				; CHECK-LABEL: name: cttz_s32_s32
				; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
				; CHECK: [[CTTZ:%[0-9]+]]:_(s32) = G_CTTZ [[COPY]](s32)
				; CHECK: $vgpr0 = COPY [[CTTZ]](s32)
				%0:_(s32) = COPY $vgpr0
				%1:_(s32) = G_CTTZ %0
				$vgpr0 = COPY %1
				...

				---
				name: cttz_s32_s64

				body: \|
				bb.0:
				liveins: $vgpr0_vgpr1
				; CHECK-LABEL: name: cttz_s32_s64
				; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $vgpr0_vgpr1
				; CHECK: [[CTTZ:%[0-9]+]]:_(s32) = G_CTTZ [[COPY]](s64)
				; CHECK: $vgpr0 = COPY [[CTTZ]](s32)
				%0:_(s64) = COPY $vgpr0_vgpr1
				%1:_(s32) = G_CTTZ %0
				$vgpr0 = COPY %1
				...

				---
				name: cttz_s64_s64

				body: \|
				bb.0:
				liveins: $vgpr0_vgpr1
				; CHECK-LABEL: name: cttz_s64_s64
				; CHECK: [[COPY:%[0-9]+]]:_(s64) = COPY $vgpr0_vgpr1
				; CHECK: [[CTTZ:%[0-9]+]]:_(s32) = G_CTTZ [[COPY]](s64)
				; CHECK: [[ZEXT:%[0-9]+]]:_(s64) = G_ZEXT [[CTTZ]](s32)
				; CHECK: $vgpr0_vgpr1 = COPY [[ZEXT]](s64)
				%0:_(s64) = COPY $vgpr0_vgpr1
				%1:_(s64) = G_CTTZ %0
				$vgpr0_vgpr1 = COPY %1
				...

				---
				name: cttz_s16_s32

				body: \|
				bb.0:
				liveins: $vgpr0
				; CHECK-LABEL: name: cttz_s16_s32
				; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
				; CHECK: [[CTTZ:%[0-9]+]]:_(s32) = G_CTTZ [[COPY]](s32)
				; CHECK: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 65535
				; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[CTTZ]](s32)
				; CHECK: [[AND:%[0-9]+]]:_(s32) = G_AND [[COPY1]], [[C]]
				; CHECK: $vgpr0 = COPY [[AND]](s32)
				%0:_(s32) = COPY $vgpr0
				%1:_(s16) = G_CTTZ %0
				%2:_(s32) = G_ZEXT %1
				$vgpr0 = COPY %2
				...

				---
				name: cttz_s16_s16

				body: \|
				bb.0:
				liveins: $vgpr0
				; CHECK-LABEL: name: cttz_s16_s16
				; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
				; CHECK: [[TRUNC:%[0-9]+]]:_(s16) = G_TRUNC [[COPY]](s32)
				; CHECK: [[CTTZ:%[0-9]+]]:_(s32) = G_CTTZ [[TRUNC]](s16)
				; CHECK: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 65535
				; CHECK: [[COPY1:%[0-9]+]]:_(s32) = COPY [[CTTZ]](s32)
				; CHECK: [[AND:%[0-9]+]]:_(s32) = G_AND [[COPY1]], [[C]]
				; CHECK: $vgpr0 = COPY [[AND]](s32)
				%0:_(s32) = COPY $vgpr0
				%1:_(s16) = G_TRUNC %0
				%2:_(s16) = G_CTTZ %1
				%3:_(s32) = G_ZEXT %2
				$vgpr0 = COPY %3
				...

unittests/CodeGen/GlobalISel/LegalizerHelperTest.cpp

	Show All 20 Lines

	// Test CTTZ expansion when CTTZ_ZERO_UNDEF is legal or custom,			// Test CTTZ expansion when CTTZ_ZERO_UNDEF is legal or custom,
	// in which case it becomes CTTZ_ZERO_UNDEF with select.			// in which case it becomes CTTZ_ZERO_UNDEF with select.
	TEST_F(GISelMITest, LowerBitCountingCTTZ0) {			TEST_F(GISelMITest, LowerBitCountingCTTZ0) {
	if (!TM)			if (!TM)
	return;			return;

	// Declare your legalization info			// Declare your legalization info
	DefineLegalizerInfo(			DefineLegalizerInfo(A, {
	A, { getActionDefinitionsBuilder(G_CTTZ_ZERO_UNDEF).legalFor({s64}); });			getActionDefinitionsBuilder(G_CTTZ_ZERO_UNDEF).legalFor({{s64, s64}});
				});
	// Build Instr			// Build Instr
	auto MIBCTTZ =			auto MIBCTTZ =
	B.buildInstr(TargetOpcode::G_CTTZ, {LLT::scalar(64)}, {Copies[0]});			B.buildInstr(TargetOpcode::G_CTTZ, {LLT::scalar(64)}, {Copies[0]});
	AInfo Info(MF->getSubtarget());			AInfo Info(MF->getSubtarget());
	DummyGISelObserver Observer;			DummyGISelObserver Observer;
	LegalizerHelper Helper(*MF, Info, Observer, B);			LegalizerHelper Helper(*MF, Info, Observer, B);
	// Perform Legalization			// Perform Legalization
	ASSERT_TRUE(Helper.lower(*MIBCTTZ, 0, LLT::scalar(64)) ==			ASSERT_TRUE(Helper.lower(*MIBCTTZ, 0, LLT::scalar(64)) ==
	Show All 12 Lines
	}			}

	// CTTZ expansion in terms of CTLZ			// CTTZ expansion in terms of CTLZ
	TEST_F(GISelMITest, LowerBitCountingCTTZ1) {			TEST_F(GISelMITest, LowerBitCountingCTTZ1) {
	if (!TM)			if (!TM)
	return;			return;

	// Declare your legalization info			// Declare your legalization info
	DefineLegalizerInfo(A,			DefineLegalizerInfo(A, {
	{ getActionDefinitionsBuilder(G_CTLZ).legalFor({s64}); });			getActionDefinitionsBuilder(G_CTLZ).legalFor({{s64, s64}});
				});
	// Build Instr			// Build Instr
	auto MIBCTTZ =			auto MIBCTTZ =
	B.buildInstr(TargetOpcode::G_CTTZ, {LLT::scalar(64)}, {Copies[0]});			B.buildInstr(TargetOpcode::G_CTTZ, {LLT::scalar(64)}, {Copies[0]});
	AInfo Info(MF->getSubtarget());			AInfo Info(MF->getSubtarget());
	DummyGISelObserver Observer;			DummyGISelObserver Observer;
	LegalizerHelper Helper(*MF, Info, Observer, B);			LegalizerHelper Helper(*MF, Info, Observer, B);
	// Perform Legalization			// Perform Legalization
	ASSERT_TRUE(Helper.lower(*MIBCTTZ, 0, LLT::scalar(64)) ==			ASSERT_TRUE(Helper.lower(*MIBCTTZ, 0, LLT::scalar(64)) ==
	Show All 14 Lines
	}			}

	// CTTZ expansion in terms of CTPOP			// CTTZ expansion in terms of CTPOP
	TEST_F(GISelMITest, LowerBitCountingCTTZ2) {			TEST_F(GISelMITest, LowerBitCountingCTTZ2) {
	if (!TM)			if (!TM)
	return;			return;

	// Declare your legalization info			// Declare your legalization info
	DefineLegalizerInfo(			DefineLegalizerInfo(A, {
	A, { getActionDefinitionsBuilder(G_CTPOP).legalFor({s64}); });			getActionDefinitionsBuilder(G_CTPOP).legalFor({{s64, s64}});
				});
	// Build			// Build
	auto MIBCTTZ =			auto MIBCTTZ =
	B.buildInstr(TargetOpcode::G_CTTZ, {LLT::scalar(64)}, {Copies[0]});			B.buildInstr(TargetOpcode::G_CTTZ, {LLT::scalar(64)}, {Copies[0]});
	AInfo Info(MF->getSubtarget());			AInfo Info(MF->getSubtarget());
	DummyGISelObserver Observer;			DummyGISelObserver Observer;
	LegalizerHelper Helper(*MF, Info, Observer, B);			LegalizerHelper Helper(*MF, Info, Observer, B);
	ASSERT_TRUE(Helper.lower(*MIBCTTZ, 0, LLT::scalar(64)) ==			ASSERT_TRUE(Helper.lower(*MIBCTTZ, 0, LLT::scalar(64)) ==
	LegalizerHelper::LegalizeResult::Legalized);			LegalizerHelper::LegalizeResult::Legalized);
	Show All 11 Lines
	}			}

	// CTTZ_ZERO_UNDEF expansion in terms of CTTZ			// CTTZ_ZERO_UNDEF expansion in terms of CTTZ
	TEST_F(GISelMITest, LowerBitCountingCTTZ3) {			TEST_F(GISelMITest, LowerBitCountingCTTZ3) {
	if (!TM)			if (!TM)
	return;			return;

	// Declare your legalization info			// Declare your legalization info
	DefineLegalizerInfo(A,			DefineLegalizerInfo(A, {
	{ getActionDefinitionsBuilder(G_CTTZ).legalFor({s64}); });			getActionDefinitionsBuilder(G_CTTZ).legalFor({{s64, s64}});
				});
	// Build			// Build
	auto MIBCTTZ = B.buildInstr(TargetOpcode::G_CTTZ_ZERO_UNDEF,			auto MIBCTTZ = B.buildInstr(TargetOpcode::G_CTTZ_ZERO_UNDEF,
	{LLT::scalar(64)}, {Copies[0]});			{LLT::scalar(64)}, {Copies[0]});
	AInfo Info(MF->getSubtarget());			AInfo Info(MF->getSubtarget());
	DummyGISelObserver Observer;			DummyGISelObserver Observer;
	LegalizerHelper Helper(*MF, Info, Observer, B);			LegalizerHelper Helper(*MF, Info, Observer, B);
	ASSERT_TRUE(Helper.lower(*MIBCTTZ, 0, LLT::scalar(64)) ==			ASSERT_TRUE(Helper.lower(*MIBCTTZ, 0, LLT::scalar(64)) ==
	LegalizerHelper::LegalizeResult::Legalized);			LegalizerHelper::LegalizeResult::Legalized);

	auto CheckStr = R"(			auto CheckStr = R"(
	CHECK: CTTZ			CHECK: CTTZ
	)";			)";

	// Check			// Check
	ASSERT_TRUE(CheckMachineFunction(*MF, CheckStr));			ASSERT_TRUE(CheckMachineFunction(*MF, CheckStr));
	}			}

	// CTLZ expansion in terms of CTLZ_ZERO_UNDEF			// CTLZ expansion in terms of CTLZ_ZERO_UNDEF
	TEST_F(GISelMITest, LowerBitCountingCTLZ0) {			TEST_F(GISelMITest, LowerBitCountingCTLZ0) {
	if (!TM)			if (!TM)
	return;			return;

	// Declare your legalization info			// Declare your legalization info
	DefineLegalizerInfo(			DefineLegalizerInfo(A, {
	A, { getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF).legalFor({s64}); });			getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF).legalFor({{s64, s64}});
				});
	// Build			// Build
	auto MIBCTLZ =			auto MIBCTLZ =
	B.buildInstr(TargetOpcode::G_CTLZ, {LLT::scalar(64)}, {Copies[0]});			B.buildInstr(TargetOpcode::G_CTLZ, {LLT::scalar(64)}, {Copies[0]});
	AInfo Info(MF->getSubtarget());			AInfo Info(MF->getSubtarget());
	DummyGISelObserver Observer;			DummyGISelObserver Observer;
	LegalizerHelper Helper(*MF, Info, Observer, B);			LegalizerHelper Helper(*MF, Info, Observer, B);
	ASSERT_TRUE(Helper.lower(*MIBCTLZ, 0, LLT::scalar(64)) ==			ASSERT_TRUE(Helper.lower(*MIBCTLZ, 0, LLT::scalar(64)) ==
	LegalizerHelper::LegalizeResult::Legalized);			LegalizerHelper::LegalizeResult::Legalized);
	Show All 11 Lines
	}			}

	// CTLZ expansion in terms of CTLZ_ZERO_UNDEF if the latter is a libcall			// CTLZ expansion in terms of CTLZ_ZERO_UNDEF if the latter is a libcall
	TEST_F(GISelMITest, LowerBitCountingCTLZLibcall) {			TEST_F(GISelMITest, LowerBitCountingCTLZLibcall) {
	if (!TM)			if (!TM)
	return;			return;

	// Declare your legalization info			// Declare your legalization info
	DefineLegalizerInfo(			DefineLegalizerInfo(A, {
	A, { getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF).libcallFor({s64}); });			getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF).libcallFor({{s64, s64}});
				});
	// Build			// Build
	auto MIBCTLZ =			auto MIBCTLZ =
	B.buildInstr(TargetOpcode::G_CTLZ, {LLT::scalar(64)}, {Copies[0]});			B.buildInstr(TargetOpcode::G_CTLZ, {LLT::scalar(64)}, {Copies[0]});
	AInfo Info(MF->getSubtarget());			AInfo Info(MF->getSubtarget());
	DummyGISelObserver Observer;			DummyGISelObserver Observer;
	LegalizerHelper Helper(*MF, Info, Observer, B);			LegalizerHelper Helper(*MF, Info, Observer, B);
	ASSERT_TRUE(Helper.lower(*MIBCTLZ, 0, LLT::scalar(64)) ==			ASSERT_TRUE(Helper.lower(*MIBCTLZ, 0, LLT::scalar(64)) ==
	LegalizerHelper::LegalizeResult::Legalized);			LegalizerHelper::LegalizeResult::Legalized);
	Show All 11 Lines
	}			}

	// CTLZ expansion			// CTLZ expansion
	TEST_F(GISelMITest, LowerBitCountingCTLZ1) {			TEST_F(GISelMITest, LowerBitCountingCTLZ1) {
	if (!TM)			if (!TM)
	return;			return;

	// Declare your legalization info			// Declare your legalization info
	DefineLegalizerInfo(A,			DefineLegalizerInfo(A, {
	{ getActionDefinitionsBuilder(G_CTPOP).legalFor({s8}); });			getActionDefinitionsBuilder(G_CTPOP).legalFor({{s8, s8}});
				});
	// Build			// Build
	// Trunc it to s8.			// Trunc it to s8.
	LLT s8{LLT::scalar(8)};			LLT s8{LLT::scalar(8)};
	auto MIBTrunc = B.buildTrunc(s8, Copies[0]);			auto MIBTrunc = B.buildTrunc(s8, Copies[0]);
	auto MIBCTLZ = B.buildInstr(TargetOpcode::G_CTLZ, {s8}, {MIBTrunc});			auto MIBCTLZ = B.buildInstr(TargetOpcode::G_CTLZ, {s8}, {MIBTrunc});
	AInfo Info(MF->getSubtarget());			AInfo Info(MF->getSubtarget());
	DummyGISelObserver Observer;			DummyGISelObserver Observer;
	LegalizerHelper Helper(*MF, Info, Observer, B);			LegalizerHelper Helper(*MF, Info, Observer, B);
	Show All 21 Lines
	}			}

	// CTLZ widening.			// CTLZ widening.
	TEST_F(GISelMITest, WidenBitCountingCTLZ) {			TEST_F(GISelMITest, WidenBitCountingCTLZ) {
	if (!TM)			if (!TM)
	return;			return;

	// Declare your legalization info			// Declare your legalization info
	DefineLegalizerInfo(A,			DefineLegalizerInfo(A, {
	{ getActionDefinitionsBuilder(G_CTLZ).legalFor({s16}); });			getActionDefinitionsBuilder(G_CTLZ).legalFor({{s16, s16}});
				});
	// Build			// Build
	// Trunc it to s8.			// Trunc it to s8.
	LLT s8{LLT::scalar(8)};			LLT s8{LLT::scalar(8)};
	LLT s16{LLT::scalar(16)};			LLT s16{LLT::scalar(16)};
	auto MIBTrunc = B.buildTrunc(s8, Copies[0]);			auto MIBTrunc = B.buildTrunc(s8, Copies[0]);
	auto MIBCTLZ = B.buildInstr(TargetOpcode::G_CTLZ, {s8}, {MIBTrunc});			auto MIBCTLZ = B.buildInstr(TargetOpcode::G_CTLZ, {s8}, {MIBTrunc});
	AInfo Info(MF->getSubtarget());			AInfo Info(MF->getSubtarget());
	DummyGISelObserver Observer;			DummyGISelObserver Observer;
	LegalizerHelper Helper(*MF, Info, Observer, B);			LegalizerHelper Helper(*MF, Info, Observer, B);
	ASSERT_TRUE(Helper.widenScalar(*MIBCTLZ, 0, s16) ==			ASSERT_TRUE(Helper.widenScalar(*MIBCTLZ, 1, s16) ==
	LegalizerHelper::LegalizeResult::Legalized);			LegalizerHelper::LegalizeResult::Legalized);

	auto CheckStr = R"(			auto CheckStr = R"(
	CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC			CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC
	CHECK: [[Zext:%[0-9]+]]:_(s16) = G_ZEXT [[Trunc]]			CHECK: [[Zext:%[0-9]+]]:_(s16) = G_ZEXT [[Trunc]]
	CHECK: [[Ctlz:%[0-9]+]]:_(s16) = G_CTLZ [[Zext]]			CHECK: [[Ctlz:%[0-9]+]]:_(s16) = G_CTLZ [[Zext]]
	CHECK: [[Cst8:%[0-9]+]]:_(s16) = G_CONSTANT i16 8			CHECK: [[Cst8:%[0-9]+]]:_(s16) = G_CONSTANT i16 8
	CHECK: [[Sub:%[0-9]+]]:_(s16) = G_SUB [[Ctlz]]:_, [[Cst8]]:_			CHECK: [[Sub:%[0-9]+]]:_(s16) = G_SUB [[Ctlz]]:_, [[Cst8]]:_
	CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC [[Sub]]			CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC [[Sub]]
	)";			)";

	// Check			// Check
	ASSERT_TRUE(CheckMachineFunction(*MF, CheckStr));			ASSERT_TRUE(CheckMachineFunction(*MF, CheckStr));
	}			}

	// CTLZ_ZERO_UNDEF widening.			// CTLZ_ZERO_UNDEF widening.
	TEST_F(GISelMITest, WidenBitCountingCTLZZeroUndef) {			TEST_F(GISelMITest, WidenBitCountingCTLZZeroUndef) {
	if (!TM)			if (!TM)
	return;			return;

	// Declare your legalization info			// Declare your legalization info
	DefineLegalizerInfo(			DefineLegalizerInfo(A, {
	A, { getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF).legalFor({s16}); });			getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF).legalFor({{s16, s16}});
				});
	// Build			// Build
	// Trunc it to s8.			// Trunc it to s8.
	LLT s8{LLT::scalar(8)};			LLT s8{LLT::scalar(8)};
	LLT s16{LLT::scalar(16)};			LLT s16{LLT::scalar(16)};
	auto MIBTrunc = B.buildTrunc(s8, Copies[0]);			auto MIBTrunc = B.buildTrunc(s8, Copies[0]);
	auto MIBCTLZ_ZU =			auto MIBCTLZ_ZU =
	B.buildInstr(TargetOpcode::G_CTLZ_ZERO_UNDEF, {s8}, {MIBTrunc});			B.buildInstr(TargetOpcode::G_CTLZ_ZERO_UNDEF, {s8}, {MIBTrunc});
	AInfo Info(MF->getSubtarget());			AInfo Info(MF->getSubtarget());
	DummyGISelObserver Observer;			DummyGISelObserver Observer;
	LegalizerHelper Helper(*MF, Info, Observer, B);			LegalizerHelper Helper(*MF, Info, Observer, B);
	ASSERT_TRUE(Helper.widenScalar(*MIBCTLZ_ZU, 0, s16) ==			ASSERT_TRUE(Helper.widenScalar(*MIBCTLZ_ZU, 1, s16) ==
	LegalizerHelper::LegalizeResult::Legalized);			LegalizerHelper::LegalizeResult::Legalized);

	auto CheckStr = R"(			auto CheckStr = R"(
	CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC			CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC
	CHECK: [[Zext:%[0-9]+]]:_(s16) = G_ZEXT [[Trunc]]			CHECK: [[Zext:%[0-9]+]]:_(s16) = G_ZEXT [[Trunc]]
	CHECK: [[CtlzZu:%[0-9]+]]:_(s16) = G_CTLZ_ZERO_UNDEF [[Zext]]			CHECK: [[CtlzZu:%[0-9]+]]:_(s16) = G_CTLZ_ZERO_UNDEF [[Zext]]
	CHECK: [[Cst8:%[0-9]+]]:_(s16) = G_CONSTANT i16 8			CHECK: [[Cst8:%[0-9]+]]:_(s16) = G_CONSTANT i16 8
	CHECK: [[Sub:%[0-9]+]]:_(s16) = G_SUB [[CtlzZu]]:_, [[Cst8]]:_			CHECK: [[Sub:%[0-9]+]]:_(s16) = G_SUB [[CtlzZu]]:_, [[Cst8]]:_
	CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC [[Sub]]			CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC [[Sub]]
	)";			)";

	// Check			// Check
	ASSERT_TRUE(CheckMachineFunction(*MF, CheckStr));			ASSERT_TRUE(CheckMachineFunction(*MF, CheckStr));
	}			}

	// CTPOP widening.			// CTPOP widening.
	TEST_F(GISelMITest, WidenBitCountingCTPOP) {			TEST_F(GISelMITest, WidenBitCountingCTPOP) {
	if (!TM)			if (!TM)
	return;			return;

	// Declare your legalization info			// Declare your legalization info
	DefineLegalizerInfo(			DefineLegalizerInfo(A, {
	A, { getActionDefinitionsBuilder(G_CTPOP).legalFor({s16}); });			getActionDefinitionsBuilder(G_CTPOP).legalFor({{s16, s16}});
				});
	// Build			// Build
	// Trunc it to s8.			// Trunc it to s8.
	LLT s8{LLT::scalar(8)};			LLT s8{LLT::scalar(8)};
	LLT s16{LLT::scalar(16)};			LLT s16{LLT::scalar(16)};
	auto MIBTrunc = B.buildTrunc(s8, Copies[0]);			auto MIBTrunc = B.buildTrunc(s8, Copies[0]);
	auto MIBCTPOP = B.buildInstr(TargetOpcode::G_CTPOP, {s8}, {MIBTrunc});			auto MIBCTPOP = B.buildInstr(TargetOpcode::G_CTPOP, {s8}, {MIBTrunc});
	AInfo Info(MF->getSubtarget());			AInfo Info(MF->getSubtarget());
	DummyGISelObserver Observer;			DummyGISelObserver Observer;
	LegalizerHelper Helper(*MF, Info, Observer, B);			LegalizerHelper Helper(*MF, Info, Observer, B);
	ASSERT_TRUE(Helper.widenScalar(*MIBCTPOP, 0, s16) ==			ASSERT_TRUE(Helper.widenScalar(*MIBCTPOP, 1, s16) ==
	LegalizerHelper::LegalizeResult::Legalized);			LegalizerHelper::LegalizeResult::Legalized);

	auto CheckStr = R"(			auto CheckStr = R"(
	CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC			CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC
	CHECK: [[Zext:%[0-9]+]]:_(s16) = G_ZEXT [[Trunc]]			CHECK: [[Zext:%[0-9]+]]:_(s16) = G_ZEXT [[Trunc]]
	CHECK: [[Ctpop:%[0-9]+]]:_(s16) = G_CTPOP [[Zext]]			CHECK: [[Ctpop:%[0-9]+]]:_(s16) = G_CTPOP [[Zext]]
	CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC [[Ctpop]]			CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC [[Ctpop]]
	)";			)";
				rtereshin (Unsubmitted, Not Done): Another example of this behavior: isn't widening for type index 1 supposed to widen only the source? As can be seen here, it ends up widening both the source and the destination. The resulting code isn't broken largely because the source and destination types of the input instruction are the same.
				arsenm (Author, Unsubmitted, Done): Yes, for these the source and dest can be separately legalized.

	// Check			// Check
	ASSERT_TRUE(CheckMachineFunction(*MF, CheckStr));			ASSERT_TRUE(CheckMachineFunction(*MF, CheckStr));
	}			}

	// CTTZ_ZERO_UNDEF widening.			// CTTZ_ZERO_UNDEF widening.
	TEST_F(GISelMITest, WidenBitCountingCTTZ_ZERO_UNDEF) {			TEST_F(GISelMITest, WidenBitCountingCTTZ_ZERO_UNDEF) {
	if (!TM)			if (!TM)
	return;			return;

	// Declare your legalization info			// Declare your legalization info
	DefineLegalizerInfo(			DefineLegalizerInfo(A, {
	A, { getActionDefinitionsBuilder(G_CTTZ_ZERO_UNDEF).legalFor({s16}); });			getActionDefinitionsBuilder(G_CTTZ_ZERO_UNDEF).legalFor({{s16, s16}});
				});
	// Build			// Build
	// Trunc it to s8.			// Trunc it to s8.
	LLT s8{LLT::scalar(8)};			LLT s8{LLT::scalar(8)};
	LLT s16{LLT::scalar(16)};			LLT s16{LLT::scalar(16)};
	auto MIBTrunc = B.buildTrunc(s8, Copies[0]);			auto MIBTrunc = B.buildTrunc(s8, Copies[0]);
	auto MIBCTTZ_ZERO_UNDEF =			auto MIBCTTZ_ZERO_UNDEF =
	B.buildInstr(TargetOpcode::G_CTTZ_ZERO_UNDEF, {s8}, {MIBTrunc});			B.buildInstr(TargetOpcode::G_CTTZ_ZERO_UNDEF, {s8}, {MIBTrunc});
	AInfo Info(MF->getSubtarget());			AInfo Info(MF->getSubtarget());
	DummyGISelObserver Observer;			DummyGISelObserver Observer;
	LegalizerHelper Helper(*MF, Info, Observer, B);			LegalizerHelper Helper(*MF, Info, Observer, B);
	ASSERT_TRUE(Helper.widenScalar(*MIBCTTZ_ZERO_UNDEF, 0, s16) ==			ASSERT_TRUE(Helper.widenScalar(*MIBCTTZ_ZERO_UNDEF, 1, s16) ==
	LegalizerHelper::LegalizeResult::Legalized);			LegalizerHelper::LegalizeResult::Legalized);

	auto CheckStr = R"(			auto CheckStr = R"(
	CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC			CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC
	CHECK: [[Zext:%[0-9]+]]:_(s16) = G_ZEXT [[Trunc]]			CHECK: [[Zext:%[0-9]+]]:_(s16) = G_ZEXT [[Trunc]]
	CHECK: [[CttzZu:%[0-9]+]]:_(s16) = G_CTTZ_ZERO_UNDEF [[Zext]]			CHECK: [[CttzZu:%[0-9]+]]:_(s16) = G_CTTZ_ZERO_UNDEF [[Zext]]
	CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC [[CttzZu]]			CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC [[CttzZu]]
	)";			)";

	// Check			// Check
	ASSERT_TRUE(CheckMachineFunction(*MF, CheckStr));			ASSERT_TRUE(CheckMachineFunction(*MF, CheckStr));
	}			}

	// CTTZ widening.			// CTTZ widening.
	TEST_F(GISelMITest, WidenBitCountingCTTZ) {			TEST_F(GISelMITest, WidenBitCountingCTTZ) {
	if (!TM)			if (!TM)
	return;			return;

	// Declare your legalization info			// Declare your legalization info
	DefineLegalizerInfo(A,			DefineLegalizerInfo(A, {
	{ getActionDefinitionsBuilder(G_CTTZ).legalFor({s16}); });			getActionDefinitionsBuilder(G_CTTZ).legalFor({{s16, s16}});
				});
	// Build			// Build
	// Trunc it to s8.			// Trunc it to s8.
	LLT s8{LLT::scalar(8)};			LLT s8{LLT::scalar(8)};
	LLT s16{LLT::scalar(16)};			LLT s16{LLT::scalar(16)};
	auto MIBTrunc = B.buildTrunc(s8, Copies[0]);			auto MIBTrunc = B.buildTrunc(s8, Copies[0]);
	auto MIBCTTZ = B.buildInstr(TargetOpcode::G_CTTZ, {s8}, {MIBTrunc});			auto MIBCTTZ = B.buildInstr(TargetOpcode::G_CTTZ, {s8}, {MIBTrunc});
	AInfo Info(MF->getSubtarget());			AInfo Info(MF->getSubtarget());
	DummyGISelObserver Observer;			DummyGISelObserver Observer;
	LegalizerHelper Helper(*MF, Info, Observer, B);			LegalizerHelper Helper(*MF, Info, Observer, B);
	ASSERT_TRUE(Helper.widenScalar(*MIBCTTZ, 0, s16) ==			ASSERT_TRUE(Helper.widenScalar(*MIBCTTZ, 1, s16) ==
	LegalizerHelper::LegalizeResult::Legalized);			LegalizerHelper::LegalizeResult::Legalized);

	auto CheckStr = R"(			auto CheckStr = R"(
	CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC			CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC
	CHECK: [[Zext:%[0-9]+]]:_(s16) = G_ZEXT [[Trunc]]			CHECK: [[Zext:%[0-9]+]]:_(s16) = G_ZEXT [[Trunc]]
	CHECK: [[Cst:%[0-9]+]]:_(s16) = G_CONSTANT i16 256			CHECK: [[Cst:%[0-9]+]]:_(s16) = G_CONSTANT i16 256
	CHECK: [[Or:%[0-9]+]]:_(s16) = G_OR [[Zext]]:_, [[Cst]]			CHECK: [[Or:%[0-9]+]]:_(s16) = G_OR [[Zext]]:_, [[Cst]]
	CHECK: [[Cttz:%[0-9]+]]:_(s16) = G_CTTZ [[Or]]			CHECK: [[Cttz:%[0-9]+]]:_(s16) = G_CTTZ [[Or]]
	CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC [[Cttz]]			CHECK: [[Trunc:%[0-9]+]]:_(s8) = G_TRUNC [[Cttz]]
	)";			)";

	// Check			// Check
	ASSERT_TRUE(CheckMachineFunction(*MF, CheckStr));			ASSERT_TRUE(CheckMachineFunction(*MF, CheckStr));
	}			}
	// UADDO widening.			// UADDO widening.
	TEST_F(GISelMITest, WidenUADDO) {			TEST_F(GISelMITest, WidenUADDO) {
	if (!TM)			if (!TM)
	return;			return;

	// Declare your legalization info			// Declare your legalization info
	DefineLegalizerInfo(A,			DefineLegalizerInfo(A, {
	{ getActionDefinitionsBuilder(G_ADD).legalFor({s16}); });			getActionDefinitionsBuilder(G_ADD).legalFor({{s16, s16}});
				});
	// Build			// Build
	// Trunc it to s8.			// Trunc it to s8.
	LLT s8{LLT::scalar(8)};			LLT s8{LLT::scalar(8)};
	LLT s16{LLT::scalar(16)};			LLT s16{LLT::scalar(16)};
	auto MIBTrunc = B.buildTrunc(s8, Copies[0]);			auto MIBTrunc = B.buildTrunc(s8, Copies[0]);
	unsigned CarryReg = MRI->createGenericVirtualRegister(LLT::scalar(1));			unsigned CarryReg = MRI->createGenericVirtualRegister(LLT::scalar(1));
	auto MIBUAddO =			auto MIBUAddO =
	B.buildInstr(TargetOpcode::G_UADDO, {s8, CarryReg}, {MIBTrunc, MIBTrunc});			B.buildInstr(TargetOpcode::G_UADDO, {s8, CarryReg}, {MIBTrunc, MIBTrunc});
	Show All 19 Lines
	}			}

	// USUBO widening.			// USUBO widening.
	TEST_F(GISelMITest, WidenUSUBO) {			TEST_F(GISelMITest, WidenUSUBO) {
	if (!TM)			if (!TM)
	return;			return;

	// Declare your legalization info			// Declare your legalization info
	DefineLegalizerInfo(A,			DefineLegalizerInfo(A, {
	{ getActionDefinitionsBuilder(G_SUB).legalFor({s16}); });			getActionDefinitionsBuilder(G_SUB).legalFor({{s16, s16}});
				});
	// Build			// Build
	// Trunc it to s8.			// Trunc it to s8.
	LLT s8{LLT::scalar(8)};			LLT s8{LLT::scalar(8)};
	LLT s16{LLT::scalar(16)};			LLT s16{LLT::scalar(16)};
	auto MIBTrunc = B.buildTrunc(s8, Copies[0]);			auto MIBTrunc = B.buildTrunc(s8, Copies[0]);
	unsigned CarryReg = MRI->createGenericVirtualRegister(LLT::scalar(1));			unsigned CarryReg = MRI->createGenericVirtualRegister(LLT::scalar(1));
	auto MIBUSUBO =			auto MIBUSUBO =
	B.buildInstr(TargetOpcode::G_USUBO, {s8, CarryReg}, {MIBTrunc, MIBTrunc});			B.buildInstr(TargetOpcode::G_USUBO, {s8, CarryReg}, {MIBTrunc, MIBTrunc});
	Show All 21 Lines

This is an archive of the discontinued LLVM Phabricator instance.

GlobalISel: Allow bitcount ops to have different result type (Closed, Public)

Details

Diff Detail

Event Timeline

Revision Contents

Diff 183554

include/llvm/CodeGen/GlobalISel/LegalizerHelper.h

include/llvm/Target/GenericOpcodes.td

lib/CodeGen/GlobalISel/LegalizerHelper.cpp

lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp

lib/Target/ARM/ARMLegalizerInfo.cpp

test/CodeGen/AArch64/GlobalISel/legalizer-info-validation.mir

test/CodeGen/AMDGPU/GlobalISel/legalize-ctlz-zero-undef.mir

test/CodeGen/AMDGPU/GlobalISel/legalize-ctlz.mir

test/CodeGen/AMDGPU/GlobalISel/legalize-ctpop.mir

test/CodeGen/AMDGPU/GlobalISel/legalize-cttz-zero-undef.mir

test/CodeGen/AMDGPU/GlobalISel/legalize-cttz.mir

unittests/CodeGen/GlobalISel/LegalizerHelperTest.cpp

GlobalISel: Allow bitcount ops to have different result type
Closed, Public