Index: llvm/trunk/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp =================================================================== --- llvm/trunk/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp +++ llvm/trunk/lib/Target/AMDGPU/AMDGPULegalizerInfo.cpp @@ -39,6 +39,7 @@ const LLT S32 = LLT::scalar(32); const LLT S64 = LLT::scalar(64); + const LLT S512 = LLT::scalar(512); const LLT GlobalPtr = GetAddrSpacePtr(AMDGPUAS::GLOBAL_ADDRESS); const LLT ConstantPtr = GetAddrSpacePtr(AMDGPUAS::CONSTANT_ADDRESS); @@ -70,9 +71,16 @@ getActionDefinitionsBuilder(G_FCONSTANT) .legalFor({S32, S64}); + + // G_IMPLICIT_DEF is a no-op so we can make it legal for any value type that + // can fit in a register. + // FIXME: We need to legalize several more operations before we can add + // a test case for size > 512. getActionDefinitionsBuilder(G_IMPLICIT_DEF) - .legalFor({S1, S32, S64, - GlobalPtr, ConstantPtr, LocalPtr, FlatPtr, PrivatePtr}); + .legalIf([=](const LegalityQuery &Query) { + return Query.Types[0].getSizeInBits() <= 512; + }) + .clampScalar(0, S1, S512); getActionDefinitionsBuilder(G_CONSTANT) .legalFor({S1, S32, S64}); Index: llvm/trunk/test/CodeGen/AMDGPU/GlobalISel/legalize-implicit-def.mir =================================================================== --- llvm/trunk/test/CodeGen/AMDGPU/GlobalISel/legalize-implicit-def.mir +++ llvm/trunk/test/CodeGen/AMDGPU/GlobalISel/legalize-implicit-def.mir @@ -0,0 +1,20 @@ +# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py +# RUN: llc -mtriple=amdgcn-mesa-mesa3d -run-pass=legalizer %s -o - | FileCheck %s + +# FIXME: Need to add test for IMPLICIT_DEF > 512 once all the operations used +# to legalize IMPLICIT_DEF are legal. 
+ +--- +name: test_implicit_def +body: | + bb.0: + liveins: $vgpr0, $vgpr1 + + ; CHECK-LABEL: name: test_implicit_def + ; CHECK: [[DEF:%[0-9]+]]:_(s448) = G_IMPLICIT_DEF + ; CHECK: [[EXTRACT:%[0-9]+]]:_(s32) = G_EXTRACT [[DEF]](s448), 0 + ; CHECK: $vgpr0 = COPY [[EXTRACT]](s32) + %0:_(s448) = G_IMPLICIT_DEF + %1:_(s32) = G_EXTRACT %0, 0 + $vgpr0 = COPY %1 +...