Index: lib/Target/AMDGPU/AsmParser/AMDGPUAsmParser.cpp =================================================================== --- lib/Target/AMDGPU/AsmParser/AMDGPUAsmParser.cpp +++ lib/Target/AMDGPU/AsmParser/AMDGPUAsmParser.cpp @@ -128,7 +128,9 @@ ImmTyDppRowMask, ImmTyDppBankMask, ImmTyDppBoundCtrl, - ImmTySdwaSel, + ImmTySdwaDstSel, + ImmTySdwaSrc0Sel, + ImmTySdwaSrc1Sel, ImmTySdwaDstUnused, ImmTyDMask, ImmTyUNorm, @@ -320,8 +322,16 @@ return isImmTy(ImmTyDppBoundCtrl); } - bool isSDWASel() const { - return isImmTy(ImmTySdwaSel); + bool isSDWADstSel() const { + return isImmTy(ImmTySdwaDstSel); + } + + bool isSDWASrc0Sel() const { + return isImmTy(ImmTySdwaSrc0Sel); + } + + bool isSDWASrc1Sel() const { + return isImmTy(ImmTySdwaSrc1Sel); } bool isSDWADstUnused() const { @@ -431,7 +441,9 @@ case ImmTyDppRowMask: OS << "DppRowMask"; break; case ImmTyDppBankMask: OS << "DppBankMask"; break; case ImmTyDppBoundCtrl: OS << "DppBoundCtrl"; break; - case ImmTySdwaSel: OS << "SdwaSel"; break; + case ImmTySdwaDstSel: OS << "SdwaDstSel"; break; + case ImmTySdwaSrc0Sel: OS << "SdwaSrc0Sel"; break; + case ImmTySdwaSrc1Sel: OS << "SdwaSrc1Sel"; break; case ImmTySdwaDstUnused: OS << "SdwaDstUnused"; break; case ImmTyDMask: OS << "DMask"; break; case ImmTyUNorm: OS << "UNorm"; break; @@ -525,6 +537,8 @@ MCAsmParser &Parser; unsigned ForcedEncodingSize; + bool ForcedDPP; + bool ForcedSDWA; bool isSI() const { return AMDGPU::isSI(getSTI()); @@ -577,7 +591,9 @@ const MCInstrInfo &MII, const MCTargetOptions &Options) : MCTargetAsmParser(Options, STI), MII(MII), Parser(_Parser), - ForcedEncodingSize(0) { + ForcedEncodingSize(0), + ForcedDPP(false), + ForcedSDWA(false) { MCAsmParserExtension::Initialize(Parser); if (getSTI().getFeatureBits().none()) { @@ -592,18 +608,15 @@ MCTargetStreamer &TS = *getParser().getStreamer().getTargetStreamer(); return static_cast(TS); } + + void setForcedEncodingSize(unsigned Size) { ForcedEncodingSize = Size; } + void setForcedDPP(bool ForceDPP_) { ForcedDPP = ForceDPP_; } + void setForcedSDWA(bool ForceSDWA_) { ForcedSDWA = ForceSDWA_; } - unsigned getForcedEncodingSize() const { - return ForcedEncodingSize; - } - - void setForcedEncodingSize(unsigned Size) { - ForcedEncodingSize = Size; - } - - bool isForcedVOP3() const { - return ForcedEncodingSize == 64; - } + unsigned getForcedEncodingSize() const { return ForcedEncodingSize; } + bool isForcedVOP3() const { return ForcedEncodingSize == 64; } + bool isForcedDPP() const { return ForcedDPP; } + bool isForcedSDWA() const { return ForcedSDWA; } std::unique_ptr parseRegister(); bool ParseRegister(unsigned &RegNo, SMLoc &StartLoc, SMLoc &EndLoc) override; @@ -616,6 +629,7 @@ bool MatchingInlineAsm) override; bool ParseDirective(AsmToken DirectiveID) override; OperandMatchResultTy parseOperand(OperandVector &Operands, StringRef Mnemonic); + void parseMnemonicSuffix(StringRef& Name); bool ParseInstruction(ParseInstructionInfo &Info, StringRef Name, SMLoc NameLoc, OperandVector &Operands) override; @@ -626,7 +640,7 @@ bool (*ConvertResult)(int64_t&) = 0); OperandMatchResultTy parseNamedBit(const char *Name, OperandVector &Operands, enum AMDGPUOperand::ImmTy ImmTy = AMDGPUOperand::ImmTyNone); - OperandMatchResultTy parseStringWithPrefix(const char *Prefix, StringRef &Value); + OperandMatchResultTy parseStringWithPrefix(StringRef Prefix, StringRef &Value); OperandMatchResultTy parseImm(OperandVector &Operands); OperandMatchResultTy parseRegOrImm(OperandVector &Operands); @@ -690,10 +704,20 @@ AMDGPUOperand::Ptr defaultBoundCtrl() const; void cvtDPP(MCInst &Inst, const OperandVector &Operands); - OperandMatchResultTy parseSDWASel(OperandVector &Operands); + OperandMatchResultTy parseSDWASel(OperandVector &Operands, StringRef Prefix, + enum AMDGPUOperand::ImmTy Type); OperandMatchResultTy parseSDWADstUnused(OperandVector &Operands); - AMDGPUOperand::Ptr defaultSDWASel() const; + AMDGPUOperand::Ptr defaultSDWASel(enum AMDGPUOperand::ImmTy Type) const; + AMDGPUOperand::Ptr defaultSDWADstSel() const; + AMDGPUOperand::Ptr defaultSDWASrc0Sel() const; + AMDGPUOperand::Ptr defaultSDWASrc1Sel() const; AMDGPUOperand::Ptr defaultSDWADstUnused() const; + void cvtSdwaVop1_mod(MCInst &Inst, const OperandVector &Operands); + void cvtSdwaVop1_nomod(MCInst &Inst, const OperandVector &Operands); + void cvtSdwaVop2_mod(MCInst &Inst, const OperandVector &Operands); + void cvtSdwaVop2_nomod(MCInst &Inst, const OperandVector &Operands); + void cvtSDWA(MCInst &Inst, const OperandVector &Operands, bool HasMods, + bool IsVOP1); }; struct OptionalOperand { @@ -1031,7 +1055,9 @@ uint64_t TSFlags = MII.get(Inst.getOpcode()).TSFlags; if ((getForcedEncodingSize() == 32 && (TSFlags & SIInstrFlags::VOP3)) || - (getForcedEncodingSize() == 64 && !(TSFlags & SIInstrFlags::VOP3))) + (getForcedEncodingSize() == 64 && !(TSFlags & SIInstrFlags::VOP3)) || + (isForcedDPP() && !(TSFlags & SIInstrFlags::DPP)) || + (isForcedSDWA() && !(TSFlags & SIInstrFlags::SDWA)) ) return Match_InvalidOperand; if ((TSFlags & SIInstrFlags::VOP3) && @@ -1366,25 +1392,34 @@ return MatchOperand_NoMatch; } -bool AMDGPUAsmParser::ParseInstruction(ParseInstructionInfo &Info, - StringRef Name, - SMLoc NameLoc, OperandVector &Operands) { - +void AMDGPUAsmParser::parseMnemonicSuffix(StringRef& Name) { // Clear any forced encodings from the previous instruction. setForcedEncodingSize(0); + setForcedDPP(false); + setForcedSDWA(false); - if (Name.endswith("_e64")) + if (Name.endswith("_e64")) { setForcedEncodingSize(64); - else if (Name.endswith("_e32")) + Name = Name.substr(0, Name.size() - 4); + } else if (Name.endswith("_e32")) { setForcedEncodingSize(32); + Name = Name.substr(0, Name.size() - 4); + } else if (Name.endswith("_dpp")) { + setForcedDPP(true); + Name = Name.substr(0, Name.size() - 4); + } else if (Name.endswith("_sdwa")) { + setForcedSDWA(true); + Name = Name.substr(0, Name.size() - 5); + } +} +bool AMDGPUAsmParser::ParseInstruction(ParseInstructionInfo &Info, + StringRef Name, + SMLoc NameLoc, OperandVector &Operands) { // Add the instruction mnemonic + parseMnemonicSuffix(Name); Operands.push_back(AMDGPUOperand::CreateToken(Name, NameLoc)); - - - if (Name.endswith("_e64")) { Name = Name.substr(0, Name.size() - 4); } - if (Name.endswith("_e32")) { Name = Name.substr(0, Name.size() - 4); } - + while (!getLexer().is(AsmToken::EndOfStatement)) { AMDGPUAsmParser::OperandMatchResultTy Res = parseOperand(Operands, Name); @@ -1509,7 +1544,7 @@ } AMDGPUAsmParser::OperandMatchResultTy -AMDGPUAsmParser::parseStringWithPrefix(const char *Prefix, StringRef &Value) { +AMDGPUAsmParser::parseStringWithPrefix(StringRef Prefix, StringRef &Value) { if (getLexer().isNot(AsmToken::Identifier)) { return MatchOperand_NoMatch; } @@ -2240,7 +2275,9 @@ {"row_mask", AMDGPUOperand::ImmTyDppRowMask, false, nullptr}, {"bank_mask", AMDGPUOperand::ImmTyDppBankMask, false, nullptr}, {"bound_ctrl", AMDGPUOperand::ImmTyDppBoundCtrl, false, ConvertBoundCtrl}, - {"sdwa_sel", AMDGPUOperand::ImmTySdwaSel, false, nullptr}, + {"dst_sel", AMDGPUOperand::ImmTySdwaDstSel, false, nullptr}, + {"src0_sel", AMDGPUOperand::ImmTySdwaSrc0Sel, false, nullptr}, + {"src1_sel", AMDGPUOperand::ImmTySdwaSrc1Sel, false, nullptr}, {"dst_unused", AMDGPUOperand::ImmTySdwaDstUnused, false, nullptr}, }; @@ -2252,8 +2289,10 @@ res = parseNamedBit(Op.Name, Operands, Op.Type); } else if (Op.Type == AMDGPUOperand::ImmTyOModSI) { res = parseOModOperand(Operands); - } else if (Op.Type == AMDGPUOperand::ImmTySdwaSel) { - res = parseSDWASel(Operands); + } else if (Op.Type == AMDGPUOperand::ImmTySdwaDstSel || + Op.Type == AMDGPUOperand::ImmTySdwaSrc0Sel || + Op.Type == AMDGPUOperand::ImmTySdwaSrc1Sel) { + res = parseSDWASel(Operands, Op.Name, Op.Type); } else if (Op.Type == AMDGPUOperand::ImmTySdwaDstUnused) { res = parseSDWADstUnused(Operands); } else { @@ -2501,7 +2540,6 @@ } } - // ToDo: fix default values for row_mask and bank_mask addOptionalImmOperand(Inst, Operands, OptionalIdx, AMDGPUOperand::ImmTyDppRowMask, 0xf); addOptionalImmOperand(Inst, Operands, OptionalIdx, AMDGPUOperand::ImmTyDppBankMask, 0xf); addOptionalImmOperand(Inst, Operands, OptionalIdx, AMDGPUOperand::ImmTyDppBoundCtrl); @@ -2512,24 +2550,15 @@ //===----------------------------------------------------------------------===// AMDGPUAsmParser::OperandMatchResultTy -AMDGPUAsmParser::parseSDWASel(OperandVector &Operands) { +AMDGPUAsmParser::parseSDWASel(OperandVector &Operands, StringRef Prefix, + enum AMDGPUOperand::ImmTy Type) { SMLoc S = Parser.getTok().getLoc(); StringRef Value; AMDGPUAsmParser::OperandMatchResultTy res; - res = parseStringWithPrefix("dst_sel", Value); - if (res == MatchOperand_ParseFail) { - return MatchOperand_ParseFail; - } else if (res == MatchOperand_NoMatch) { - res = parseStringWithPrefix("src0_sel", Value); - if (res == MatchOperand_ParseFail) { - return MatchOperand_ParseFail; - } else if (res == MatchOperand_NoMatch) { - res = parseStringWithPrefix("src1_sel", Value); - if (res != MatchOperand_Success) { - return res; - } - } + res = parseStringWithPrefix(Prefix, Value); + if (res != MatchOperand_Success) { + return res; } int64_t Int; @@ -2548,8 +2577,7 @@ return MatchOperand_ParseFail; } - Operands.push_back(AMDGPUOperand::CreateImm(Int, S, - AMDGPUOperand::ImmTySdwaSel)); + Operands.push_back(AMDGPUOperand::CreateImm(Int, S, Type)); return MatchOperand_Success; } @@ -2581,14 +2609,82 @@ return MatchOperand_Success; } -AMDGPUOperand::Ptr AMDGPUAsmParser::defaultSDWASel() const { - return AMDGPUOperand::CreateImm(6, SMLoc(), AMDGPUOperand::ImmTySdwaSel); +AMDGPUOperand::Ptr AMDGPUAsmParser::defaultSDWASel(enum AMDGPUOperand::ImmTy Type) const { + return AMDGPUOperand::CreateImm(6, SMLoc(), Type); +} + +AMDGPUOperand::Ptr AMDGPUAsmParser::defaultSDWADstSel() const { + return defaultSDWASel(AMDGPUOperand::ImmTySdwaDstSel); +} + +AMDGPUOperand::Ptr AMDGPUAsmParser::defaultSDWASrc0Sel() const { + return defaultSDWASel(AMDGPUOperand::ImmTySdwaSrc0Sel); +} + +AMDGPUOperand::Ptr AMDGPUAsmParser::defaultSDWASrc1Sel() const { + return defaultSDWASel(AMDGPUOperand::ImmTySdwaSrc1Sel); } AMDGPUOperand::Ptr AMDGPUAsmParser::defaultSDWADstUnused() const { return AMDGPUOperand::CreateImm(0, SMLoc(), AMDGPUOperand::ImmTySdwaDstUnused); } +void AMDGPUAsmParser::cvtSdwaVop1_mod(MCInst &Inst, const OperandVector &Operands) { + cvtSDWA(Inst, Operands, true, true); +} + +void AMDGPUAsmParser::cvtSdwaVop1_nomod(MCInst &Inst, const OperandVector &Operands) { + cvtSDWA(Inst, Operands, false, true); +} + +void AMDGPUAsmParser::cvtSdwaVop2_mod(MCInst &Inst, const OperandVector &Operands) { + cvtSDWA(Inst, Operands, true, false); +} + +void AMDGPUAsmParser::cvtSdwaVop2_nomod(MCInst &Inst, const OperandVector &Operands) { + cvtSDWA(Inst, Operands, false, false); +} + +void AMDGPUAsmParser::cvtSDWA(MCInst &Inst, const OperandVector &Operands, + bool HasMods, bool IsVOP1) { + OptionalImmIndexMap OptionalIdx; + + unsigned I = 1; + const MCInstrDesc &Desc = MII.get(Inst.getOpcode()); + for (unsigned J = 0; J < Desc.getNumDefs(); ++J) { + ((AMDGPUOperand &)*Operands[I++]).addRegOperands(Inst, 1); + } + + for (unsigned E = Operands.size(); I != E; ++I) { + AMDGPUOperand &Op = ((AMDGPUOperand &)*Operands[I]); + // Add the register arguments + if (!HasMods && Op.isReg()) { + Op.addRegOperands(Inst, 1); + } else if (HasMods && Op.isRegOrImmWithInputMods()) { + Op.addRegOrImmWithInputModsOperands(Inst, 2); + } else if (Op.isImm()) { + // Handle optional arguments + OptionalIdx[Op.getImmTy()] = I; + } else { + llvm_unreachable("Invalid operand type"); + } + } + + if (HasMods) { + addOptionalImmOperand(Inst, Operands, OptionalIdx, AMDGPUOperand::ImmTyClampSI, 0); + } + if (IsVOP1 && + Inst.getOpcode() != AMDGPU::V_NOP_sdwa) { // V_NOP_sdwa has no optional sdwa arguments + addOptionalImmOperand(Inst, Operands, OptionalIdx, AMDGPUOperand::ImmTySdwaDstSel, 6); + addOptionalImmOperand(Inst, Operands, OptionalIdx, AMDGPUOperand::ImmTySdwaDstUnused, 2); + addOptionalImmOperand(Inst, Operands, OptionalIdx, AMDGPUOperand::ImmTySdwaSrc0Sel, 6); + } else if (!IsVOP1) { // VOP2 + addOptionalImmOperand(Inst, Operands, OptionalIdx, AMDGPUOperand::ImmTySdwaDstSel, 6); + addOptionalImmOperand(Inst, Operands, OptionalIdx, AMDGPUOperand::ImmTySdwaDstUnused, 2); + addOptionalImmOperand(Inst, Operands, OptionalIdx, AMDGPUOperand::ImmTySdwaSrc0Sel, 6); + addOptionalImmOperand(Inst, Operands, OptionalIdx, AMDGPUOperand::ImmTySdwaSrc1Sel, 6); + } +} /// Force static initialization. extern "C" void LLVMInitializeAMDGPUAsmParser() { Index: lib/Target/AMDGPU/SIInstrInfo.td =================================================================== --- lib/Target/AMDGPU/SIInstrInfo.td +++ lib/Target/AMDGPU/SIInstrInfo.td @@ -489,11 +489,9 @@ let ParserMethod = !if(Optional, "parseOptionalOperand", "parse"#CName); let RenderMethod = "addImmOperands"; let IsOptional = Optional; - let DefaultMethod = "default"#CName; + let DefaultMethod = !if(Optional, "default"#CName, ?); } -def sdwa_sel : NamedMatchClass<"SDWASel">; - class NamedOperandBit : Operand { let PrintMethod = "print"#Name; let ParserMatchClass = MatchClass; @@ -547,9 +545,9 @@ def bank_mask : NamedOperandU32<"BankMask", NamedMatchClass<"BankMask">>; def bound_ctrl : NamedOperandBit<"BoundCtrl", NamedMatchClass<"BoundCtrl">>; -def dst_sel : NamedOperandU32<"SDWADstSel", sdwa_sel>; -def src0_sel : NamedOperandU32<"SDWASrc0Sel", sdwa_sel>; -def src1_sel : NamedOperandU32<"SDWASrc1Sel", sdwa_sel>; +def dst_sel : NamedOperandU32<"SDWADstSel", NamedMatchClass<"SDWADstSel">>; +def src0_sel : NamedOperandU32<"SDWASrc0Sel", NamedMatchClass<"SDWASrc0Sel">>; +def src1_sel : NamedOperandU32<"SDWASrc1Sel", NamedMatchClass<"SDWASrc1Sel">>; def dst_unused : NamedOperandU32<"SDWADstUnused", NamedMatchClass<"SDWADstUnused">>; def hwreg : NamedOperandU16<"Hwreg", NamedMatchClass<"Hwreg", 0>>; @@ -1337,7 +1335,7 @@ " $src1_modifiers,")); string args = !if(!eq(HasModifiers, 0), getAsm32<0, NumSrcArgs, DstVT>.ret, - ", "#src0#src1#", $clamp"); + ", "#src0#src1#"$clamp"); string sdwa = !if(!eq(NumSrcArgs, 0), "", !if(!eq(NumSrcArgs, 1), @@ -1679,7 +1677,7 @@ !if(!eq(p.NumSrcArgs, 1), 0, !if(p.HasModifiers, ?, 0))); bits<3> dst_sel = !if(p.HasDst, ?, 6); - bits<2> dst_unused = !if(p.HasDst, ?, 0); + bits<2> dst_unused = !if(p.HasDst, ?, 2); bits<1> clamp = !if(p.HasModifiers, ?, 0); } @@ -1687,6 +1685,7 @@ VOP1_SDWAe , VOP_SDWA , SDWADisableFields

{ + let AsmMatchConverter = !if(!eq(p.HasModifiers,1), "cvtSdwaVop1_mod", "cvtSdwaVop1_nomod"); let AssemblerPredicates = !if(p.HasExt, [isVI], [DisableInst]); let DecoderNamespace = "SDWA"; let DisableDecoder = DisableVIDecoder; @@ -1760,6 +1759,7 @@ VOP2_SDWAe , VOP_SDWA , SDWADisableFields

{ + let AsmMatchConverter = !if(!eq(p.HasModifiers,1), "cvtSdwaVop2_mod", "cvtSdwaVop2_nomod"); let AssemblerPredicates = !if(p.HasExt, [isVI], [DisableInst]); let DecoderNamespace = "SDWA"; let DisableDecoder = DisableVIDecoder; Index: test/MC/AMDGPU/vop_sdwa.s =================================================================== --- test/MC/AMDGPU/vop_sdwa.s +++ test/MC/AMDGPU/vop_sdwa.s @@ -38,3 +38,15 @@ // NOSICI: error: // VI: v_min_u32_sdwa v1, v1, v1 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:BYTE_0 src1_sel:DWORD ; encoding: [0xf9,0x02,0x02,0x1c,0x01,0x06,0x00,0x06] v_min_u32 v1, v1, v1 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:BYTE_0 src1_sel:DWORD + +// NOSICI: error: +// VI: v_mov_b32_sdwa v0, v0 dst_sel:BYTE_0 dst_unused:UNUSED_PRESERVE src0_sel:DWORD ; encoding: [0xf9,0x02,0x00,0x7e,0x00,0x10,0x06,0x06] +v_mov_b32 v0, v0 dst_sel:BYTE_0 src0_sel:DWORD + +// NOSICI: error: +// VI: v_mov_b32_sdwa v0, v0 dst_sel:DWORD dst_unused:UNUSED_PRESERVE src0_sel:DWORD ; encoding: [0xf9,0x02,0x00,0x7e,0x00,0x16,0x06,0x06] +v_mov_b32 v0, v0 src0_sel:DWORD + +// NOSICI: error: +// VI: v_mov_b32_sdwa v0, v0 dst_sel:DWORD dst_unused:UNUSED_PRESERVE src0_sel:DWORD ; encoding: [0xf9,0x02,0x00,0x7e,0x00,0x16,0x06,0x06] +v_mov_b32_sdwa v0, v0