Diff 260886

llvm/lib/Target/AMDGPU/AMDGPUAsmPrinter.cpp

Show First 20 Lines • Show All 1,305 Lines • ▼ Show 20 Lines	bool AMDGPUAsmPrinter::PrintAsmOperand(const MachineInstr *MI, unsigned OpNo,
}		}

// TODO: Should be able to support other operand types like globals.		// TODO: Should be able to support other operand types like globals.
const MachineOperand &MO = MI->getOperand(OpNo);		const MachineOperand &MO = MI->getOperand(OpNo);
if (MO.isReg()) {		if (MO.isReg()) {
AMDGPUInstPrinter::printRegOperand(MO.getReg(), O,		AMDGPUInstPrinter::printRegOperand(MO.getReg(), O,
*MF->getSubtarget().getRegisterInfo());		*MF->getSubtarget().getRegisterInfo());
return false;		return false;
		} else if (MO.isImm()) {
		int64_t Val = MO.getImm();
		if (isInlineAsmConst(Val)) {
		printInlineAsmConst(Val, O);
		return false;
		} else { // A literal
		arsenm [Unsubmitted; Not Done]: No else after return.
		O << Val;
		return false;
		}
}		}

return true;		return true;
}		}

llvm/lib/Target/AMDGPU/MCTargetDesc/AMDGPUInstPrinter.h

Show First 20 Lines • Show All 264 Lines • ▼ Show 20 Lines	public:
void printOperand(const MCInst *MI, unsigned OpNo, raw_ostream &O);		void printOperand(const MCInst *MI, unsigned OpNo, raw_ostream &O);
void printRel(const MCInst *MI, unsigned OpNo, raw_ostream &O);		void printRel(const MCInst *MI, unsigned OpNo, raw_ostream &O);
void printRSel(const MCInst *MI, unsigned OpNo, raw_ostream &O);		void printRSel(const MCInst *MI, unsigned OpNo, raw_ostream &O);
void printUpdateExecMask(const MCInst *MI, unsigned OpNo, raw_ostream &O);		void printUpdateExecMask(const MCInst *MI, unsigned OpNo, raw_ostream &O);
void printUpdatePred(const MCInst *MI, unsigned OpNo, raw_ostream &O);		void printUpdatePred(const MCInst *MI, unsigned OpNo, raw_ostream &O);
void printWrite(const MCInst *MI, unsigned OpNo, raw_ostream &O);		void printWrite(const MCInst *MI, unsigned OpNo, raw_ostream &O);
};		};

		namespace AMDGPU {

		/// Writes \p Imm to \p O in the textual form used for 64-bit inline
		/// constants: integers in [-16, 64] are printed in decimal, and the
		/// recognised double bit patterns (0.0, +-0.5, +-1.0, +-2.0, +-4.0 and
		/// 1/(2*pi)) are printed as floating-point literals. Any other value
		/// produces no output, so callers are expected to pass only values that
		/// were already classified as inline constants.
		void printInlineAsmConst(uint64_t Imm, raw_ostream &O);

		} // End namespace AMDGPU

} // End namespace llvm		} // End namespace llvm

#endif		#endif

llvm/lib/Target/AMDGPU/MCTargetDesc/AMDGPUInstPrinter.cpp

Show First 20 Lines • Show All 433 Lines • ▼ Show 20 Lines	else if (Imm == FloatToBits(-4.0f))
O << "-4.0";		O << "-4.0";
else if (Imm == 0x3e22f983 &&		else if (Imm == 0x3e22f983 &&
STI.getFeatureBits()[AMDGPU::FeatureInv2PiInlineImm])		STI.getFeatureBits()[AMDGPU::FeatureInv2PiInlineImm])
O << "0.15915494";		O << "0.15915494";
else		else
O << formatHex(static_cast<uint64_t>(Imm));		O << formatHex(static_cast<uint64_t>(Imm));
}		}

void AMDGPUInstPrinter::printImmediate64(uint64_t Imm,		static bool printInlineConst64(uint64_t Imm, raw_ostream &O, bool HasInv2Pi) {
const MCSubtargetInfo &STI,
raw_ostream &O) {
int64_t SImm = static_cast<int64_t>(Imm);		int64_t SImm = static_cast<int64_t>(Imm);
if (SImm >= -16 && SImm <= 64) {		if (SImm >= -16 && SImm <= 64) {
O << SImm;		O << SImm;
return;		return true;
}		}

if (Imm == DoubleToBits(0.0))		if (Imm == DoubleToBits(0.0))
O << "0.0";		O << "0.0";
else if (Imm == DoubleToBits(1.0))		else if (Imm == DoubleToBits(1.0))
O << "1.0";		O << "1.0";
else if (Imm == DoubleToBits(-1.0))		else if (Imm == DoubleToBits(-1.0))
O << "-1.0";		O << "-1.0";
else if (Imm == DoubleToBits(0.5))		else if (Imm == DoubleToBits(0.5))
O << "0.5";		O << "0.5";
else if (Imm == DoubleToBits(-0.5))		else if (Imm == DoubleToBits(-0.5))
O << "-0.5";		O << "-0.5";
else if (Imm == DoubleToBits(2.0))		else if (Imm == DoubleToBits(2.0))
O << "2.0";		O << "2.0";
else if (Imm == DoubleToBits(-2.0))		else if (Imm == DoubleToBits(-2.0))
O << "-2.0";		O << "-2.0";
else if (Imm == DoubleToBits(4.0))		else if (Imm == DoubleToBits(4.0))
O << "4.0";		O << "4.0";
else if (Imm == DoubleToBits(-4.0))		else if (Imm == DoubleToBits(-4.0))
O << "-4.0";		O << "-4.0";
else if (Imm == 0x3fc45f306dc9c882 &&		else if (Imm == 0x3fc45f306dc9c882 && HasInv2Pi)
STI.getFeatureBits()[AMDGPU::FeatureInv2PiInlineImm])
O << "0.15915494309189532";		O << "0.15915494309189532";
else {		else {
		return false;
		}
		return true;
		}

		void AMDGPUInstPrinter::printImmediate64(uint64_t Imm,
		const MCSubtargetInfo &STI,
		raw_ostream &O) {
		bool HasInv2Pi = STI.getFeatureBits()[AMDGPU::FeatureInv2PiInlineImm];
		if (!printInlineConst64(Imm, O, HasInv2Pi)) {
assert(isUInt<32>(Imm) \|\| Imm == 0x3fc45f306dc9c882);		assert(isUInt<32>(Imm) \|\| Imm == 0x3fc45f306dc9c882);

// In rare situations, we will have a 32-bit literal in a 64-bit		// In rare situations, we will have a 32-bit literal in a 64-bit
// operand. This is technically allowed for the encoding of s_mov_b64.		// operand. This is technically allowed for the encoding of s_mov_b64.
O << formatHex(static_cast<uint64_t>(Imm));		O << formatHex(static_cast<uint64_t>(Imm));
}		}
}		}

		namespace llvm {
		namespace AMDGPU {

		/// Prints \p Imm to \p O as an inline constant for an inline-asm operand.
		///
		/// The value is formatted by printInlineConst64() with the inv2pi constant
		/// unconditionally enabled. \p Imm must be an inline constant; any other
		/// value would emit nothing and leave a malformed operand in the output,
		/// so that case is diagnosed with an assertion instead of being ignored.
		void printInlineAsmConst(uint64_t Imm, raw_ostream &O) {
		  const bool Printed = printInlineConst64(Imm, O, /*HasInv2Pi=*/true);
		  assert(Printed && "printInlineAsmConst expects an inline constant");
		  (void)Printed; // Silence unused-variable warnings in release builds.
		}

		} // End namespace AMDGPU
		} // End namespace llvm

void AMDGPUInstPrinter::printBLGP(const MCInst *MI, unsigned OpNo,		void AMDGPUInstPrinter::printBLGP(const MCInst *MI, unsigned OpNo,
const MCSubtargetInfo &STI,		const MCSubtargetInfo &STI,
raw_ostream &O) {		raw_ostream &O) {
unsigned Imm = MI->getOperand(OpNo).getImm();		unsigned Imm = MI->getOperand(OpNo).getImm();
if (!Imm)		if (!Imm)
return;		return;

O << " blgp:" << Imm;		O << " blgp:" << Imm;
▲ Show 20 Lines • Show All 1,081 Lines • Show Last 20 Lines

llvm/lib/Target/AMDGPU/SIISelLowering.h

Show First 20 Lines • Show All 377 Lines • ▼ Show 20 Lines	public:
MachineSDNode *wrapAddr64Rsrc(SelectionDAG &DAG, const SDLoc &DL,		MachineSDNode *wrapAddr64Rsrc(SelectionDAG &DAG, const SDLoc &DL,
SDValue Ptr) const;		SDValue Ptr) const;
MachineSDNode *buildRSRC(SelectionDAG &DAG, const SDLoc &DL, SDValue Ptr,		MachineSDNode *buildRSRC(SelectionDAG &DAG, const SDLoc &DL, SDValue Ptr,
uint32_t RsrcDword1, uint64_t RsrcDword2And3) const;		uint32_t RsrcDword1, uint64_t RsrcDword2And3) const;
std::pair<unsigned, const TargetRegisterClass *>		std::pair<unsigned, const TargetRegisterClass *>
getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI,		getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI,
StringRef Constraint, MVT VT) const override;		StringRef Constraint, MVT VT) const override;
ConstraintType getConstraintType(StringRef Constraint) const override;		ConstraintType getConstraintType(StringRef Constraint) const override;
		void LowerAsmOperandForConstraint(SDValue Op,
		std::string &Constraint,
		std::vector<SDValue> &Ops,
		SelectionDAG &DAG) const override;
SDValue copyToM0(SelectionDAG &DAG, SDValue Chain, const SDLoc &DL,		SDValue copyToM0(SelectionDAG &DAG, SDValue Chain, const SDLoc &DL,
SDValue V) const;		SDValue V) const;

void finalizeLowering(MachineFunction &MF) const override;		void finalizeLowering(MachineFunction &MF) const override;

void computeKnownBitsForFrameIndex(const SDValue Op,		void computeKnownBitsForFrameIndex(const SDValue Op,
KnownBits &Known,		KnownBits &Known,
const APInt &DemandedElts,		const APInt &DemandedElts,
▲ Show 20 Lines • Show All 56 Lines • Show Last 20 Lines

llvm/lib/Target/AMDGPU/SIISelLowering.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

	Show First 20 Lines • Show All 10,701 Lines • ▼ Show 20 Lines
	SITargetLowering::getConstraintType(StringRef Constraint) const {			SITargetLowering::getConstraintType(StringRef Constraint) const {
	if (Constraint.size() == 1) {			if (Constraint.size() == 1) {
	switch (Constraint[0]) {			switch (Constraint[0]) {
	default: break;			default: break;
	case 's':			case 's':
	case 'v':			case 'v':
	case 'a':			case 'a':
	return C_RegisterClass;			return C_RegisterClass;
				case 'A':
				return C_Other;
	}			}
	}			}
	return TargetLowering::getConstraintType(Constraint);			return TargetLowering::getConstraintType(Constraint);
	}			}

				void SITargetLowering::LowerAsmOperandForConstraint(SDValue Op,
				std::string &Constraint,
				std::vector<SDValue> &Ops,
				SelectionDAG &DAG) const {
				if (Constraint.length() == 1 && Constraint[0] == 'A') {
				unsigned Size = Op.getValueSizeInBits();
				if (Size > 64)
				return;

				uint64_t Val;
				bool IsConst = false;
				if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op)) {
				Val = C->getSExtValue();
				IsConst = true;
				} else if (ConstantFPSDNode *C = dyn_cast<ConstantFPSDNode>(Op)) {
				Val = C->getValueAPF().bitcastToAPInt().getSExtValue();
				IsConst = true;
				}

				dp (author) [Unsubmitted; Done]: Should we enforce this limitation? GCC seems to allow arbitrary vector size and type provided that all elements are equal and may be inlined.
				arsenm [Unsubmitted; Done]: You mean it also accepts <4 x i8> because it's a 32-bit type?
				dp (author) [Unsubmitted; Done]: I was wrong about GCC 'vectors'. It looks like they are not regular types and are used only for auto-vectorization. Here is the GCC implementation:
				    (define_constraint "A"
				      "Inline immediate parameter"
				      (and (match_code "const_int,const_double,const_vector")
				           (match_test "gcn_inline_constant_p (op)")))
				    ...
				    bool
				    gcn_inline_constant_p (rtx x)
				    {
				      if (GET_CODE (x) == CONST_INT)
				        return INTVAL (x) >= -16 && INTVAL (x) <= 64;
				      if (GET_CODE (x) == CONST_DOUBLE)
				        return gcn_inline_fp_constant_p (x, false);
				      if (GET_CODE (x) == CONST_VECTOR)
				        {
				          int n;
				          if (!vgpr_vector_mode_p (GET_MODE (x)))
				            return false;
				          n = gcn_inline_constant_p (CONST_VECTOR_ELT (x, 0));
				          if (!n)
				            return false;
				          for (int i = 1; i < 64; i++)
				            if (CONST_VECTOR_ELT (x, i) != CONST_VECTOR_ELT (x, 0))
				              return false;
				          return 1;
				        }
				      return false;
				    }
				    ...
				    inline bool
				    vgpr_vector_mode_p (machine_mode mode)
				    {
				      return (mode == V64QImode || mode == V64HImode
				              || mode == V64SImode || mode == V64DImode
				              || mode == V64HFmode || mode == V64SFmode
				              || mode == V64DFmode);
				    }
				if (IsConst) {
				bool HasInv2Pi = Subtarget->hasInv2PiInlineImm();
				if ((Size == 16 && AMDGPU::isInlinableLiteral16(Val, HasInv2Pi)) \|\|
				(Size == 32 && AMDGPU::isInlinableLiteral32(Val, HasInv2Pi)) \|\|
				(Size == 64 && AMDGPU::isInlinableLiteral64(Val, HasInv2Pi))) {
				auto IVal = AMDGPU::createInlineAsmConst(Val, Size);
				arsenm [Unsubmitted; Done]: This should be getZExtValue? It looks like the tests worked correctly here, but I'm not sure why it didn't matter.
				dp (author) [Unsubmitted; Done]: This does not really matter because isInlinableLiteralXX truncates the input value to XX bits before checking. However, getting sign-extended values is useful to easily recognize negative integer constants and get prettier output. Consider this code (actually a corner case):
				    ... asm "v_mov_b32 $0, $1", "=v,A"(half bitcast (i16 -1 to half))
				Currently the code ends up as
				    v_mov_b32 v0, -1
				If we replace getSExtValue with getZExtValue, the result would be
				    v_mov_b32 v0, 0xFFFF
				auto Res = DAG.getTargetConstant(IVal, SDLoc(Op), MVT::i64);
				Ops.push_back(Res);
				}
				}
				} else {
				TargetLowering::LowerAsmOperandForConstraint(Op, Constraint, Ops, DAG);
				}
				}

	// Figure out which registers should be reserved for stack access. Only after			// Figure out which registers should be reserved for stack access. Only after
	// the function is legalized do we know all of the non-spill stack objects or if			// the function is legalized do we know all of the non-spill stack objects or if
	// calls are present.			// calls are present.
	void SITargetLowering::finalizeLowering(MachineFunction &MF) const {			void SITargetLowering::finalizeLowering(MachineFunction &MF) const {
	MachineRegisterInfo &MRI = MF.getRegInfo();			MachineRegisterInfo &MRI = MF.getRegInfo();
	SIMachineFunctionInfo *Info = MF.getInfo<SIMachineFunctionInfo>();			SIMachineFunctionInfo *Info = MF.getInfo<SIMachineFunctionInfo>();
	const GCNSubtarget &ST = MF.getSubtarget<GCNSubtarget>();			const GCNSubtarget &ST = MF.getSubtarget<GCNSubtarget>();
	const SIRegisterInfo *TRI = Subtarget->getRegisterInfo();			const SIRegisterInfo *TRI = Subtarget->getRegisterInfo();
	▲ Show 20 Lines • Show All 358 Lines • Show Last 20 Lines

llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.h

Show First 20 Lines • Show All 763 Lines • ▼ Show 20 Lines	bool isInlineCompatible(SIModeRegisterDefaults CalleeMode) const {
// Allow inlining denormals enabled into denormals flushed functions.		// Allow inlining denormals enabled into denormals flushed functions.
return oneWayCompatible(FP64FP16InputDenormals, CalleeMode.FP64FP16InputDenormals) &&		return oneWayCompatible(FP64FP16InputDenormals, CalleeMode.FP64FP16InputDenormals) &&
oneWayCompatible(FP64FP16OutputDenormals, CalleeMode.FP64FP16OutputDenormals) &&		oneWayCompatible(FP64FP16OutputDenormals, CalleeMode.FP64FP16OutputDenormals) &&
oneWayCompatible(FP32InputDenormals, CalleeMode.FP32InputDenormals) &&		oneWayCompatible(FP32InputDenormals, CalleeMode.FP32InputDenormals) &&
oneWayCompatible(FP32OutputDenormals, CalleeMode.FP32OutputDenormals);		oneWayCompatible(FP32OutputDenormals, CalleeMode.FP32OutputDenormals);
}		}
};		};

		/// Re-encodes the inline constant \p Val, whose original operand width is
		/// \p Size bits (must be 16, 32 or 64), as a 64-bit inline constant.
		/// Integers in [-16, 64] and 64-bit inputs are returned unchanged; the
		/// 16- and 32-bit inv2pi encodings map to the 64-bit inv2pi encoding; any
		/// other 16- or 32-bit value is interpreted as half/single precision and
		/// converted to the bit pattern of the equivalent double.
		LLVM_READNONE
		uint64_t createInlineAsmConst(uint64_t Val, unsigned Size);

		/// Returns true if \p Val is a 64-bit inlinable literal, with the inv2pi
		/// constant always treated as available.
		LLVM_READNONE
		bool isInlineAsmConst(uint64_t Val);

} // end namespace AMDGPU		} // end namespace AMDGPU
} // end namespace llvm		} // end namespace llvm

#endif // LLVM_LIB_TARGET_AMDGPU_UTILS_AMDGPUBASEINFO_H		#endif // LLVM_LIB_TARGET_AMDGPU_UTILS_AMDGPUBASEINFO_H

llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.cpp

//===- AMDGPUBaseInfo.cpp - AMDGPU Base encoding information --------------===//		//===- AMDGPUBaseInfo.cpp - AMDGPU Base encoding information --------------===//
//		//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.		// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.		// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception		// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//		//
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//

#include "AMDGPUBaseInfo.h"		#include "AMDGPUBaseInfo.h"
#include "AMDGPU.h"		#include "AMDGPU.h"
#include "AMDGPUAsmUtils.h"		#include "AMDGPUAsmUtils.h"
#include "AMDGPUTargetTransformInfo.h"		#include "AMDGPUTargetTransformInfo.h"
#include "SIDefines.h"		#include "SIDefines.h"
#include "llvm/ADT/StringRef.h"		#include "llvm/ADT/StringRef.h"
#include "llvm/ADT/Triple.h"		#include "llvm/ADT/Triple.h"
		#include "llvm/ADT/APFloat.h"
#include "llvm/BinaryFormat/ELF.h"		#include "llvm/BinaryFormat/ELF.h"
#include "llvm/CodeGen/MachineMemOperand.h"		#include "llvm/CodeGen/MachineMemOperand.h"
#include "llvm/IR/Attributes.h"		#include "llvm/IR/Attributes.h"
#include "llvm/IR/Constants.h"		#include "llvm/IR/Constants.h"
#include "llvm/IR/Function.h"		#include "llvm/IR/Function.h"
#include "llvm/IR/GlobalValue.h"		#include "llvm/IR/GlobalValue.h"
#include "llvm/IR/Instruction.h"		#include "llvm/IR/Instruction.h"
#include "llvm/IR/IntrinsicsAMDGPU.h"		#include "llvm/IR/IntrinsicsAMDGPU.h"
▲ Show 20 Lines • Show All 1,112 Lines • ▼ Show 20 Lines

unsigned getRegOperandSize(const MCRegisterInfo *MRI, const MCInstrDesc &Desc,		unsigned getRegOperandSize(const MCRegisterInfo *MRI, const MCInstrDesc &Desc,
unsigned OpNo) {		unsigned OpNo) {
assert(OpNo < Desc.NumOperands);		assert(OpNo < Desc.NumOperands);
unsigned RCID = Desc.OpInfo[OpNo].RegClass;		unsigned RCID = Desc.OpInfo[OpNo].RegClass;
return getRegBitWidth(MRI->getRegClass(RCID)) / 8;		return getRegBitWidth(MRI->getRegClass(RCID)) / 8;
}		}

		/// Returns true when \p Literal lies in the closed interval [-16, 64],
		/// the integer range shared by the isInlinableLiteral* checks below.
		static bool isInlinableIntLiteral(int64_t Literal) {
		  const bool BelowRange = Literal < -16;
		  const bool AboveRange = Literal > 64;
		  return !(BelowRange || AboveRange);
		}

bool isInlinableLiteral64(int64_t Literal, bool HasInv2Pi) {		bool isInlinableLiteral64(int64_t Literal, bool HasInv2Pi) {
if (Literal >= -16 && Literal <= 64)		if (isInlinableIntLiteral(Literal))
return true;		return true;

uint64_t Val = static_cast<uint64_t>(Literal);		uint64_t Val = static_cast<uint64_t>(Literal);
return (Val == DoubleToBits(0.0)) \|\|		return (Val == DoubleToBits(0.0)) \|\|
(Val == DoubleToBits(1.0)) \|\|		(Val == DoubleToBits(1.0)) \|\|
(Val == DoubleToBits(-1.0)) \|\|		(Val == DoubleToBits(-1.0)) \|\|
(Val == DoubleToBits(0.5)) \|\|		(Val == DoubleToBits(0.5)) \|\|
(Val == DoubleToBits(-0.5)) \|\|		(Val == DoubleToBits(-0.5)) \|\|
(Val == DoubleToBits(2.0)) \|\|		(Val == DoubleToBits(2.0)) \|\|
(Val == DoubleToBits(-2.0)) \|\|		(Val == DoubleToBits(-2.0)) \|\|
(Val == DoubleToBits(4.0)) \|\|		(Val == DoubleToBits(4.0)) \|\|
(Val == DoubleToBits(-4.0)) \|\|		(Val == DoubleToBits(-4.0)) \|\|
(Val == 0x3fc45f306dc9c882 && HasInv2Pi);		(Val == 0x3fc45f306dc9c882 && HasInv2Pi);
}		}

bool isInlinableLiteral32(int32_t Literal, bool HasInv2Pi) {		bool isInlinableLiteral32(int32_t Literal, bool HasInv2Pi) {
if (Literal >= -16 && Literal <= 64)		if (isInlinableIntLiteral(Literal))
return true;		return true;

// The actual type of the operand does not seem to matter as long		// The actual type of the operand does not seem to matter as long
// as the bits match one of the inline immediate values. For example:		// as the bits match one of the inline immediate values. For example:
//		//
// -nan has the hexadecimal encoding of 0xfffffffe which is -2 in decimal,		// -nan has the hexadecimal encoding of 0xfffffffe which is -2 in decimal,
// so it is a legal inline immediate.		// so it is a legal inline immediate.
//		//
Show All 12 Lines	return (Val == FloatToBits(0.0f)) \|\|
(Val == FloatToBits(-4.0f)) \|\|		(Val == FloatToBits(-4.0f)) \|\|
(Val == 0x3e22f983 && HasInv2Pi);		(Val == 0x3e22f983 && HasInv2Pi);
}		}

bool isInlinableLiteral16(int16_t Literal, bool HasInv2Pi) {		bool isInlinableLiteral16(int16_t Literal, bool HasInv2Pi) {
if (!HasInv2Pi)		if (!HasInv2Pi)
return false;		return false;

if (Literal >= -16 && Literal <= 64)		if (isInlinableIntLiteral(Literal))
return true;		return true;

uint16_t Val = static_cast<uint16_t>(Literal);		uint16_t Val = static_cast<uint16_t>(Literal);
return Val == 0x3C00 \|\| // 1.0		return Val == 0x3C00 \|\| // 1.0
Val == 0xBC00 \|\| // -1.0		Val == 0xBC00 \|\| // -1.0
Val == 0x3800 \|\| // 0.5		Val == 0x3800 \|\| // 0.5
Val == 0xB800 \|\| // -0.5		Val == 0xB800 \|\| // -0.5
Val == 0x4000 \|\| // 2.0		Val == 0x4000 \|\| // 2.0
▲ Show 20 Lines • Show All 205 Lines • ▼ Show 20 Lines
}		}

const GcnBufferFormatInfo *getGcnBufferFormatInfo(uint8_t Format,		const GcnBufferFormatInfo *getGcnBufferFormatInfo(uint8_t Format,
const MCSubtargetInfo &STI) {		const MCSubtargetInfo &STI) {
return isGFX10(STI) ? getGfx10PlusBufferFormatInfo(Format)		return isGFX10(STI) ? getGfx10PlusBufferFormatInfo(Format)
: getGfx9BufferFormatInfo(Format);		: getGfx9BufferFormatInfo(Format);
}		}

		// Convert fp inline constants to 64-bit. f64 has the following advantages:
		// 1) When printed, these constants are valid for any operand type.
		// 2) Encoding of f64 inline constants is different from any 32-bit literal.
		// This may be useful for future extensions.
		uint64_t createInlineAsmConst(uint64_t Val, unsigned Size) {
		assert(Size == 16 \|\| Size == 32 \|\| Size == 64);

		if (isInlinableIntLiteral(Val))
		return Val;

		// Convert inv2pi.
		if ((Size == 16 && Val == 0x3118) \|\|
		(Size == 32 && Val == 0x3e22f983))
		return 0x3fc45f306dc9c882;
		arsenm [Unsubmitted; Done]: Logic doesn't make sense here? Returns the 64-bit value if it's 16 or 32?
		dp (author) [Unsubmitted; Done]: When working on this fix I was under the impression that the types of values passed to inline assembler are not required to match instruction operand types. In other words, I assumed that the following code is legal:
		    "v_mov_b32 $0, $1", "=v,A"(half 0xH3C00) // 1.0h
		I also assumed that this code required a type conversion to end up as "v_mov_b32 ..., 1.0" and not "v_mov_b32 ..., 0x3C00", because in the latter case the constant cannot be encoded as an inline value. That assumption complicated the implementation. Was the assumption incorrect? If the types of values passed to inline assembler are required to match the types of the corresponding assembler operands, the implementation would be much simpler.
		arsenm [Unsubmitted; Not Done]: We have to use a 32-bit instruction to materialize 16-bit values. This should be zero extended. This should end up as v_mov_b32 $0, 0x00003c00. For some cases we don't currently use in codegen (and I'm not sure are supported by the assembler), some 64-bit operands accept 32-bit literals which are zero extended.

		// Convert remaining fp constants.
		if (Size < 64) {
		bool Lost;
		const fltSemantics *FltSemantics =
		(Size == 16) ? &APFloat::IEEEhalf() : &APFloat::IEEEsingle();
		APFloat FPLiteral(*FltSemantics, APInt(Size, Val));
		FPLiteral.convert(APFloat::IEEEdouble(),
		APFloat::rmNearestTiesToEven,
		&Lost);
		return FPLiteral.bitcastToAPInt().getZExtValue();
		}
		arsenm [Unsubmitted; Done]: I wouldn't expect any FP rounding in the assembler.
		dp (author) [Unsubmitted; Done]: See my comments above.

		return Val;
		}

		/// Reports whether \p Val is accepted by isInlinableLiteral64() when the
		/// inv2pi constant is treated as available.
		bool isInlineAsmConst(uint64_t Val) {
		  const bool AssumeInv2Pi = true;
		  return AMDGPU::isInlinableLiteral64(Val, AssumeInv2Pi);
		}

} // namespace AMDGPU		} // namespace AMDGPU
} // namespace llvm		} // namespace llvm

llvm/test/CodeGen/AMDGPU/inline-constraints.ll

	; RUN: llc < %s -march=amdgcn -mcpu=bonaire -verify-machineinstrs \| FileCheck --check-prefix=GCN %s			; RUN: not llc < %s -march=amdgcn -mcpu=bonaire -verify-machineinstrs \| FileCheck --check-prefix=GCN %s
	; RUN: llc < %s -march=amdgcn -mcpu=tonga -verify-machineinstrs \| FileCheck --check-prefix=GCN %s			; RUN: not llc < %s -march=amdgcn -mcpu=tonga -verify-machineinstrs \| FileCheck --check-prefix=GCN --check-prefix=VI %s

				; RUN: not llc < %s -march=amdgcn -mcpu=bonaire -verify-machineinstrs 2>&1 \| FileCheck --check-prefix=NOGCN --check-prefix=NOSI %s
				; RUN: not llc < %s -march=amdgcn -mcpu=tonga -verify-machineinstrs 2>&1 \| FileCheck --check-prefix=NOGCN %s

	; GCN-LABEL: {{^}}inline_reg_constraints:			; GCN-LABEL: {{^}}inline_reg_constraints:
	; GCN: flat_load_dword v{{[0-9]+}}, v[{{[0-9]+:[0-9]+}}]			; GCN: flat_load_dword v{{[0-9]+}}, v[{{[0-9]+:[0-9]+}}]
	; GCN: flat_load_dwordx2 v[{{[0-9]+:[0-9]+}}], v[{{[0-9]+:[0-9]+}}]			; GCN: flat_load_dwordx2 v[{{[0-9]+:[0-9]+}}], v[{{[0-9]+:[0-9]+}}]
	; GCN: flat_load_dwordx2 v[{{[0-9]+:[0-9]+}}], v[{{[0-9]+:[0-9]+}}]			; GCN: flat_load_dwordx2 v[{{[0-9]+:[0-9]+}}], v[{{[0-9]+:[0-9]+}}]
	; GCN: flat_load_dwordx4 v[{{[0-9]+:[0-9]+}}], v[{{[0-9]+:[0-9]+}}]			; GCN: flat_load_dwordx4 v[{{[0-9]+:[0-9]+}}], v[{{[0-9]+:[0-9]+}}]
	; GCN: flat_load_dwordx4 v[{{[0-9]+:[0-9]+}}], v[{{[0-9]+:[0-9]+}}]			; GCN: flat_load_dwordx4 v[{{[0-9]+:[0-9]+}}], v[{{[0-9]+:[0-9]+}}]
	; GCN: s_load_dword s{{[0-9]+}}, s[{{[0-9]+:[0-9]+}}]			; GCN: s_load_dword s{{[0-9]+}}, s[{{[0-9]+:[0-9]+}}]
	▲ Show 20 Lines • Show All 58 Lines • ▼ Show 20 Lines
	; GCN-LABEL: {{^}}inline_sreg_constraint_imm_f64:			; GCN-LABEL: {{^}}inline_sreg_constraint_imm_f64:
	; GCN-DAG: s_mov_b32 s[[REG_LO:[0-9]+]], 0{{$}}			; GCN-DAG: s_mov_b32 s[[REG_LO:[0-9]+]], 0{{$}}
	; GCN-DAG: s_mov_b32 s[[REG_HI:[0-9]+]], 0x3ff00000{{$}}			; GCN-DAG: s_mov_b32 s[[REG_HI:[0-9]+]], 0x3ff00000{{$}}
	; GCN: ; use s{{\[}}[[REG_LO]]:[[REG_HI]]{{\]}}			; GCN: ; use s{{\[}}[[REG_LO]]:[[REG_HI]]{{\]}}
	define amdgpu_kernel void @inline_sreg_constraint_imm_f64() {			define amdgpu_kernel void @inline_sreg_constraint_imm_f64() {
	tail call void asm sideeffect "; use $0", "s"(double 1.0)			tail call void asm sideeffect "; use $0", "s"(double 1.0)
	ret void			ret void
	}			}

				;==============================================================================
				; 'A' constraint, 16-bit operand
				;==============================================================================

				; NOSI: error: invalid operand for inline asm constraint 'A'
				; VI-LABEL: {{^}}inline_A_constraint_H0:
				; VI: v_mov_b32 {{v[0-9]+}}, 64
				define i32 @inline_A_constraint_H0() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i16 64)
				ret i32 %v0
				}

				; NOSI: error: invalid operand for inline asm constraint 'A'
				; VI-LABEL: {{^}}inline_A_constraint_H1:
				; VI: v_mov_b32 {{v[0-9]+}}, -16
				define i32 @inline_A_constraint_H1() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i16 -16)
				ret i32 %v0
				}

				arsenm [Unsubmitted; Not Done]: FP value tests, including the subtarget-dependent inv 2pi one?
				; NOSI: error: invalid operand for inline asm constraint 'A'
				; VI-LABEL: {{^}}inline_A_constraint_H2:
				; VI: v_mov_b32 {{v[0-9]+}}, 1.0
				define i32 @inline_A_constraint_H2() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i16 bitcast (half 1.0 to i16))
				ret i32 %v0
				}

				; NOSI: error: invalid operand for inline asm constraint 'A'
				; VI-LABEL: {{^}}inline_A_constraint_H3:
				; VI: v_mov_b32 {{v[0-9]+}}, -1.0
				define i32 @inline_A_constraint_H3() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i16 bitcast (half -1.0 to i16))
				ret i32 %v0
				}

				; NOSI: error: invalid operand for inline asm constraint 'A'
				; VI-LABEL: {{^}}inline_A_constraint_H4:
				; VI: v_mov_b32 {{v[0-9]+}}, 0.15915494309189532
				define i32 @inline_A_constraint_H4() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(half 0xH3118)
				ret i32 %v0
				}

				; NOSI: error: invalid operand for inline asm constraint 'A'
				; VI-LABEL: {{^}}inline_A_constraint_H5:
				; VI: v_mov_b32 {{v[0-9]+}}, 0.15915494309189532
				define i32 @inline_A_constraint_H5() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i16 bitcast (half 0xH3118 to i16))
				ret i32 %v0
				}

				; NOSI: error: invalid operand for inline asm constraint 'A'
				; VI-LABEL: {{^}}inline_A_constraint_H6:
				; VI: v_mov_b32 {{v[0-9]+}}, -0.5
				define i32 @inline_A_constraint_H6() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(half -0.5)
				ret i32 %v0
				}

				; NOGCN: error: invalid operand for inline asm constraint 'A'
				define i32 @inline_A_constraint_H7() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i16 bitcast (half 0xH3119 to i16))
				ret i32 %v0
				}

				; NOGCN: error: invalid operand for inline asm constraint 'A'
				define i32 @inline_A_constraint_H8() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i16 bitcast (half 0xH3117 to i16))
				ret i32 %v0
				}

				; NOGCN: error: invalid operand for inline asm constraint 'A'
				define i32 @inline_A_constraint_H9() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i16 65)
				ret i32 %v0
				}

				;==============================================================================
				; 'A' constraint, 32-bit operand
				;==============================================================================

				; GCN-LABEL: {{^}}inline_A_constraint_F0:
				; GCN: v_mov_b32 {{v[0-9]+}}, -16
				define i32 @inline_A_constraint_F0() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i32 -16)
				ret i32 %v0
				}

				; GCN-LABEL: {{^}}inline_A_constraint_F1:
				; GCN: v_mov_b32 {{v[0-9]+}}, 1
				define i32 @inline_A_constraint_F1() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i32 1)
				ret i32 %v0
				}

				; GCN-LABEL: {{^}}inline_A_constraint_F2:
				; GCN: v_mov_b32 {{v[0-9]+}}, -0.5
				define i32 @inline_A_constraint_F2() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i32 bitcast (float -0.5 to i32))
				ret i32 %v0
				}

				; GCN-LABEL: {{^}}inline_A_constraint_F3:
				; GCN: v_mov_b32 {{v[0-9]+}}, 2.0
				define i32 @inline_A_constraint_F3() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i32 bitcast (float 2.0 to i32))
				ret i32 %v0
				}

				; GCN-LABEL: {{^}}inline_A_constraint_F4:
				; GCN: v_mov_b32 {{v[0-9]+}}, -4.0
				define i32 @inline_A_constraint_F4() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(float -4.0)
				ret i32 %v0
				}

				; NOSI: error: invalid operand for inline asm constraint 'A'
				; VI-LABEL: {{^}}inline_A_constraint_F5:
				; VI: v_mov_b32 {{v[0-9]+}}, 0.15915494309189532
				define i32 @inline_A_constraint_F5() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i32 1042479491)
				ret i32 %v0
				}

				; GCN-LABEL: {{^}}inline_A_constraint_F6:
				; GCN: v_mov_b32 {{v[0-9]+}}, 0.5
				define i32 @inline_A_constraint_F6() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(float 0.5)
				ret i32 %v0
				}

				; NOGCN: error: invalid operand for inline asm constraint 'A'
				define i32 @inline_A_constraint_F7() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i32 1042479490)
				ret i32 %v0
				}

				; NOGCN: error: invalid operand for inline asm constraint 'A'
				define i32 @inline_A_constraint_F8() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i32 -17)
				ret i32 %v0
				}

				;==============================================================================
				; 'A' constraint, 64-bit operand
				;==============================================================================

				; GCN-LABEL: {{^}}inline_A_constraint_D0:
				; GCN: v_mov_b32 {{v[0-9]+}}, -16
				define i32 @inline_A_constraint_D0() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i64 -16)
				ret i32 %v0
				}

				; GCN-LABEL: {{^}}inline_A_constraint_D1:
				; GCN: v_mov_b32 {{v[0-9]+}}, -2.0
				define i32 @inline_A_constraint_D1() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i64 bitcast (double -2.0 to i64))
				ret i32 %v0
				}

				; GCN-LABEL: {{^}}inline_A_constraint_D2:
				; GCN: v_mov_b32 {{v[0-9]+}}, 0.5
				define i32 @inline_A_constraint_D2() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(double 0.5)
				ret i32 %v0
				}

				; NOSI: error: invalid operand for inline asm constraint 'A'
				; VI-LABEL: {{^}}inline_A_constraint_D3:
				; VI: v_mov_b32 {{v[0-9]+}}, 0.15915494309189532
				define i32 @inline_A_constraint_D3() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(double 0.15915494309189532)
				ret i32 %v0
				}

				; NOSI: error: invalid operand for inline asm constraint 'A'
				; VI-LABEL: {{^}}inline_A_constraint_D4:
				; VI: v_mov_b32 {{v[0-9]+}}, 0.15915494309189532
				define i32 @inline_A_constraint_D4() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i64 bitcast (double 0.15915494309189532 to i64))
				ret i32 %v0
				}

				; GCN-LABEL: {{^}}inline_A_constraint_D5:
				; GCN: v_mov_b32 {{v[0-9]+}}, -2.0
				define i32 @inline_A_constraint_D5() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(double -2.0)
				ret i32 %v0
				}

				; NOGCN: error: invalid operand for inline asm constraint 'A'
				define i32 @inline_A_constraint_D8() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(double 1.1)
				ret i32 %v0
				}

				; NOGCN: error: invalid operand for inline asm constraint 'A'
				define i32 @inline_A_constraint_D9() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i64 bitcast (double 0.1 to i64))
				ret i32 %v0
				}

				;==============================================================================
				; 'A' constraint, type errors
				;==============================================================================

				; NOGCN: error: invalid operand for inline asm constraint 'A'
				define i32 @inline_A_constraint_E1(i32 %x) {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i32 %x)
				ret i32 %v0
				}

				; NOGCN: error: invalid operand for inline asm constraint 'A'
				define i32 @inline_A_constraint_E2() {
				%v0 = tail call i32 asm "v_mov_b32 $0, $1", "=v,A"(i128 100000000000000000000)
				ret i32 %v0
				}
				arsenm [Unsubmitted; Not Done]: Can you also add some tests for packed <2 x i16>/<2 x half> operands?

This is an archive of the discontinued LLVM Phabricator instance.

[AMDGPU][CODEGEN] Added 'A' constraint for inline assembler
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 260886

llvm/lib/Target/AMDGPU/AMDGPUAsmPrinter.cpp

llvm/lib/Target/AMDGPU/MCTargetDesc/AMDGPUInstPrinter.h

llvm/lib/Target/AMDGPU/MCTargetDesc/AMDGPUInstPrinter.cpp

llvm/lib/Target/AMDGPU/SIISelLowering.h

llvm/lib/Target/AMDGPU/SIISelLowering.cpp

llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.h

llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.cpp

llvm/test/CodeGen/AMDGPU/inline-constraints.ll

This is an archive of the discontinued LLVM Phabricator instance.

[AMDGPU][CODEGEN] Added 'A' constraint for inline assemblerClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 260886

llvm/lib/Target/AMDGPU/AMDGPUAsmPrinter.cpp

llvm/lib/Target/AMDGPU/MCTargetDesc/AMDGPUInstPrinter.h

llvm/lib/Target/AMDGPU/MCTargetDesc/AMDGPUInstPrinter.cpp

llvm/lib/Target/AMDGPU/SIISelLowering.h

llvm/lib/Target/AMDGPU/SIISelLowering.cpp

llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.h

llvm/lib/Target/AMDGPU/Utils/AMDGPUBaseInfo.cpp

llvm/test/CodeGen/AMDGPU/inline-constraints.ll

[AMDGPU][CODEGEN] Added 'A' constraint for inline assembler
ClosedPublic