Diff 477896

llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 1,131 Lines • ▼ Show 20 Lines	bool TargetLowering::SimplifyDemandedBits(
case ISD::SCALAR_TO_VECTOR: {		case ISD::SCALAR_TO_VECTOR: {
if (!DemandedElts[0])		if (!DemandedElts[0])
return TLO.CombineTo(Op, TLO.DAG.getUNDEF(VT));		return TLO.CombineTo(Op, TLO.DAG.getUNDEF(VT));

KnownBits SrcKnown;		KnownBits SrcKnown;
SDValue Src = Op.getOperand(0);		SDValue Src = Op.getOperand(0);
unsigned SrcBitWidth = Src.getScalarValueSizeInBits();		unsigned SrcBitWidth = Src.getScalarValueSizeInBits();
APInt SrcDemandedBits = DemandedBits.zext(SrcBitWidth);		APInt SrcDemandedBits = DemandedBits.zext(SrcBitWidth);
if (SimplifyDemandedBits(Src, SrcDemandedBits, SrcKnown, TLO, Depth + 1))		if (SimplifyDemandedBits(Src, SrcDemandedBits, SrcKnown, TLO, Depth + 1))
		dmgreenUnsubmitted Not Done Reply Inline Actions Could this just construct the known bits of both sides and use KnownBits::mul? It might be able to get value out of the low bits then too. dmgreen: Could this just construct the known bits of both sides and use KnownBits::mul? It might be able…
		benmxwl-armAuthorUnsubmitted Done Reply Inline Actions Please correct me if I've made a silly mistake here, but it does not seem to be exactly KnownBits::mul: Optional<unsigned> MaxVScale = Attr.getVScaleRangeMax(); if (!MaxVScale.has_value()) return false; if (auto MulImm = dyn_cast<ConstantSDNode>(Op.getOperand(0))) { unsigned RequiredBits = Log2_64(MaxVScale) + 1; if (RequiredBits >= BitWidth) return false; Known.Zero.setHighBits(BitWidth - RequiredBits); Known = KnownBits::mul(Known, KnownBits::makeConstant(MulImm->getAPIntValue())); } return false; If the MaxVScale is 16 (5 bits), the known zero bits are everything above Log2(16 * Mul) + 1. The above snippet seems to end up with Log2((2^5 - 1) * Mul) + 1 (which is off by 1 bit). Also, it seems that KnownBits::mul can't handle negative multipliers and always reports no known bits in that case. benmxwl-arm: Please correct me if I've made a silly mistake here, but it does not seem to be exactly…
		dmgreenUnsubmitted Not Done Reply Inline Actions Ah - I was worried about that - because it works on bits and not ranges, the results are not as exact as they could otherwise be. I was also considering the vscale turning into a shift, but that may be SVE specific. dmgreen: Ah - I was worried about that - because it works on bits and not ranges, the results are not as…
return true;		return true;

// Upper elements are undef, so only get the knownbits if we just demand		// Upper elements are undef, so only get the knownbits if we just demand
// the bottom element.		// the bottom element.
if (DemandedElts == 1)		if (DemandedElts == 1)
Known = SrcKnown.anyextOrTrunc(BitWidth);		Known = SrcKnown.anyextOrTrunc(BitWidth);
break;		break;
		dmgreenUnsubmitted Done Reply Inline Actions The `Negative =` needn't be part of the if. dmgreen: The `Negative =` needn't be part of the if.
}		}
case ISD::BUILD_VECTOR:		case ISD::BUILD_VECTOR:
// Collect the known bits that are shared by every demanded element.		// Collect the known bits that are shared by every demanded element.
// TODO: Call SimplifyDemandedBits for non-constant demanded elements.		// TODO: Call SimplifyDemandedBits for non-constant demanded elements.
Known = TLO.DAG.computeKnownBits(Op, DemandedElts, Depth);		Known = TLO.DAG.computeKnownBits(Op, DemandedElts, Depth);
return false; // Don't fall through, will infinitely loop.		return false; // Don't fall through, will infinitely loop.
case ISD::LOAD: {		case ISD::LOAD: {
auto *LD = cast<LoadSDNode>(Op);		auto *LD = cast<LoadSDNode>(Op);
▲ Show 20 Lines • Show All 1,516 Lines • ▼ Show 20 Lines	if (isOperationLegalOrCustom(ISD::SHL, VT)) {
if (unsigned ShAmt = getShiftLeftAmt(Op1))		if (unsigned ShAmt = getShiftLeftAmt(Op1))
return foldMul(ISD::ADD, Op1.getOperand(0), Op0, ShAmt);		return foldMul(ISD::ADD, Op1.getOperand(0), Op0, ShAmt);
}		}
}		}

[[fallthrough]];		[[fallthrough]];
}		}
default:		default:
if (Op.getOpcode() >= ISD::BUILTIN_OP_END) {		// We also ask the target about intrinsics (which could be specific to it).
		if (Op.getOpcode() >= ISD::BUILTIN_OP_END \|\|
		Op.getOpcode() == ISD::INTRINSIC_WO_CHAIN) {
if (SimplifyDemandedBitsForTargetNode(Op, DemandedBits, DemandedElts,		if (SimplifyDemandedBitsForTargetNode(Op, DemandedBits, DemandedElts,
Known, TLO, Depth))		Known, TLO, Depth))
return true;		return true;
break;		break;
}		}

// Just use computeKnownBits to compute output bits.		// Just use computeKnownBits to compute output bits.
Known = TLO.DAG.computeKnownBits(Op, DemandedElts, Depth);		Known = TLO.DAG.computeKnownBits(Op, DemandedElts, Depth);
▲ Show 20 Lines • Show All 7,503 Lines • Show Last 20 Lines

llvm/lib/Target/AArch64/AArch64ISelLowering.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 86 Lines • ▼ Show 20 Lines
#include <algorithm>		#include <algorithm>
#include <bitset>		#include <bitset>
#include <cassert>		#include <cassert>
#include <cctype>		#include <cctype>
#include <cstdint>		#include <cstdint>
#include <cstdlib>		#include <cstdlib>
#include <iterator>		#include <iterator>
#include <limits>		#include <limits>
		#include <optional>
#include <tuple>		#include <tuple>
#include <utility>		#include <utility>
#include <vector>		#include <vector>

using namespace llvm;		using namespace llvm;
using namespace llvm::PatternMatch;		using namespace llvm::PatternMatch;

#define DEBUG_TYPE "aarch64-lower"		#define DEBUG_TYPE "aarch64-lower"
▲ Show 20 Lines • Show All 14,898 Lines • ▼ Show 20 Lines	if (Lg2 == 1) {
Created.push_back(Negs.getNode());		Created.push_back(Negs.getNode());
Created.push_back(AndPos.getNode());		Created.push_back(AndPos.getNode());
Created.push_back(AndNeg.getNode());		Created.push_back(AndNeg.getNode());
}		}

return CSNeg;		return CSNeg;
}		}

static bool IsSVECntIntrinsic(SDValue S) {		static std::optional<unsigned> IsSVECntIntrinsic(SDValue S) {
switch(getIntrinsicID(S.getNode())) {		switch(getIntrinsicID(S.getNode())) {
default:		default:
break;		break;
case Intrinsic::aarch64_sve_cntb:		case Intrinsic::aarch64_sve_cntb:
		return 8;
case Intrinsic::aarch64_sve_cnth:		case Intrinsic::aarch64_sve_cnth:
		return 16;
case Intrinsic::aarch64_sve_cntw:		case Intrinsic::aarch64_sve_cntw:
		return 32;
case Intrinsic::aarch64_sve_cntd:		case Intrinsic::aarch64_sve_cntd:
return true;		return 64;
}		}
return false;		return {};
}		}

/// Calculates what the pre-extend type is, based on the extension		/// Calculates what the pre-extend type is, based on the extension
/// operation node provided by \p Extend.		/// operation node provided by \p Extend.
///		///
/// In the case that \p Extend is a SIGN_EXTEND or a ZERO_EXTEND, the		/// In the case that \p Extend is a SIGN_EXTEND or a ZERO_EXTEND, the
/// pre-extend type is pulled directly from the operand, while other extend		/// pre-extend type is pulled directly from the operand, while other extend
/// operations need a bit more inspection to get this information.		/// operations need a bit more inspection to get this information.
▲ Show 20 Lines • Show All 8,263 Lines • ▼ Show 20 Lines	case AArch64ISD::VSHL: {

if ((ZeroBits & UnusedBits) != ZeroBits)		if ((ZeroBits & UnusedBits) != ZeroBits)
return false;		return false;

// All bits that are zeroed by (VSHL (VLSHR Val X) X) are not		// All bits that are zeroed by (VSHL (VLSHR Val X) X) are not
// used - simplify to just Val.		// used - simplify to just Val.
return TLO.CombineTo(Op, ShiftR->getOperand(0));		return TLO.CombineTo(Op, ShiftR->getOperand(0));
}		}
		case ISD::INTRINSIC_WO_CHAIN: {
		if (auto ElementSize = IsSVECntIntrinsic(Op)) {
		unsigned MaxSVEVectorSizeInBits = Subtarget->getMaxSVEVectorSizeInBits();
		if (!MaxSVEVectorSizeInBits)
		MaxSVEVectorSizeInBits = AArch64::SVEMaxBitsPerVector;
		unsigned MaxElements = MaxSVEVectorSizeInBits / *ElementSize;
		// The SVE count intrinsics don't support the multiplier immediate so we
		// don't have to account for that here. The value returned may be slightly
		// over the true required bits, as this is based on the "ALL" pattern. The
		// other patterns are also exposed by these intrinsics, but they all
		// return a value that's strictly less than "ALL".
		unsigned RequiredBits = Log2_32(MaxElements) + 1;
		unsigned BitWidth = Known.Zero.getBitWidth();
		if (RequiredBits < BitWidth)
		Known.Zero.setHighBits(BitWidth - RequiredBits);
		return false;
		}
		}
}		}

return TargetLowering::SimplifyDemandedBitsForTargetNode(		return TargetLowering::SimplifyDemandedBitsForTargetNode(
		dmgreenUnsubmitted Done Reply Inline Actions Can you move this into the switch under INTRINSIC_WO_CHAIN. Just so it doesn't need to be checked for every instruction. dmgreen: Can you move this into the switch under INTRINSIC_WO_CHAIN. Just so it doesn't need to be…
Op, OriginalDemandedBits, OriginalDemandedElts, Known, TLO, Depth);		Op, OriginalDemandedBits, OriginalDemandedElts, Known, TLO, Depth);
}		}

bool AArch64TargetLowering::isTargetCanonicalConstantNode(SDValue Op) const {		bool AArch64TargetLowering::isTargetCanonicalConstantNode(SDValue Op) const {
return Op.getOpcode() == AArch64ISD::DUP \|\|		return Op.getOpcode() == AArch64ISD::DUP \|\|
Op.getOpcode() == AArch64ISD::MOVI \|\|		Op.getOpcode() == AArch64ISD::MOVI \|\|
		dmgreenUnsubmitted Done Reply Inline Actions Is there a reason why this is based on SVEMaxBitsPerVector and not the maximum value in VScaleRange? Or a combo of both if vscale_range is unbounded for some reason. dmgreen: Is there a reason why this is based on SVEMaxBitsPerVector and not the maximum value in…
		benmxwl-armAuthorUnsubmitted Done Reply Inline Actions No real reason, it just was a little simpler. But it does not add much extra complexity doing the combo check. benmxwl-arm: No real reason, it just was a little simpler. But it does not add much extra complexity doing…
(Op.getOpcode() == ISD::EXTRACT_SUBVECTOR &&		(Op.getOpcode() == ISD::EXTRACT_SUBVECTOR &&
		dmgreenUnsubmitted Done Reply Inline Actions Nit: Log2_32? dmgreen: Nit: Log2_32?
Op.getOperand(0).getOpcode() == AArch64ISD::DUP) \|\|		Op.getOperand(0).getOpcode() == AArch64ISD::DUP) \|\|
TargetLowering::isTargetCanonicalConstantNode(Op);		TargetLowering::isTargetCanonicalConstantNode(Op);
}		}

bool AArch64TargetLowering::isConstantUnsignedBitfieldExtractLegal(		bool AArch64TargetLowering::isConstantUnsignedBitfieldExtractLegal(
unsigned Opc, LLT Ty1, LLT Ty2) const {		unsigned Opc, LLT Ty1, LLT Ty2) const {
return Ty1 == Ty2 && (Ty1 == LLT::scalar(32) \|\| Ty1 == LLT::scalar(64));		return Ty1 == Ty2 && (Ty1 == LLT::scalar(32) \|\| Ty1 == LLT::scalar(64));
}		}
▲ Show 20 Lines • Show All 91 Lines • Show Last 20 Lines

llvm/test/CodeGen/AArch64/vscale-and-sve-cnt-demandedbits.ll

Show All 23 Lines	; CHECK-NEXT: ret
%result = add i32 %and_redundant, %and_required		%result = add i32 %and_redundant, %and_required
ret i32 %result		ret i32 %result
}		}

define i64 @cntb_and_elimination() {		define i64 @cntb_and_elimination() {
; CHECK-LABEL: cntb_and_elimination:		; CHECK-LABEL: cntb_and_elimination:
; CHECK: // %bb.0:		; CHECK: // %bb.0:
; CHECK-NEXT: cntb x8		; CHECK-NEXT: cntb x8
; CHECK-NEXT: and x9, x8, #0x1ff		; CHECK-NEXT: and x9, x8, #0x1fc
; CHECK-NEXT: and x8, x8, #0x3fffffffc		; CHECK-NEXT: add x0, x8, x9
; CHECK-NEXT: add x0, x9, x8
; CHECK-NEXT: ret		; CHECK-NEXT: ret
%cntb = call i64 @llvm.aarch64.sve.cntb(i32 31)		%cntb = call i64 @llvm.aarch64.sve.cntb(i32 31)
%and_redundant = and i64 %cntb, 511		%and_redundant = and i64 %cntb, 511
%and_required = and i64 %cntb, 17179869180		%and_required = and i64 %cntb, 17179869180
%result = add i64 %and_redundant, %and_required		%result = add i64 %and_redundant, %and_required
ret i64 %result		ret i64 %result
}		}

define i64 @cnth_and_elimination() {		define i64 @cnth_and_elimination() {
; CHECK-LABEL: cnth_and_elimination:		; CHECK-LABEL: cnth_and_elimination:
; CHECK: // %bb.0:		; CHECK: // %bb.0:
; CHECK-NEXT: cnth x8		; CHECK-NEXT: cnth x8
; CHECK-NEXT: and x9, x8, #0x3ff		; CHECK-NEXT: and x9, x8, #0xfc
; CHECK-NEXT: and x8, x8, #0x3fffffffc		; CHECK-NEXT: add x0, x8, x9
; CHECK-NEXT: add x0, x9, x8
; CHECK-NEXT: ret		; CHECK-NEXT: ret
%cnth = call i64 @llvm.aarch64.sve.cnth(i32 31)		%cnth = call i64 @llvm.aarch64.sve.cnth(i32 31)
%and_redundant = and i64 %cnth, 1023		%and_redundant = and i64 %cnth, 1023
%and_required = and i64 %cnth, 17179869180		%and_required = and i64 %cnth, 17179869180
%result = add i64 %and_redundant, %and_required		%result = add i64 %and_redundant, %and_required
ret i64 %result		ret i64 %result
}		}

define i64 @cntw_and_elimination() {		define i64 @cntw_and_elimination() {
; CHECK-LABEL: cntw_and_elimination:		; CHECK-LABEL: cntw_and_elimination:
; CHECK: // %bb.0:		; CHECK: // %bb.0:
; CHECK-NEXT: cntw x8		; CHECK-NEXT: cntw x8
; CHECK-NEXT: and x9, x8, #0x7f		; CHECK-NEXT: and x9, x8, #0x7c
; CHECK-NEXT: and x8, x8, #0x3fffffffc		; CHECK-NEXT: add x0, x8, x9
; CHECK-NEXT: add x0, x9, x8
; CHECK-NEXT: ret		; CHECK-NEXT: ret
%cntw = call i64 @llvm.aarch64.sve.cntw(i32 31)		%cntw = call i64 @llvm.aarch64.sve.cntw(i32 31)
%and_redundant = and i64 %cntw, 127		%and_redundant = and i64 %cntw, 127
%and_required = and i64 %cntw, 17179869180		%and_required = and i64 %cntw, 17179869180
%result = add i64 %and_redundant, %and_required		%result = add i64 %and_redundant, %and_required
ret i64 %result		ret i64 %result
}		}

define i64 @cntd_and_elimination() {		define i64 @cntd_and_elimination() {
; CHECK-LABEL: cntd_and_elimination:		; CHECK-LABEL: cntd_and_elimination:
; CHECK: // %bb.0:		; CHECK: // %bb.0:
; CHECK-NEXT: cntd x8		; CHECK-NEXT: cntd x8
; CHECK-NEXT: and x9, x8, #0x3f		; CHECK-NEXT: and x9, x8, #0x3c
; CHECK-NEXT: and x8, x8, #0x3fffffffc		; CHECK-NEXT: add x0, x8, x9
; CHECK-NEXT: add x0, x9, x8
; CHECK-NEXT: ret		; CHECK-NEXT: ret
%cntd = call i64 @llvm.aarch64.sve.cntd(i32 31)		%cntd = call i64 @llvm.aarch64.sve.cntd(i32 31)
%and_redundant = and i64 %cntd, 63		%and_redundant = and i64 %cntd, 63
%and_required = and i64 %cntd, 17179869180		%and_required = and i64 %cntd, 17179869180
%result = add i64 %and_redundant, %and_required		%result = add i64 %and_redundant, %and_required
ret i64 %result		ret i64 %result
}		}

Show All 19 Lines	; CHECK-NEXT: ret
%vscale = call i32 @llvm.vscale.i32()		%vscale = call i32 @llvm.vscale.i32()
%sext = sext i32 %vscale to i64		%sext = sext i32 %vscale to i64
ret i64 %sext		ret i64 %sext
}		}

define i64 @count_bytes_trunc_zext() {		define i64 @count_bytes_trunc_zext() {
; CHECK-LABEL: count_bytes_trunc_zext:		; CHECK-LABEL: count_bytes_trunc_zext:
; CHECK: // %bb.0:		; CHECK: // %bb.0:
; CHECK-NEXT: cntb x8		; CHECK-NEXT: cntb x0
; CHECK-NEXT: and x0, x8, #0xffffffff
; CHECK-NEXT: ret		; CHECK-NEXT: ret
%cnt = call i64 @llvm.aarch64.sve.cntb(i32 31)		%cnt = call i64 @llvm.aarch64.sve.cntb(i32 31)
%trunc = trunc i64 %cnt to i32		%trunc = trunc i64 %cnt to i32
%zext = zext i32 %trunc to i64		%zext = zext i32 %trunc to i64
ret i64 %zext		ret i64 %zext
}		}

define i64 @count_halfs_trunc_zext() {		define i64 @count_halfs_trunc_zext() {
; CHECK-LABEL: count_halfs_trunc_zext:		; CHECK-LABEL: count_halfs_trunc_zext:
; CHECK: // %bb.0:		; CHECK: // %bb.0:
; CHECK-NEXT: cnth x8		; CHECK-NEXT: cnth x0
; CHECK-NEXT: and x0, x8, #0xffffffff
; CHECK-NEXT: ret		; CHECK-NEXT: ret
%cnt = call i64 @llvm.aarch64.sve.cnth(i32 31)		%cnt = call i64 @llvm.aarch64.sve.cnth(i32 31)
%trunc = trunc i64 %cnt to i32		%trunc = trunc i64 %cnt to i32
%zext = zext i32 %trunc to i64		%zext = zext i32 %trunc to i64
ret i64 %zext		ret i64 %zext
}		}

define i64 @count_words_trunc_zext() {		define i64 @count_words_trunc_zext() {
; CHECK-LABEL: count_words_trunc_zext:		; CHECK-LABEL: count_words_trunc_zext:
; CHECK: // %bb.0:		; CHECK: // %bb.0:
; CHECK-NEXT: cntw x8		; CHECK-NEXT: cntw x0
; CHECK-NEXT: and x0, x8, #0xffffffff
; CHECK-NEXT: ret		; CHECK-NEXT: ret
%cnt = call i64 @llvm.aarch64.sve.cntw(i32 31)		%cnt = call i64 @llvm.aarch64.sve.cntw(i32 31)
%trunc = trunc i64 %cnt to i32		%trunc = trunc i64 %cnt to i32
%zext = zext i32 %trunc to i64		%zext = zext i32 %trunc to i64
ret i64 %zext		ret i64 %zext
}		}

define i64 @count_doubles_trunc_zext() {		define i64 @count_doubles_trunc_zext() {
; CHECK-LABEL: count_doubles_trunc_zext:		; CHECK-LABEL: count_doubles_trunc_zext:
; CHECK: // %bb.0:		; CHECK: // %bb.0:
; CHECK-NEXT: cntd x8		; CHECK-NEXT: cntd x0
; CHECK-NEXT: and x0, x8, #0xffffffff
; CHECK-NEXT: ret		; CHECK-NEXT: ret
%cnt = call i64 @llvm.aarch64.sve.cntd(i32 31)		%cnt = call i64 @llvm.aarch64.sve.cntd(i32 31)
%trunc = trunc i64 %cnt to i32		%trunc = trunc i64 %cnt to i32
%zext = zext i32 %trunc to i64		%zext = zext i32 %trunc to i64
ret i64 %zext		ret i64 %zext
}		}

define i64 @count_bytes_trunc_sext() {		define i64 @count_bytes_trunc_sext() {
; CHECK-LABEL: count_bytes_trunc_sext:		; CHECK-LABEL: count_bytes_trunc_sext:
; CHECK: // %bb.0:		; CHECK: // %bb.0:
; CHECK-NEXT: cntb x8		; CHECK-NEXT: cntb x0
; CHECK-NEXT: sxtw x0, w8
; CHECK-NEXT: ret		; CHECK-NEXT: ret
%cnt = call i64 @llvm.aarch64.sve.cntb(i32 31)		%cnt = call i64 @llvm.aarch64.sve.cntb(i32 31)
%trunc = trunc i64 %cnt to i32		%trunc = trunc i64 %cnt to i32
%sext = sext i32 %trunc to i64		%sext = sext i32 %trunc to i64
ret i64 %sext		ret i64 %sext
}		}

define i64 @count_halfs_trunc_sext() {		define i64 @count_halfs_trunc_sext() {
; CHECK-LABEL: count_halfs_trunc_sext:		; CHECK-LABEL: count_halfs_trunc_sext:
; CHECK: // %bb.0:		; CHECK: // %bb.0:
; CHECK-NEXT: cnth x8		; CHECK-NEXT: cnth x0
; CHECK-NEXT: sxtw x0, w8
; CHECK-NEXT: ret		; CHECK-NEXT: ret
%cnt = call i64 @llvm.aarch64.sve.cnth(i32 31)		%cnt = call i64 @llvm.aarch64.sve.cnth(i32 31)
%trunc = trunc i64 %cnt to i32		%trunc = trunc i64 %cnt to i32
%sext = sext i32 %trunc to i64		%sext = sext i32 %trunc to i64
ret i64 %sext		ret i64 %sext
}		}

define i64 @count_words_trunc_sext() {		define i64 @count_words_trunc_sext() {
; CHECK-LABEL: count_words_trunc_sext:		; CHECK-LABEL: count_words_trunc_sext:
; CHECK: // %bb.0:		; CHECK: // %bb.0:
; CHECK-NEXT: cntw x8		; CHECK-NEXT: cntw x0
; CHECK-NEXT: sxtw x0, w8
; CHECK-NEXT: ret		; CHECK-NEXT: ret
%cnt = call i64 @llvm.aarch64.sve.cntw(i32 31)		%cnt = call i64 @llvm.aarch64.sve.cntw(i32 31)
%trunc = trunc i64 %cnt to i32		%trunc = trunc i64 %cnt to i32
%sext = sext i32 %trunc to i64		%sext = sext i32 %trunc to i64
ret i64 %sext		ret i64 %sext
}		}

define i64 @count_doubles_trunc_sext() {		define i64 @count_doubles_trunc_sext() {
; CHECK-LABEL: count_doubles_trunc_sext:		; CHECK-LABEL: count_doubles_trunc_sext:
; CHECK: // %bb.0:		; CHECK: // %bb.0:
; CHECK-NEXT: cntd x8		; CHECK-NEXT: cntd x0
; CHECK-NEXT: sxtw x0, w8
; CHECK-NEXT: ret		; CHECK-NEXT: ret
%cnt = call i64 @llvm.aarch64.sve.cntd(i32 31)		%cnt = call i64 @llvm.aarch64.sve.cntd(i32 31)
%trunc = trunc i64 %cnt to i32		%trunc = trunc i64 %cnt to i32
%sext = sext i32 %trunc to i64		%sext = sext i32 %trunc to i64
ret i64 %sext		ret i64 %sext
}		}

define i32 @vscale_with_multiplier() vscale_range(1,16) {		define i32 @vscale_with_multiplier() vscale_range(1,16) {
▲ Show 20 Lines • Show All 42 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[TargetLowering][AArch64] Teach DemandedBits about SVE count intrinsics
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 477896

llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp

llvm/lib/Target/AArch64/AArch64ISelLowering.cpp

llvm/test/CodeGen/AArch64/vscale-and-sve-cnt-demandedbits.ll

This is an archive of the discontinued LLVM Phabricator instance.

[TargetLowering][AArch64] Teach DemandedBits about SVE count intrinsics
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 477896

llvm/lib/CodeGen/SelectionDAG/TargetLowering.cpp

llvm/lib/Target/AArch64/AArch64ISelLowering.cpp

llvm/test/CodeGen/AArch64/vscale-and-sve-cnt-demandedbits.ll

[TargetLowering][AArch64] Teach DemandedBits about SVE count intrinsics
ClosedPublic