Diff 328456

clang/include/clang/Basic/arm_neon.td

	Show First 20 Lines • Show All 1,204 Lines • ▼ Show 20 Lines
	def FRINTA_S64 : SInst<"vrnda", "..", "dQd">;			def FRINTA_S64 : SInst<"vrnda", "..", "dQd">;
	def FRINTP_S64 : SInst<"vrndp", "..", "dQd">;			def FRINTP_S64 : SInst<"vrndp", "..", "dQd">;
	def FRINTM_S64 : SInst<"vrndm", "..", "dQd">;			def FRINTM_S64 : SInst<"vrndm", "..", "dQd">;
	def FRINTX_S64 : SInst<"vrndx", "..", "dQd">;			def FRINTX_S64 : SInst<"vrndx", "..", "dQd">;
	def FRINTZ_S64 : SInst<"vrnd", "..", "dQd">;			def FRINTZ_S64 : SInst<"vrnd", "..", "dQd">;
	def FRINTI_S64 : SInst<"vrndi", "..", "dQd">;			def FRINTI_S64 : SInst<"vrndi", "..", "dQd">;
	}			}

				let ArchGuard = "__ARM_ARCH >= 8 && defined(__aarch64__) && defined(__ARM_FEATURE_FRINT)" in {
				ktkachovUnsubmitted Done Reply Inline Actions Clang should use the same feature guard as GCC here, as it is mandated by ACLE: __ARM_FEATURE_FRINT See the relevant section in https://developer.arm.com/documentation/101028/0012/8--Data-processing-intrinsics ktkachov: Clang should use the same feature guard as GCC here, as it is mandated by ACLE…
				jaykang10AuthorUnsubmitted Done Reply Inline Actions Thanks for letting me know! That was what I wanted to know. jaykang10: Thanks for letting me know! That was what I wanted to know.
				def FRINT32X_S32 : SInst<"vrnd32x", "..", "fQf">;
				def FRINT32Z_S32 : SInst<"vrnd32z", "..", "fQf">;
				def FRINT64X_S32 : SInst<"vrnd64x", "..", "fQf">;
				def FRINT64Z_S32 : SInst<"vrnd64z", "..", "fQf">;
				}

	////////////////////////////////////////////////////////////////////////////////			////////////////////////////////////////////////////////////////////////////////
	// MaxNum/MinNum Floating Point			// MaxNum/MinNum Floating Point

	let ArchGuard = "__ARM_ARCH >= 8 && defined(__ARM_FEATURE_NUMERIC_MAXMIN)" in {			let ArchGuard = "__ARM_ARCH >= 8 && defined(__ARM_FEATURE_NUMERIC_MAXMIN)" in {
	def FMAXNM_S32 : SInst<"vmaxnm", "...", "fQf">;			def FMAXNM_S32 : SInst<"vmaxnm", "...", "fQf">;
	def FMINNM_S32 : SInst<"vminnm", "...", "fQf">;			def FMINNM_S32 : SInst<"vminnm", "...", "fQf">;
	}			}

	▲ Show 20 Lines • Show All 852 Lines • Show Last 20 Lines

clang/lib/Basic/Targets/AArch64.cpp

Show First 20 Lines • Show All 176 Lines • ▼ Show 20 Lines
void AArch64TargetInfo::getTargetDefinesARMV84A(const LangOptions &Opts,		void AArch64TargetInfo::getTargetDefinesARMV84A(const LangOptions &Opts,
MacroBuilder &Builder) const {		MacroBuilder &Builder) const {
// Also include the Armv8.3 defines		// Also include the Armv8.3 defines
getTargetDefinesARMV83A(Opts, Builder);		getTargetDefinesARMV83A(Opts, Builder);
}		}

void AArch64TargetInfo::getTargetDefinesARMV85A(const LangOptions &Opts,		void AArch64TargetInfo::getTargetDefinesARMV85A(const LangOptions &Opts,
MacroBuilder &Builder) const {		MacroBuilder &Builder) const {
		Builder.defineMacro("__ARM_FEATURE_FRINT", "1");
		SjoerdMeijerUnsubmitted Done Reply Inline Actions I think we need to add a test for the new macro in: Preprocessor/aarch64-target-features.c SjoerdMeijer: I think we need to add a test for the new macro in: Preprocessor/aarch64-target-features.c
		SjoerdMeijerUnsubmitted Done Reply Inline Actions Sorry, wanted to say that we need to add a test for this new macro. SjoerdMeijer: Sorry, wanted to say that we need to add a test for this new macro.
		jaykang10AuthorUnsubmitted Done Reply Inline Actions The macro is used in "arm_neon.h" which is generated at building time of clang as below so I thought we do not need to add the test for it. #if __ARM_ARCH >= 8 && defined(__aarch64__) && defined(__ARM_FEATURE_FRINT) ... #ifdef __LITTLE_ENDIAN__ __ai float32x2_t vrnd32x_f32(float32x2_t __p0) { float32x2_t __ret; __ret = (float32x2_t) __builtin_neon_vrnd32x_v((int8x8_t)__p0, 9); return __ret; } #else __ai float32x2_t vrnd32x_f32(float32x2_t __p0) { float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); float32x2_t __ret; __ret = (float32x2_t) __builtin_neon_vrnd32x_v((int8x8_t)__rev0, 9); __ret = __builtin_shufflevector(__ret, __ret, 1, 0); return __ret; } #endif ... If it is not enough, I will add a test for it. jaykang10: The macro is used in "arm_neon.h" which is generated at building time of clang as below so I…
		SjoerdMeijerUnsubmitted Done Reply Inline Actions We let the preprocessor emit a new macro, so that's what we need to test, which I believe we need to do in that file I quoted earlier. The fact that it is used elsewhere is an indirect test. SjoerdMeijer: We let the preprocessor emit a new macro, so that's what we need to test, which I believe we…
		jaykang10AuthorUnsubmitted Done Reply Inline Actions Yep, I will add it. jaykang10: Yep, I will add it.
// Also include the Armv8.4 defines		// Also include the Armv8.4 defines
getTargetDefinesARMV84A(Opts, Builder);		getTargetDefinesARMV84A(Opts, Builder);
}		}

void AArch64TargetInfo::getTargetDefinesARMV86A(const LangOptions &Opts,		void AArch64TargetInfo::getTargetDefinesARMV86A(const LangOptions &Opts,
MacroBuilder &Builder) const {		MacroBuilder &Builder) const {
// Also include the Armv8.5 defines		// Also include the Armv8.5 defines
// FIXME: Armv8.6 makes the following extensions mandatory:		// FIXME: Armv8.6 makes the following extensions mandatory:
▲ Show 20 Lines • Show All 327 Lines • ▼ Show 20 Lines	for (const auto &Feature : Features) {
if (Feature == "+bf16")		if (Feature == "+bf16")
HasBFloat16 = true;		HasBFloat16 = true;
if (Feature == "+lse")		if (Feature == "+lse")
HasLSE = true;		HasLSE = true;
if (Feature == "+ls64")		if (Feature == "+ls64")
HasLS64 = true;		HasLS64 = true;
if (Feature == "+flagm")		if (Feature == "+flagm")
HasFlagM = true;		HasFlagM = true;
}		}

		ktkachovUnsubmitted Done Reply Inline Actions I don't think this flag should exist as it's inconsistent with GCC. In GCC these instructions are enabled through -march=armv8.5-a . Generally, these intrinsics should use the same target as the assembly instructions? ktkachov: I don't think this flag should exist as it's inconsistent with GCC. In GCC these instructions…
		jaykang10AuthorUnsubmitted Done Reply Inline Actions You are right! I will update it. jaykang10: You are right! I will update it.
setDataLayout();		setDataLayout();

return true;		return true;
}		}

TargetInfo::CallingConvCheckResult		TargetInfo::CallingConvCheckResult
AArch64TargetInfo::checkCallingConvention(CallingConv CC) const {		AArch64TargetInfo::checkCallingConvention(CallingConv CC) const {
switch (CC) {		switch (CC) {
▲ Show 20 Lines • Show All 386 Lines • Show Last 20 Lines

clang/lib/CodeGen/CGBuiltin.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 5,659 Lines • ▼ Show 20 Lines	static const ARMVectorIntrinsicInfo ARMSIMDIntrinsicMap [] = {
NEONMAP1(vst1q_x2_v, arm_neon_vst1x2, 0),		NEONMAP1(vst1q_x2_v, arm_neon_vst1x2, 0),
NEONMAP1(vst1q_x3_v, arm_neon_vst1x3, 0),		NEONMAP1(vst1q_x3_v, arm_neon_vst1x3, 0),
NEONMAP1(vst1q_x4_v, arm_neon_vst1x4, 0),		NEONMAP1(vst1q_x4_v, arm_neon_vst1x4, 0),
NEONMAP1(vst2_lane_v, arm_neon_vst2lane, 0),		NEONMAP1(vst2_lane_v, arm_neon_vst2lane, 0),
NEONMAP1(vst2_v, arm_neon_vst2, 0),		NEONMAP1(vst2_v, arm_neon_vst2, 0),
NEONMAP1(vst2q_lane_v, arm_neon_vst2lane, 0),		NEONMAP1(vst2q_lane_v, arm_neon_vst2lane, 0),
NEONMAP1(vst2q_v, arm_neon_vst2, 0),		NEONMAP1(vst2q_v, arm_neon_vst2, 0),
NEONMAP1(vst3_lane_v, arm_neon_vst3lane, 0),		NEONMAP1(vst3_lane_v, arm_neon_vst3lane, 0),
NEONMAP1(vst3_v, arm_neon_vst3, 0),		NEONMAP1(vst3_v, arm_neon_vst3, 0),
		Lint: Pre-merge checks Inline Actions clang-format: please reformat the code - NEONMAP1(__a64_vcvtq_low_bf16_v, aarch64_neon_bfcvtn, 0), - NEONMAP0(splat_lane_v), - NEONMAP0(splat_laneq_v), - NEONMAP0(splatq_lane_v), - NEONMAP0(splatq_laneq_v), - NEONMAP1(vabs_v, aarch64_neon_abs, 0), - NEONMAP1(vabsq_v, aarch64_neon_abs, 0), - NEONMAP0(vadd_v), - NEONMAP0(vaddhn_v), - NEONMAP0(vaddq_p128), 448 diff lines are omitted. See full path. Lint: Pre-merge checks: clang-format: please reformat the code ``` - NEONMAP1(__a64_vcvtq_low_bf16_v…
NEONMAP1(vst3q_lane_v, arm_neon_vst3lane, 0),		NEONMAP1(vst3q_lane_v, arm_neon_vst3lane, 0),
NEONMAP1(vst3q_v, arm_neon_vst3, 0),		NEONMAP1(vst3q_v, arm_neon_vst3, 0),
NEONMAP1(vst4_lane_v, arm_neon_vst4lane, 0),		NEONMAP1(vst4_lane_v, arm_neon_vst4lane, 0),
NEONMAP1(vst4_v, arm_neon_vst4, 0),		NEONMAP1(vst4_v, arm_neon_vst4, 0),
NEONMAP1(vst4q_lane_v, arm_neon_vst4lane, 0),		NEONMAP1(vst4q_lane_v, arm_neon_vst4lane, 0),
NEONMAP1(vst4q_v, arm_neon_vst4, 0),		NEONMAP1(vst4q_v, arm_neon_vst4, 0),
NEONMAP0(vsubhn_v),		NEONMAP0(vsubhn_v),
NEONMAP0(vtrn_v),		NEONMAP0(vtrn_v),
▲ Show 20 Lines • Show All 163 Lines • ▼ Show 20 Lines	static const ARMVectorIntrinsicInfo AArch64SIMDIntrinsicMap[] = {
NEONMAP1(vraddhn_v, aarch64_neon_raddhn, Add1ArgType),		NEONMAP1(vraddhn_v, aarch64_neon_raddhn, Add1ArgType),
NEONMAP1(vrax1q_v, aarch64_crypto_rax1, 0),		NEONMAP1(vrax1q_v, aarch64_crypto_rax1, 0),
NEONMAP2(vrecpe_v, aarch64_neon_frecpe, aarch64_neon_urecpe, 0),		NEONMAP2(vrecpe_v, aarch64_neon_frecpe, aarch64_neon_urecpe, 0),
NEONMAP2(vrecpeq_v, aarch64_neon_frecpe, aarch64_neon_urecpe, 0),		NEONMAP2(vrecpeq_v, aarch64_neon_frecpe, aarch64_neon_urecpe, 0),
NEONMAP1(vrecps_v, aarch64_neon_frecps, Add1ArgType),		NEONMAP1(vrecps_v, aarch64_neon_frecps, Add1ArgType),
NEONMAP1(vrecpsq_v, aarch64_neon_frecps, Add1ArgType),		NEONMAP1(vrecpsq_v, aarch64_neon_frecps, Add1ArgType),
NEONMAP2(vrhadd_v, aarch64_neon_urhadd, aarch64_neon_srhadd, Add1ArgType \| UnsignedAlts),		NEONMAP2(vrhadd_v, aarch64_neon_urhadd, aarch64_neon_srhadd, Add1ArgType \| UnsignedAlts),
NEONMAP2(vrhaddq_v, aarch64_neon_urhadd, aarch64_neon_srhadd, Add1ArgType \| UnsignedAlts),		NEONMAP2(vrhaddq_v, aarch64_neon_urhadd, aarch64_neon_srhadd, Add1ArgType \| UnsignedAlts),
		NEONMAP1(vrnd32x_v, aarch64_neon_frint32x, Add1ArgType),
		NEONMAP1(vrnd32xq_v, aarch64_neon_frint32x, Add1ArgType),
		NEONMAP1(vrnd32z_v, aarch64_neon_frint32z, Add1ArgType),
		NEONMAP1(vrnd32zq_v, aarch64_neon_frint32z, Add1ArgType),
		NEONMAP1(vrnd64x_v, aarch64_neon_frint64x, Add1ArgType),
		NEONMAP1(vrnd64xq_v, aarch64_neon_frint64x, Add1ArgType),
		NEONMAP1(vrnd64z_v, aarch64_neon_frint64z, Add1ArgType),
		NEONMAP1(vrnd64zq_v, aarch64_neon_frint64z, Add1ArgType),
NEONMAP0(vrndi_v),		NEONMAP0(vrndi_v),
NEONMAP0(vrndiq_v),		NEONMAP0(vrndiq_v),
NEONMAP2(vrshl_v, aarch64_neon_urshl, aarch64_neon_srshl, Add1ArgType \| UnsignedAlts),		NEONMAP2(vrshl_v, aarch64_neon_urshl, aarch64_neon_srshl, Add1ArgType \| UnsignedAlts),
NEONMAP2(vrshlq_v, aarch64_neon_urshl, aarch64_neon_srshl, Add1ArgType \| UnsignedAlts),		NEONMAP2(vrshlq_v, aarch64_neon_urshl, aarch64_neon_srshl, Add1ArgType \| UnsignedAlts),
NEONMAP2(vrshr_n_v, aarch64_neon_urshl, aarch64_neon_srshl, UnsignedAlts),		NEONMAP2(vrshr_n_v, aarch64_neon_urshl, aarch64_neon_srshl, UnsignedAlts),
NEONMAP2(vrshrq_n_v, aarch64_neon_urshl, aarch64_neon_srshl, UnsignedAlts),		NEONMAP2(vrshrq_n_v, aarch64_neon_urshl, aarch64_neon_srshl, UnsignedAlts),
NEONMAP2(vrsqrte_v, aarch64_neon_frsqrte, aarch64_neon_ursqrte, 0),		NEONMAP2(vrsqrte_v, aarch64_neon_frsqrte, aarch64_neon_ursqrte, 0),
NEONMAP2(vrsqrteq_v, aarch64_neon_frsqrte, aarch64_neon_ursqrte, 0),		NEONMAP2(vrsqrteq_v, aarch64_neon_frsqrte, aarch64_neon_ursqrte, 0),
▲ Show 20 Lines • Show All 4,700 Lines • ▼ Show 20 Lines
}		}
case NEON::BI__builtin_neon_vrndh_f16: {		case NEON::BI__builtin_neon_vrndh_f16: {
Ops.push_back(EmitScalarExpr(E->getArg(0)));		Ops.push_back(EmitScalarExpr(E->getArg(0)));
Int = Builder.getIsFPConstrained()		Int = Builder.getIsFPConstrained()
? Intrinsic::experimental_constrained_trunc		? Intrinsic::experimental_constrained_trunc
: Intrinsic::trunc;		: Intrinsic::trunc;
return EmitNeonCall(CGM.getIntrinsic(Int, HalfTy), Ops, "vrndz");		return EmitNeonCall(CGM.getIntrinsic(Int, HalfTy), Ops, "vrndz");
}		}
		case NEON::BI__builtin_neon_vrnd32x_v:
		case NEON::BI__builtin_neon_vrnd32xq_v: {
		Ops.push_back(EmitScalarExpr(E->getArg(0)));
		Int = Intrinsic::aarch64_neon_frint32x;
		return EmitNeonCall(CGM.getIntrinsic(Int, Ty), Ops, "vrnd32x");
		}
		case NEON::BI__builtin_neon_vrnd32z_v:
		case NEON::BI__builtin_neon_vrnd32zq_v: {
		Ops.push_back(EmitScalarExpr(E->getArg(0)));
		Int = Intrinsic::aarch64_neon_frint32z;
		return EmitNeonCall(CGM.getIntrinsic(Int, Ty), Ops, "vrnd32z");
		}
		case NEON::BI__builtin_neon_vrnd64x_v:
		case NEON::BI__builtin_neon_vrnd64xq_v: {
		Ops.push_back(EmitScalarExpr(E->getArg(0)));
		Int = Intrinsic::aarch64_neon_frint64x;
		return EmitNeonCall(CGM.getIntrinsic(Int, Ty), Ops, "vrnd64x");
		}
		case NEON::BI__builtin_neon_vrnd64z_v:
		case NEON::BI__builtin_neon_vrnd64zq_v: {
		Ops.push_back(EmitScalarExpr(E->getArg(0)));
		Int = Intrinsic::aarch64_neon_frint64z;
		return EmitNeonCall(CGM.getIntrinsic(Int, Ty), Ops, "vrnd64z");
		}
case NEON::BI__builtin_neon_vrnd_v:		case NEON::BI__builtin_neon_vrnd_v:
case NEON::BI__builtin_neon_vrndq_v: {		case NEON::BI__builtin_neon_vrndq_v: {
Int = Builder.getIsFPConstrained()		Int = Builder.getIsFPConstrained()
? Intrinsic::experimental_constrained_trunc		? Intrinsic::experimental_constrained_trunc
: Intrinsic::trunc;		: Intrinsic::trunc;
return EmitNeonCall(CGM.getIntrinsic(Int, Ty), Ops, "vrndz");		return EmitNeonCall(CGM.getIntrinsic(Int, Ty), Ops, "vrndz");
}		}
case NEON::BI__builtin_neon_vcvt_f64_v:		case NEON::BI__builtin_neon_vcvt_f64_v:
▲ Show 20 Lines • Show All 7,398 Lines • Show Last 20 Lines

clang/test/CodeGen/aarch64-v8.5a-neon-frint3264-intrinsic.c

This file was added.

				// RUN: %clang_cc1 -triple arm64-none-linux-gnu -target-feature +neon -target-feature +v8.5a\
				// RUN: -flax-vector-conversions=none -S -disable-O0-optnone -emit-llvm -o - %s \
				// RUN: \| opt -S -mem2reg \
				// RUN: \| FileCheck %s

				// REQUIRES: aarch64-registered-target

				#include <arm_neon.h>

				// Exercises vrnd32x_f32 on a float32x2_t argument. The FileCheck patterns
				// below expect a call to @llvm.aarch64.neon.frint32x.v2f32 on %a whose
				// result is the value returned.
				// CHECK-LABEL: test_vrnd32x_f32
				// CHECK: [[RND:%.*]] = call <2 x float> @llvm.aarch64.neon.frint32x.v2f32(<2 x float> %a)
				// CHECK: ret <2 x float> [[RND]]
				float32x2_t test_vrnd32x_f32(float32x2_t a) {
				return vrnd32x_f32(a);
				}

				// Exercises vrnd32xq_f32 on a float32x4_t argument. The FileCheck patterns
				// below expect a call to @llvm.aarch64.neon.frint32x.v4f32 on %a whose
				// result is the value returned.
				// CHECK-LABEL: test_vrnd32xq_f32
				// CHECK: [[RND:%.*]] = call <4 x float> @llvm.aarch64.neon.frint32x.v4f32(<4 x float> %a)
				// CHECK: ret <4 x float> [[RND]]
				float32x4_t test_vrnd32xq_f32(float32x4_t a) {
				return vrnd32xq_f32(a);
				}

				// Exercises vrnd32z_f32 on a float32x2_t argument. The FileCheck patterns
				// below expect a call to @llvm.aarch64.neon.frint32z.v2f32 on %a whose
				// result is the value returned.
				// CHECK-LABEL: test_vrnd32z_f32
				// CHECK: [[RND:%.*]] = call <2 x float> @llvm.aarch64.neon.frint32z.v2f32(<2 x float> %a)
				// CHECK: ret <2 x float> [[RND]]
				float32x2_t test_vrnd32z_f32(float32x2_t a) {
				return vrnd32z_f32(a);
				}

				// Exercises vrnd32zq_f32 on a float32x4_t argument. The FileCheck patterns
				// below expect a call to @llvm.aarch64.neon.frint32z.v4f32 on %a whose
				// result is the value returned.
				// CHECK-LABEL: test_vrnd32zq_f32
				// CHECK: [[RND:%.*]] = call <4 x float> @llvm.aarch64.neon.frint32z.v4f32(<4 x float> %a)
				// CHECK: ret <4 x float> [[RND]]
				float32x4_t test_vrnd32zq_f32(float32x4_t a) {
				return vrnd32zq_f32(a);
				}

				// Exercises vrnd64x_f32 on a float32x2_t argument. The FileCheck patterns
				// below expect a call to @llvm.aarch64.neon.frint64x.v2f32 on %a whose
				// result is the value returned.
				// CHECK-LABEL: test_vrnd64x_f32
				// CHECK: [[RND:%.*]] = call <2 x float> @llvm.aarch64.neon.frint64x.v2f32(<2 x float> %a)
				// CHECK: ret <2 x float> [[RND]]
				float32x2_t test_vrnd64x_f32(float32x2_t a) {
				return vrnd64x_f32(a);
				}

				// Exercises vrnd64xq_f32 on a float32x4_t argument. The FileCheck patterns
				// below expect a call to @llvm.aarch64.neon.frint64x.v4f32 on %a whose
				// result is the value returned.
				// CHECK-LABEL: test_vrnd64xq_f32
				// CHECK: [[RND:%.*]] = call <4 x float> @llvm.aarch64.neon.frint64x.v4f32(<4 x float> %a)
				// CHECK: ret <4 x float> [[RND]]
				float32x4_t test_vrnd64xq_f32(float32x4_t a) {
				return vrnd64xq_f32(a);
				}

				// Exercises vrnd64z_f32 on a float32x2_t argument. The FileCheck patterns
				// below expect a call to @llvm.aarch64.neon.frint64z.v2f32 on %a whose
				// result is the value returned.
				// CHECK-LABEL: test_vrnd64z_f32
				// CHECK: [[RND:%.*]] = call <2 x float> @llvm.aarch64.neon.frint64z.v2f32(<2 x float> %a)
				// CHECK: ret <2 x float> [[RND]]
				float32x2_t test_vrnd64z_f32(float32x2_t a) {
				return vrnd64z_f32(a);
				}

				// Exercises vrnd64zq_f32 on a float32x4_t argument. The FileCheck patterns
				// below expect a call to @llvm.aarch64.neon.frint64z.v4f32 on %a whose
				// result is the value returned.
				// CHECK-LABEL: test_vrnd64zq_f32
				// CHECK: [[RND:%.*]] = call <4 x float> @llvm.aarch64.neon.frint64z.v4f32(<4 x float> %a)
				// CHECK: ret <4 x float> [[RND]]
				float32x4_t test_vrnd64zq_f32(float32x4_t a) {
				return vrnd64zq_f32(a);
				}

clang/test/Preprocessor/aarch64-target-features.c

	Show First 20 Lines • Show All 52 Lines • ▼ Show 20 Lines

	// RUN: %clang -target aarch64_be-eabi -x c -E -dM %s -o - \| FileCheck %s -check-prefix CHECK-BIGENDIAN			// RUN: %clang -target aarch64_be-eabi -x c -E -dM %s -o - \| FileCheck %s -check-prefix CHECK-BIGENDIAN
	// CHECK-BIGENDIAN: __ARM_BIG_ENDIAN 1			// CHECK-BIGENDIAN: __ARM_BIG_ENDIAN 1

	// RUN: %clang -target aarch64-none-linux-gnu -march=armv8-a+crypto -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-CRYPTO %s			// RUN: %clang -target aarch64-none-linux-gnu -march=armv8-a+crypto -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-CRYPTO %s
	// RUN: %clang -target arm64-none-linux-gnu -march=armv8-a+crypto -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-CRYPTO %s			// RUN: %clang -target arm64-none-linux-gnu -march=armv8-a+crypto -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-CRYPTO %s
	// CHECK-CRYPTO: __ARM_FEATURE_CRYPTO 1			// CHECK-CRYPTO: __ARM_FEATURE_CRYPTO 1

				// RUN: %clang -target aarch64-none-linux-gnu -march=armv8.5-a -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-8_5 %s
				SjoerdMeijerUnsubmitted Done Reply Inline Actions would be good to have a negative test too, i.e. a CHECK-NOT of this for e.g. v8.4a. SjoerdMeijer: would be good to have a negative test too, i.e. a CHECK-NOT of this for e.g. v8.4a.
				jaykang10AuthorUnsubmitted Done Reply Inline Actions Yep, I will add it. jaykang10: Yep, I will add it.
				// CHECK-8_5: __ARM_FEATURE_FRINT 1

				// RUN: %clang -target aarch64-none-linux-gnu -march=armv8.4-a -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-8_4 %s
				// CHECK-8_4-NOT: __ARM_FEATURE_FRINT 1

	// RUN: %clang -target aarch64-none-linux-gnu -mcrc -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-CRC32 %s			// RUN: %clang -target aarch64-none-linux-gnu -mcrc -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-CRC32 %s
	// RUN: %clang -target arm64-none-linux-gnu -mcrc -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-CRC32 %s			// RUN: %clang -target arm64-none-linux-gnu -mcrc -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-CRC32 %s
	// RUN: %clang -target aarch64-none-linux-gnu -march=armv8-a+crc -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-CRC32 %s			// RUN: %clang -target aarch64-none-linux-gnu -march=armv8-a+crc -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-CRC32 %s
	// RUN: %clang -target arm64-none-linux-gnu -march=armv8-a+crc -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-CRC32 %s			// RUN: %clang -target arm64-none-linux-gnu -march=armv8-a+crc -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-CRC32 %s
	// RUN: %clang -target aarch64-none-linux-gnu -march=armv8.1-a -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-CRC32 %s			// RUN: %clang -target aarch64-none-linux-gnu -march=armv8.1-a -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-CRC32 %s
	// RUN: %clang -target arm64-none-linux-gnu -march=armv8.1-a -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-CRC32 %s			// RUN: %clang -target arm64-none-linux-gnu -march=armv8.1-a -x c -E -dM %s -o - \| FileCheck --check-prefix=CHECK-CRC32 %s
	// CHECK-CRC32: __ARM_FEATURE_CRC32 1			// CHECK-CRC32: __ARM_FEATURE_CRC32 1

	▲ Show 20 Lines • Show All 396 Lines • Show Last 20 Lines

llvm/include/llvm/IR/IntrinsicsAArch64.td

Show First 20 Lines • Show All 456 Lines • ▼ Show 20 Lines	let TargetPrefix = "aarch64", IntrProperties = [IntrNoMem] in {
def int_aarch64_neon_fcvtpu : AdvSIMD_FPToIntRounding_Intrinsic;		def int_aarch64_neon_fcvtpu : AdvSIMD_FPToIntRounding_Intrinsic;
def int_aarch64_neon_fcvtzs : AdvSIMD_FPToIntRounding_Intrinsic;		def int_aarch64_neon_fcvtzs : AdvSIMD_FPToIntRounding_Intrinsic;
def int_aarch64_neon_fcvtzu : AdvSIMD_FPToIntRounding_Intrinsic;		def int_aarch64_neon_fcvtzu : AdvSIMD_FPToIntRounding_Intrinsic;

// Vector FP Rounding: only ties to even is unrepresented by a normal		// Vector FP Rounding: only ties to even is unrepresented by a normal
// intrinsic.		// intrinsic.
def int_aarch64_neon_frintn : AdvSIMD_1FloatArg_Intrinsic;		def int_aarch64_neon_frintn : AdvSIMD_1FloatArg_Intrinsic;

		// v8.5-A Vector FP Rounding
		def int_aarch64_neon_frint32x : AdvSIMD_1FloatArg_Intrinsic;
		def int_aarch64_neon_frint32z : AdvSIMD_1FloatArg_Intrinsic;
		def int_aarch64_neon_frint64x : AdvSIMD_1FloatArg_Intrinsic;
		def int_aarch64_neon_frint64z : AdvSIMD_1FloatArg_Intrinsic;

// Scalar FP->Int conversions		// Scalar FP->Int conversions

// Vector FP Inexact Narrowing		// Vector FP Inexact Narrowing
def int_aarch64_neon_fcvtxn : AdvSIMD_1VectorArg_Expand_Intrinsic;		def int_aarch64_neon_fcvtxn : AdvSIMD_1VectorArg_Expand_Intrinsic;

// Scalar FP Inexact Narrowing		// Scalar FP Inexact Narrowing
def int_aarch64_sisd_fcvtxn : DefaultAttrsIntrinsic<[llvm_float_ty], [llvm_double_ty],		def int_aarch64_sisd_fcvtxn : DefaultAttrsIntrinsic<[llvm_float_ty], [llvm_double_ty],
[IntrNoMem]>;		[IntrNoMem]>;

// v8.2-A Dot Product		// v8.2-A Dot Product
def int_aarch64_neon_udot : AdvSIMD_Dot_Intrinsic;		def int_aarch64_neon_udot : AdvSIMD_Dot_Intrinsic;
def int_aarch64_neon_sdot : AdvSIMD_Dot_Intrinsic;		def int_aarch64_neon_sdot : AdvSIMD_Dot_Intrinsic;

// v8.6-A Matrix Multiply Intrinsics		// v8.6-A Matrix Multiply Intrinsics
		SjoerdMeijerUnsubmitted Done Reply Inline Actions Nit and unrelated: but perhaps you can fix the indent here. SjoerdMeijer: Nit and unrelated: but perhaps you can fix the indent here.
		jaykang10AuthorUnsubmitted Done Reply Inline Actions Yep, I will update it. jaykang10: Yep, I will update it.
def int_aarch64_neon_ummla : AdvSIMD_MatMul_Intrinsic;		def int_aarch64_neon_ummla : AdvSIMD_MatMul_Intrinsic;
def int_aarch64_neon_smmla : AdvSIMD_MatMul_Intrinsic;		def int_aarch64_neon_smmla : AdvSIMD_MatMul_Intrinsic;
def int_aarch64_neon_usmmla : AdvSIMD_MatMul_Intrinsic;		def int_aarch64_neon_usmmla : AdvSIMD_MatMul_Intrinsic;
def int_aarch64_neon_usdot : AdvSIMD_Dot_Intrinsic;		def int_aarch64_neon_usdot : AdvSIMD_Dot_Intrinsic;
def int_aarch64_neon_bfdot : AdvSIMD_Dot_Intrinsic;		def int_aarch64_neon_bfdot : AdvSIMD_Dot_Intrinsic;
def int_aarch64_neon_bfmmla		def int_aarch64_neon_bfmmla
: DefaultAttrsIntrinsic<[llvm_v4f32_ty],		: DefaultAttrsIntrinsic<[llvm_v4f32_ty],
[llvm_v4f32_ty, llvm_v8bf16_ty, llvm_v8bf16_ty],		[llvm_v4f32_ty, llvm_v8bf16_ty, llvm_v8bf16_ty],
▲ Show 20 Lines • Show All 2,008 Lines • Show Last 20 Lines

llvm/lib/Target/AArch64/AArch64InstrInfo.td

This file is larger than 256 KB, so syntax highlighting is disabled by default.

	Show First 20 Lines • Show All 4,085 Lines • ▼ Show 20 Lines
	defm FRINTI : SIMDTwoVectorFP<1, 1, 0b11001, "frinti", fnearbyint>;			defm FRINTI : SIMDTwoVectorFP<1, 1, 0b11001, "frinti", fnearbyint>;
	defm FRINTM : SIMDTwoVectorFP<0, 0, 0b11001, "frintm", ffloor>;			defm FRINTM : SIMDTwoVectorFP<0, 0, 0b11001, "frintm", ffloor>;
	defm FRINTN : SIMDTwoVectorFP<0, 0, 0b11000, "frintn", int_aarch64_neon_frintn>;			defm FRINTN : SIMDTwoVectorFP<0, 0, 0b11000, "frintn", int_aarch64_neon_frintn>;
	defm FRINTP : SIMDTwoVectorFP<0, 1, 0b11000, "frintp", fceil>;			defm FRINTP : SIMDTwoVectorFP<0, 1, 0b11000, "frintp", fceil>;
	defm FRINTX : SIMDTwoVectorFP<1, 0, 0b11001, "frintx", frint>;			defm FRINTX : SIMDTwoVectorFP<1, 0, 0b11001, "frintx", frint>;
	defm FRINTZ : SIMDTwoVectorFP<0, 1, 0b11001, "frintz", ftrunc>;			defm FRINTZ : SIMDTwoVectorFP<0, 1, 0b11001, "frintz", ftrunc>;

	let Predicates = [HasFRInt3264] in {			let Predicates = [HasFRInt3264] in {
	defm FRINT32Z : FRIntNNTVector<0, 0, "frint32z">;			defm FRINT32Z : FRIntNNTVector<0, 0, "frint32z", int_aarch64_neon_frint32z>;
	defm FRINT64Z : FRIntNNTVector<0, 1, "frint64z">;			defm FRINT64Z : FRIntNNTVector<0, 1, "frint64z", int_aarch64_neon_frint64z>;
	defm FRINT32X : FRIntNNTVector<1, 0, "frint32x">;			defm FRINT32X : FRIntNNTVector<1, 0, "frint32x", int_aarch64_neon_frint32x>;
	defm FRINT64X : FRIntNNTVector<1, 1, "frint64x">;			defm FRINT64X : FRIntNNTVector<1, 1, "frint64x", int_aarch64_neon_frint64x>;
	} // HasFRInt3264			} // HasFRInt3264

	defm FRSQRTE: SIMDTwoVectorFP<1, 1, 0b11101, "frsqrte", int_aarch64_neon_frsqrte>;			defm FRSQRTE: SIMDTwoVectorFP<1, 1, 0b11101, "frsqrte", int_aarch64_neon_frsqrte>;
	defm FSQRT : SIMDTwoVectorFP<1, 1, 0b11111, "fsqrt", fsqrt>;			defm FSQRT : SIMDTwoVectorFP<1, 1, 0b11111, "fsqrt", fsqrt>;
	defm NEG : SIMDTwoVectorBHSD<1, 0b01011, "neg",			defm NEG : SIMDTwoVectorBHSD<1, 0b01011, "neg",
	UnOpFrag<(sub immAllZerosV, node:$LHS)> >;			UnOpFrag<(sub immAllZerosV, node:$LHS)> >;
	defm NOT : SIMDTwoVectorB<1, 0b00, 0b00101, "not", vnot>;			defm NOT : SIMDTwoVectorB<1, 0b00, 0b00101, "not", vnot>;
	// Aliases for MVN -> NOT.			// Aliases for MVN -> NOT.
	▲ Show 20 Lines • Show All 3,844 Lines • Show Last 20 Lines

llvm/test/CodeGen/AArch64/v8.5a-neon-frint3264-intrinsic.ll

This file was added.

				; RUN: llc < %s -mtriple=aarch64-eabi -mattr=+v8.5a \| FileCheck %s

				SjoerdMeijerUnsubmitted Done Reply Inline Actions Nit: fptoint seems to be implied by v8.5a, so we don't need to specify it here? SjoerdMeijer: Nit: fptoint seems to be implied by v8.5a, so we don't need to specify it here?
				jaykang10AuthorUnsubmitted Done Reply Inline Actions Oops! You are right! I will update it. jaykang10: Oops! You are right! I will update it.
				declare <2 x float> @llvm.aarch64.neon.frint32x.v2f32(<2 x float>)
				declare <4 x float> @llvm.aarch64.neon.frint32x.v4f32(<4 x float>)
				declare <2 x float> @llvm.aarch64.neon.frint32z.v2f32(<2 x float>)
				declare <4 x float> @llvm.aarch64.neon.frint32z.v4f32(<4 x float>)

				; Passes %a to the <2 x float> frint32x intrinsic and returns the result.
				; The patterns below expect `frint32x v0.2s, v0.2s` immediately followed
				; by `ret`.
				define dso_local <2 x float> @t_vrnd32x_f32(<2 x float> %a) {
				; CHECK-LABEL: t_vrnd32x_f32:
				; CHECK: frint32x v0.2s, v0.2s
				; CHECK-NEXT: ret
				entry:
				%val = tail call <2 x float> @llvm.aarch64.neon.frint32x.v2f32(<2 x float> %a)
				ret <2 x float> %val
				}

				; Passes %a to the <4 x float> frint32x intrinsic and returns the result.
				; The patterns below expect `frint32x v0.4s, v0.4s` immediately followed
				; by `ret`.
				define dso_local <4 x float> @t_vrnd32xq_f32(<4 x float> %a) {
				; CHECK-LABEL: t_vrnd32xq_f32:
				; CHECK: frint32x v0.4s, v0.4s
				; CHECK-NEXT: ret
				entry:
				%val = tail call <4 x float> @llvm.aarch64.neon.frint32x.v4f32(<4 x float> %a)
				ret <4 x float> %val
				}

				; Passes %a to the <2 x float> frint32z intrinsic and returns the result.
				; The patterns below expect `frint32z v0.2s, v0.2s` immediately followed
				; by `ret`.
				define dso_local <2 x float> @t_vrnd32z_f32(<2 x float> %a) {
				; CHECK-LABEL: t_vrnd32z_f32:
				; CHECK: frint32z v0.2s, v0.2s
				; CHECK-NEXT: ret
				entry:
				%val = tail call <2 x float> @llvm.aarch64.neon.frint32z.v2f32(<2 x float> %a)
				ret <2 x float> %val
				}

				; Passes %a to the <4 x float> frint32z intrinsic and returns the result.
				; The patterns below expect `frint32z v0.4s, v0.4s` immediately followed
				; by `ret`.
				define dso_local <4 x float> @t_vrnd32zq_f32(<4 x float> %a) {
				; CHECK-LABEL: t_vrnd32zq_f32:
				; CHECK: frint32z v0.4s, v0.4s
				; CHECK-NEXT: ret
				entry:
				%val = tail call <4 x float> @llvm.aarch64.neon.frint32z.v4f32(<4 x float> %a)
				ret <4 x float> %val
				}

				declare <2 x float> @llvm.aarch64.neon.frint64x.v2f32(<2 x float>)
				declare <4 x float> @llvm.aarch64.neon.frint64x.v4f32(<4 x float>)
				declare <2 x float> @llvm.aarch64.neon.frint64z.v2f32(<2 x float>)
				declare <4 x float> @llvm.aarch64.neon.frint64z.v4f32(<4 x float>)

				; Passes %a to the <2 x float> frint64x intrinsic and returns the result.
				; The patterns below expect `frint64x v0.2s, v0.2s` immediately followed
				; by `ret`.
				define dso_local <2 x float> @t_vrnd64x_f32(<2 x float> %a) {
				; CHECK-LABEL: t_vrnd64x_f32:
				; CHECK: frint64x v0.2s, v0.2s
				; CHECK-NEXT: ret
				entry:
				%val = tail call <2 x float> @llvm.aarch64.neon.frint64x.v2f32(<2 x float> %a)
				ret <2 x float> %val
				}

				; Passes %a to the <4 x float> frint64x intrinsic and returns the result.
				; The patterns below expect `frint64x v0.4s, v0.4s` immediately followed
				; by `ret`.
				define dso_local <4 x float> @t_vrnd64xq_f32(<4 x float> %a) {
				; CHECK-LABEL: t_vrnd64xq_f32:
				; CHECK: frint64x v0.4s, v0.4s
				; CHECK-NEXT: ret
				entry:
				%val = tail call <4 x float> @llvm.aarch64.neon.frint64x.v4f32(<4 x float> %a)
				ret <4 x float> %val
				}

				; Passes %a to the <2 x float> frint64z intrinsic and returns the result.
				; The patterns below expect `frint64z v0.2s, v0.2s` immediately followed
				; by `ret`.
				define dso_local <2 x float> @t_vrnd64z_f32(<2 x float> %a) {
				; CHECK-LABEL: t_vrnd64z_f32:
				; CHECK: frint64z v0.2s, v0.2s
				; CHECK-NEXT: ret
				entry:
				%val = tail call <2 x float> @llvm.aarch64.neon.frint64z.v2f32(<2 x float> %a)
				ret <2 x float> %val
				}

				; Passes %a to the <4 x float> frint64z intrinsic and returns the result.
				; The patterns below expect `frint64z v0.4s, v0.4s` immediately followed
				; by `ret`.
				define dso_local <4 x float> @t_vrnd64zq_f32(<4 x float> %a) {
				; CHECK-LABEL: t_vrnd64zq_f32:
				; CHECK: frint64z v0.4s, v0.4s
				; CHECK-NEXT: ret
				entry:
				%val = tail call <4 x float> @llvm.aarch64.neon.frint64z.v4f32(<4 x float> %a)
				ret <4 x float> %val
				}

This is an archive of the discontinued LLVM Phabricator instance.

[AArch64] Add missing intrinsics for vrnd
ClosedPublic

Details

Diff Detail

Unit TestsFailed

Event Timeline

Revision Contents

Diff 328456

clang/include/clang/Basic/arm_neon.td

clang/lib/Basic/Targets/AArch64.cpp

clang/lib/CodeGen/CGBuiltin.cpp

clang/test/CodeGen/aarch64-v8.5a-neon-frint3264-intrinsic.c

clang/test/Preprocessor/aarch64-target-features.c

llvm/include/llvm/IR/IntrinsicsAArch64.td

llvm/lib/Target/AArch64/AArch64InstrInfo.td

llvm/test/CodeGen/AArch64/v8.5a-neon-frint3264-intrinsic.ll

This is an archive of the discontinued LLVM Phabricator instance.

[AArch64] Add missing intrinsics for vrnd (Closed, Public)

Details

Diff Detail

Unit TestsFailed

Event Timeline

Revision Contents

Diff 328456

clang/include/clang/Basic/arm_neon.td

clang/lib/Basic/Targets/AArch64.cpp

clang/lib/CodeGen/CGBuiltin.cpp

clang/test/CodeGen/aarch64-v8.5a-neon-frint3264-intrinsic.c

clang/test/Preprocessor/aarch64-target-features.c

llvm/include/llvm/IR/IntrinsicsAArch64.td

llvm/lib/Target/AArch64/AArch64InstrInfo.td

llvm/test/CodeGen/AArch64/v8.5a-neon-frint3264-intrinsic.ll

[AArch64] Add missing intrinsics for vrnd
ClosedPublic