Diff 245105

clang/include/clang/Basic/arm_mve.td

	Show First 20 Lines • Show All 421 Lines • ▼ Show 20 Lines

	let params = [s8, u8, s16, u16] in {			let params = [s8, u8, s16, u16] in {
	def vmovlbq: Intrinsic<DblVector, (args Vector:$a),			def vmovlbq: Intrinsic<DblVector, (args Vector:$a),
	(extend (unzip $a, 0), DblVector, (unsignedflag Scalar))>;			(extend (unzip $a, 0), DblVector, (unsignedflag Scalar))>;
	def vmovltq: Intrinsic<DblVector, (args Vector:$a),			def vmovltq: Intrinsic<DblVector, (args Vector:$a),
	(extend (unzip $a, 1), DblVector, (unsignedflag Scalar))>;			(extend (unzip $a, 1), DblVector, (unsignedflag Scalar))>;
	}			}

				// Narrowing moves. Both intrinsics take a half-width-lane vector $inactive
				// and a full-width-lane vector $a, and return a half-width-lane vector
				// built by interleaving two full-width vectors with 'zip' and truncating
				// every lane of the interleaved result to half width.
				let params = [s16, u16, s32, u32] in {
				// vmovnbq: $a is the first zip operand, so its truncated lanes land in the
				// even-numbered result lanes. The second zip operand is $inactive with
				// elements swapped inside each group of (bitsize Scalar) bits by 'vrev'
				// and then reinterpreted as a full-width vector.
				def vmovnbq: Intrinsic<HalfVector, (args HalfVector:$inactive, Vector:$a),
				(trunc (zip $a, (vreinterpret (vrev $inactive, (bitsize Scalar)), Vector)),
				HalfVector)>;
				// vmovntq: $inactive (reinterpreted as a full-width vector, no reversal)
				// is the first zip operand and $a the second, so the truncated lanes of
				// $a land in the odd-numbered result lanes.
				def vmovntq: Intrinsic<HalfVector, (args HalfVector:$inactive, Vector:$a),
				(trunc (zip (vreinterpret $inactive, Vector), $a), HalfVector)>;
				}

	let params = T.Float in {			let params = T.Float in {
	def vrndq: Intrinsic<Vector, (args Vector:$a),			def vrndq: Intrinsic<Vector, (args Vector:$a),
	(IRIntBase<"trunc", [Vector]> $a)>;			(IRIntBase<"trunc", [Vector]> $a)>;
	def vrndmq: Intrinsic<Vector, (args Vector:$a),			def vrndmq: Intrinsic<Vector, (args Vector:$a),
	(IRIntBase<"floor", [Vector]> $a)>;			(IRIntBase<"floor", [Vector]> $a)>;
	def vrndpq: Intrinsic<Vector, (args Vector:$a),			def vrndpq: Intrinsic<Vector, (args Vector:$a),
	(IRIntBase<"ceil", [Vector]> $a)>;			(IRIntBase<"ceil", [Vector]> $a)>;
	def vrndaq: Intrinsic<Vector, (args Vector:$a),			def vrndaq: Intrinsic<Vector, (args Vector:$a),
	▲ Show 20 Lines • Show All 833 Lines • Show Last 20 Lines

clang/include/clang/Basic/arm_mve_defs.td

	Show First 20 Lines • Show All 125 Lines • ▼ Show 20 Lines
	def fptosi: IRBuilder<"CreateFPToSI">;			def fptosi: IRBuilder<"CreateFPToSI">;
	def fptoui: IRBuilder<"CreateFPToUI">;			def fptoui: IRBuilder<"CreateFPToUI">;
	def vrev: CGHelperFn<"ARMMVEVectorElementReverse"> {			def vrev: CGHelperFn<"ARMMVEVectorElementReverse"> {
	let special_params = [IRBuilderIntParam<1, "unsigned">];			let special_params = [IRBuilderIntParam<1, "unsigned">];
	}			}
	def unzip: CGHelperFn<"VectorUnzip"> {			def unzip: CGHelperFn<"VectorUnzip"> {
	let special_params = [IRBuilderIntParam<1, "bool">];			let special_params = [IRBuilderIntParam<1, "bool">];
	}			}
				// Interleave two vectors of the same type lane by lane; code generation
				// is delegated to the C++ helper function named "VectorZip".
				def zip: CGHelperFn<"VectorZip">;

	// Helper for making boolean flags in IR			// Helper for making boolean flags in IR
	def i1: IRBuilderBase {			def i1: IRBuilderBase {
	let prefix = "llvm::ConstantInt::get(Builder.getInt1Ty(), ";			let prefix = "llvm::ConstantInt::get(Builder.getInt1Ty(), ";
	let special_params = [IRBuilderIntParam<0, "bool">];			let special_params = [IRBuilderIntParam<0, "bool">];
	}			}

	// A node that makes an Address out of a pointer-typed Value, by			// A node that makes an Address out of a pointer-typed Value, by
	Show All 40 Lines
	// the return value of the seq construction as a whole.			// the return value of the seq construction as a whole.
	def seq;			def seq;

	// Another magic operation is 'unsignedflag', which you give a scalar			// Another magic operation is 'unsignedflag', which you give a scalar
	// _type_ as an argument, and it expands into 1 for an unsigned type			// _type_ as an argument, and it expands into 1 for an unsigned type
	// and 0 for a signed (or floating) one.			// and 0 for a signed (or floating) one.
	def unsignedflag;			def unsignedflag;

				// 'bitsize' also takes a scalar type, and expands into an integer
				// constant giving its size in bits.
				def bitsize;

	// If you put CustomCodegen<"foo"> in an intrinsic's codegen field, it			// If you put CustomCodegen<"foo"> in an intrinsic's codegen field, it
	// indicates that the IR generation for that intrinsic is done by handwritten			// indicates that the IR generation for that intrinsic is done by handwritten
	// C++ and not autogenerated at all. The effect in the MVE builtin codegen			// C++ and not autogenerated at all. The effect in the MVE builtin codegen
	// function is to break out of the main switch and fall through to the			// function is to break out of the main switch and fall through to the
	// manual-codegen cases below it, having set the CustomCodeGenType enumerated			// manual-codegen cases below it, having set the CustomCodeGenType enumerated
	// variable to the value given by the 'type' string here.			// variable to the value given by the 'type' string here.
	class CustomCodegen<string type_> { string type = type_; }			class CustomCodegen<string type_> { string type = type_; }

	▲ Show 20 Lines • Show All 375 Lines • Show Last 20 Lines

clang/lib/CodeGen/CGBuiltin.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 7,061 Lines • ▼ Show 20 Lines	static llvm::Value *VectorUnzip(CGBuilderTy &Builder, llvm::Value *V, bool Odd) {
SmallVector<uint32_t, 16> Indices;		SmallVector<uint32_t, 16> Indices;
unsigned InputElements = V->getType()->getVectorNumElements();		unsigned InputElements = V->getType()->getVectorNumElements();
for (unsigned i = 0; i < InputElements; i += 2)		for (unsigned i = 0; i < InputElements; i += 2)
Indices.push_back(i + Odd);		Indices.push_back(i + Odd);
return Builder.CreateShuffleVector(V, llvm::UndefValue::get(V->getType()),		return Builder.CreateShuffleVector(V, llvm::UndefValue::get(V->getType()),
Indices);		Indices);
}		}

		/// Interleave two vectors of identical type element by element.
		///
		/// \param Builder IR builder used to emit the shufflevector.
		/// \param V0 Vector supplying the even-numbered lanes of the result.
		/// \param V1 Vector supplying the odd-numbered lanes of the result; must have
		///           exactly the same type as \p V0 (checked by assertion).
		/// \returns A shufflevector value with twice as many lanes as each input,
		///          laid out as V0[0], V1[0], V0[1], V1[1], ...
		static llvm::Value *VectorZip(CGBuilderTy &Builder, llvm::Value *V0,
		                              llvm::Value *V1) {
		  // Make a shufflevector that interleaves two vectors element by element.
		  assert(V0->getType() == V1->getType() && "Can't zip different vector types");
		  SmallVector<uint32_t, 16> Indices;
		  unsigned InputElements = V0->getType()->getVectorNumElements();
		  for (unsigned i = 0; i < InputElements; i++) {
		    // Mask indices below InputElements pick lanes of V0; indices from
		    // InputElements upwards pick lanes of V1.
		    Indices.push_back(i);
		    Indices.push_back(i + InputElements);
		  }
		  return Builder.CreateShuffleVector(V0, V1, Indices);
		}

template<unsigned HighBit, unsigned OtherBits>		template<unsigned HighBit, unsigned OtherBits>
static llvm::Value *ARMMVEConstantSplat(CGBuilderTy &Builder, llvm::Type *VT) {		static llvm::Value *ARMMVEConstantSplat(CGBuilderTy &Builder, llvm::Type *VT) {
// MVE-specific helper function to make a vector splat of a constant such as		// MVE-specific helper function to make a vector splat of a constant such as
// UINT_MAX or INT_MIN, in which all bits below the highest one are equal.		// UINT_MAX or INT_MIN, in which all bits below the highest one are equal.
llvm::Type *T = VT->getVectorElementType();		llvm::Type *T = VT->getVectorElementType();
unsigned LaneBits = T->getPrimitiveSizeInBits();		unsigned LaneBits = T->getPrimitiveSizeInBits();
uint32_t Value = HighBit << (LaneBits - 1);		uint32_t Value = HighBit << (LaneBits - 1);
if (OtherBits)		if (OtherBits)
▲ Show 20 Lines • Show All 8,118 Lines • Show Last 20 Lines

clang/test/CodeGen/arm-mve-intrinsics/vmovn.c

This file was added.

				// NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py
				// RUN: %clang_cc1 -triple thumbv8.1m.main-arm-none-eabi -target-feature +mve -mfloat-abi hard -fallow-half-arguments-and-returns -O0 -disable-O0-optnone -S -emit-llvm -o - %s | opt -S -mem2reg | FileCheck --check-prefix=LE %s
				// RUN: %clang_cc1 -triple thumbebv8.1m.main-arm-none-eabi -target-feature +mve -mfloat-abi hard -fallow-half-arguments-and-returns -O0 -disable-O0-optnone -S -emit-llvm -o - %s | opt -S -mem2reg | FileCheck --check-prefix=BE %s
				// RUN: %clang_cc1 -triple thumbv8.1m.main-arm-none-eabi -target-feature +mve -mfloat-abi hard -fallow-half-arguments-and-returns -O0 -disable-O0-optnone -DPOLYMORPHIC -S -emit-llvm -o - %s | opt -S -mem2reg | FileCheck --check-prefix=LE %s
				// RUN: %clang_cc1 -triple thumbebv8.1m.main-arm-none-eabi -target-feature +mve -mfloat-abi hard -fallow-half-arguments-and-returns -O0 -disable-O0-optnone -DPOLYMORPHIC -S -emit-llvm -o - %s | opt -S -mem2reg | FileCheck --check-prefix=BE %s

				#include <arm_mve.h>

				// LE-LABEL: @test_vmovnbq_s16(
				// LE-NEXT: entry:
				// LE-NEXT: [[TMP0:%.*]] = shufflevector <16 x i8> [[A:%.*]], <16 x i8> undef, <16 x i32> <i32 1, i32 0, i32 3, i32 2, i32 5, i32 4, i32 7, i32 6, i32 9, i32 8, i32 11, i32 10, i32 13, i32 12, i32 15, i32 14>
				dmgreenUnsubmitted Not Done Reply Inline Actions These would be vreinterpret's in bigendian? dmgreen: These would be vreinterpret's in bigendian?
				simon_tathamAuthorUnsubmitted Done Reply Inline Actions Yes – they're constructed by the `vreinterpret` record in the clang-side tablegen. Good point; perhaps I should expand the clang test to include a check of the BE output too. simon_tatham: Yes – they're constructed by the `vreinterpret` record in the clang-side tablegen. Good point…
				// LE-NEXT: [[TMP1:%.*]] = bitcast <16 x i8> [[TMP0]] to <8 x i16>
				// LE-NEXT: [[TMP2:%.*]] = shufflevector <8 x i16> [[B:%.*]], <8 x i16> [[TMP1]], <16 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11, i32 4, i32 12, i32 5, i32 13, i32 6, i32 14, i32 7, i32 15>
				// LE-NEXT: [[TMP3:%.*]] = trunc <16 x i16> [[TMP2]] to <16 x i8>
				// LE-NEXT: ret <16 x i8> [[TMP3]]
				//
				// BE-LABEL: @test_vmovnbq_s16(
				// BE-NEXT: entry:
				// BE-NEXT: [[TMP0:%.*]] = shufflevector <16 x i8> [[A:%.*]], <16 x i8> undef, <16 x i32> <i32 1, i32 0, i32 3, i32 2, i32 5, i32 4, i32 7, i32 6, i32 9, i32 8, i32 11, i32 10, i32 13, i32 12, i32 15, i32 14>
				// BE-NEXT: [[TMP1:%.*]] = call <8 x i16> @llvm.arm.mve.vreinterpretq.v8i16.v16i8(<16 x i8> [[TMP0]])
				// BE-NEXT: [[TMP2:%.*]] = shufflevector <8 x i16> [[B:%.*]], <8 x i16> [[TMP1]], <16 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11, i32 4, i32 12, i32 5, i32 13, i32 6, i32 14, i32 7, i32 15>
				// BE-NEXT: [[TMP3:%.*]] = trunc <16 x i16> [[TMP2]] to <16 x i8>
				// BE-NEXT: ret <16 x i8> [[TMP3]]
				//
				int8x16_t test_vmovnbq_s16(int8x16_t a, int16x8_t b)
				{
				#ifdef POLYMORPHIC
				return vmovnbq(a, b);
				#else /* POLYMORPHIC */
				return vmovnbq_s16(a, b);
				#endif /* POLYMORPHIC */
				}

				// LE-LABEL: @test_vmovnbq_s32(
				// LE-NEXT: entry:
				// LE-NEXT: [[TMP0:%.*]] = shufflevector <8 x i16> [[A:%.*]], <8 x i16> undef, <8 x i32> <i32 1, i32 0, i32 3, i32 2, i32 5, i32 4, i32 7, i32 6>
				// LE-NEXT: [[TMP1:%.*]] = bitcast <8 x i16> [[TMP0]] to <4 x i32>
				// LE-NEXT: [[TMP2:%.*]] = shufflevector <4 x i32> [[B:%.*]], <4 x i32> [[TMP1]], <8 x i32> <i32 0, i32 4, i32 1, i32 5, i32 2, i32 6, i32 3, i32 7>
				// LE-NEXT: [[TMP3:%.*]] = trunc <8 x i32> [[TMP2]] to <8 x i16>
				// LE-NEXT: ret <8 x i16> [[TMP3]]
				//
				// BE-LABEL: @test_vmovnbq_s32(
				// BE-NEXT: entry:
				// BE-NEXT: [[TMP0:%.*]] = shufflevector <8 x i16> [[A:%.*]], <8 x i16> undef, <8 x i32> <i32 1, i32 0, i32 3, i32 2, i32 5, i32 4, i32 7, i32 6>
				// BE-NEXT: [[TMP1:%.*]] = call <4 x i32> @llvm.arm.mve.vreinterpretq.v4i32.v8i16(<8 x i16> [[TMP0]])
				// BE-NEXT: [[TMP2:%.*]] = shufflevector <4 x i32> [[B:%.*]], <4 x i32> [[TMP1]], <8 x i32> <i32 0, i32 4, i32 1, i32 5, i32 2, i32 6, i32 3, i32 7>
				// BE-NEXT: [[TMP3:%.*]] = trunc <8 x i32> [[TMP2]] to <8 x i16>
				// BE-NEXT: ret <8 x i16> [[TMP3]]
				//
				int16x8_t test_vmovnbq_s32(int16x8_t a, int32x4_t b)
				{
				#ifdef POLYMORPHIC
				return vmovnbq(a, b);
				#else /* POLYMORPHIC */
				return vmovnbq_s32(a, b);
				#endif /* POLYMORPHIC */
				}

				// LE-LABEL: @test_vmovnbq_u16(
				// LE-NEXT: entry:
				// LE-NEXT: [[TMP0:%.*]] = shufflevector <16 x i8> [[A:%.*]], <16 x i8> undef, <16 x i32> <i32 1, i32 0, i32 3, i32 2, i32 5, i32 4, i32 7, i32 6, i32 9, i32 8, i32 11, i32 10, i32 13, i32 12, i32 15, i32 14>
				// LE-NEXT: [[TMP1:%.*]] = bitcast <16 x i8> [[TMP0]] to <8 x i16>
				// LE-NEXT: [[TMP2:%.*]] = shufflevector <8 x i16> [[B:%.*]], <8 x i16> [[TMP1]], <16 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11, i32 4, i32 12, i32 5, i32 13, i32 6, i32 14, i32 7, i32 15>
				// LE-NEXT: [[TMP3:%.*]] = trunc <16 x i16> [[TMP2]] to <16 x i8>
				// LE-NEXT: ret <16 x i8> [[TMP3]]
				//
				// BE-LABEL: @test_vmovnbq_u16(
				// BE-NEXT: entry:
				// BE-NEXT: [[TMP0:%.*]] = shufflevector <16 x i8> [[A:%.*]], <16 x i8> undef, <16 x i32> <i32 1, i32 0, i32 3, i32 2, i32 5, i32 4, i32 7, i32 6, i32 9, i32 8, i32 11, i32 10, i32 13, i32 12, i32 15, i32 14>
				// BE-NEXT: [[TMP1:%.*]] = call <8 x i16> @llvm.arm.mve.vreinterpretq.v8i16.v16i8(<16 x i8> [[TMP0]])
				// BE-NEXT: [[TMP2:%.*]] = shufflevector <8 x i16> [[B:%.*]], <8 x i16> [[TMP1]], <16 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11, i32 4, i32 12, i32 5, i32 13, i32 6, i32 14, i32 7, i32 15>
				// BE-NEXT: [[TMP3:%.*]] = trunc <16 x i16> [[TMP2]] to <16 x i8>
				// BE-NEXT: ret <16 x i8> [[TMP3]]
				//
				uint8x16_t test_vmovnbq_u16(uint8x16_t a, uint16x8_t b)
				{
				#ifdef POLYMORPHIC
				return vmovnbq(a, b);
				#else /* POLYMORPHIC */
				return vmovnbq_u16(a, b);
				#endif /* POLYMORPHIC */
				}

				// LE-LABEL: @test_vmovnbq_u32(
				// LE-NEXT: entry:
				// LE-NEXT: [[TMP0:%.*]] = shufflevector <8 x i16> [[A:%.*]], <8 x i16> undef, <8 x i32> <i32 1, i32 0, i32 3, i32 2, i32 5, i32 4, i32 7, i32 6>
				// LE-NEXT: [[TMP1:%.*]] = bitcast <8 x i16> [[TMP0]] to <4 x i32>
				// LE-NEXT: [[TMP2:%.*]] = shufflevector <4 x i32> [[B:%.*]], <4 x i32> [[TMP1]], <8 x i32> <i32 0, i32 4, i32 1, i32 5, i32 2, i32 6, i32 3, i32 7>
				// LE-NEXT: [[TMP3:%.*]] = trunc <8 x i32> [[TMP2]] to <8 x i16>
				// LE-NEXT: ret <8 x i16> [[TMP3]]
				//
				// BE-LABEL: @test_vmovnbq_u32(
				// BE-NEXT: entry:
				// BE-NEXT: [[TMP0:%.*]] = shufflevector <8 x i16> [[A:%.*]], <8 x i16> undef, <8 x i32> <i32 1, i32 0, i32 3, i32 2, i32 5, i32 4, i32 7, i32 6>
				// BE-NEXT: [[TMP1:%.*]] = call <4 x i32> @llvm.arm.mve.vreinterpretq.v4i32.v8i16(<8 x i16> [[TMP0]])
				// BE-NEXT: [[TMP2:%.*]] = shufflevector <4 x i32> [[B:%.*]], <4 x i32> [[TMP1]], <8 x i32> <i32 0, i32 4, i32 1, i32 5, i32 2, i32 6, i32 3, i32 7>
				// BE-NEXT: [[TMP3:%.*]] = trunc <8 x i32> [[TMP2]] to <8 x i16>
				// BE-NEXT: ret <8 x i16> [[TMP3]]
				//
				uint16x8_t test_vmovnbq_u32(uint16x8_t a, uint32x4_t b)
				{
				#ifdef POLYMORPHIC
				return vmovnbq(a, b);
				#else /* POLYMORPHIC */
				return vmovnbq_u32(a, b);
				#endif /* POLYMORPHIC */
				}

				// LE-LABEL: @test_vmovntq_s16(
				// LE-NEXT: entry:
				// LE-NEXT: [[TMP0:%.*]] = bitcast <16 x i8> [[A:%.*]] to <8 x i16>
				// LE-NEXT: [[TMP1:%.*]] = shufflevector <8 x i16> [[TMP0]], <8 x i16> [[B:%.*]], <16 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11, i32 4, i32 12, i32 5, i32 13, i32 6, i32 14, i32 7, i32 15>
				// LE-NEXT: [[TMP2:%.*]] = trunc <16 x i16> [[TMP1]] to <16 x i8>
				// LE-NEXT: ret <16 x i8> [[TMP2]]
				//
				// BE-LABEL: @test_vmovntq_s16(
				// BE-NEXT: entry:
				// BE-NEXT: [[TMP0:%.*]] = call <8 x i16> @llvm.arm.mve.vreinterpretq.v8i16.v16i8(<16 x i8> [[A:%.*]])
				// BE-NEXT: [[TMP1:%.*]] = shufflevector <8 x i16> [[TMP0]], <8 x i16> [[B:%.*]], <16 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11, i32 4, i32 12, i32 5, i32 13, i32 6, i32 14, i32 7, i32 15>
				// BE-NEXT: [[TMP2:%.*]] = trunc <16 x i16> [[TMP1]] to <16 x i8>
				// BE-NEXT: ret <16 x i8> [[TMP2]]
				//
				int8x16_t test_vmovntq_s16(int8x16_t a, int16x8_t b)
				{
				#ifdef POLYMORPHIC
				return vmovntq(a, b);
				#else /* POLYMORPHIC */
				return vmovntq_s16(a, b);
				#endif /* POLYMORPHIC */
				}

				// LE-LABEL: @test_vmovntq_s32(
				// LE-NEXT: entry:
				// LE-NEXT: [[TMP0:%.*]] = bitcast <8 x i16> [[A:%.*]] to <4 x i32>
				// LE-NEXT: [[TMP1:%.*]] = shufflevector <4 x i32> [[TMP0]], <4 x i32> [[B:%.*]], <8 x i32> <i32 0, i32 4, i32 1, i32 5, i32 2, i32 6, i32 3, i32 7>
				// LE-NEXT: [[TMP2:%.*]] = trunc <8 x i32> [[TMP1]] to <8 x i16>
				// LE-NEXT: ret <8 x i16> [[TMP2]]
				//
				// BE-LABEL: @test_vmovntq_s32(
				// BE-NEXT: entry:
				// BE-NEXT: [[TMP0:%.*]] = call <4 x i32> @llvm.arm.mve.vreinterpretq.v4i32.v8i16(<8 x i16> [[A:%.*]])
				// BE-NEXT: [[TMP1:%.*]] = shufflevector <4 x i32> [[TMP0]], <4 x i32> [[B:%.*]], <8 x i32> <i32 0, i32 4, i32 1, i32 5, i32 2, i32 6, i32 3, i32 7>
				// BE-NEXT: [[TMP2:%.*]] = trunc <8 x i32> [[TMP1]] to <8 x i16>
				// BE-NEXT: ret <8 x i16> [[TMP2]]
				//
				int16x8_t test_vmovntq_s32(int16x8_t a, int32x4_t b)
				{
				#ifdef POLYMORPHIC
				return vmovntq(a, b);
				#else /* POLYMORPHIC */
				return vmovntq_s32(a, b);
				#endif /* POLYMORPHIC */
				}

				// LE-LABEL: @test_vmovntq_u16(
				// LE-NEXT: entry:
				// LE-NEXT: [[TMP0:%.*]] = bitcast <16 x i8> [[A:%.*]] to <8 x i16>
				// LE-NEXT: [[TMP1:%.*]] = shufflevector <8 x i16> [[TMP0]], <8 x i16> [[B:%.*]], <16 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11, i32 4, i32 12, i32 5, i32 13, i32 6, i32 14, i32 7, i32 15>
				// LE-NEXT: [[TMP2:%.*]] = trunc <16 x i16> [[TMP1]] to <16 x i8>
				// LE-NEXT: ret <16 x i8> [[TMP2]]
				//
				// BE-LABEL: @test_vmovntq_u16(
				// BE-NEXT: entry:
				// BE-NEXT: [[TMP0:%.*]] = call <8 x i16> @llvm.arm.mve.vreinterpretq.v8i16.v16i8(<16 x i8> [[A:%.*]])
				// BE-NEXT: [[TMP1:%.*]] = shufflevector <8 x i16> [[TMP0]], <8 x i16> [[B:%.*]], <16 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11, i32 4, i32 12, i32 5, i32 13, i32 6, i32 14, i32 7, i32 15>
				// BE-NEXT: [[TMP2:%.*]] = trunc <16 x i16> [[TMP1]] to <16 x i8>
				// BE-NEXT: ret <16 x i8> [[TMP2]]
				//
				uint8x16_t test_vmovntq_u16(uint8x16_t a, uint16x8_t b)
				{
				#ifdef POLYMORPHIC
				return vmovntq(a, b);
				#else /* POLYMORPHIC */
				return vmovntq_u16(a, b);
				#endif /* POLYMORPHIC */
				}

				// LE-LABEL: @test_vmovntq_u32(
				// LE-NEXT: entry:
				// LE-NEXT: [[TMP0:%.*]] = bitcast <8 x i16> [[A:%.*]] to <4 x i32>
				// LE-NEXT: [[TMP1:%.*]] = shufflevector <4 x i32> [[TMP0]], <4 x i32> [[B:%.*]], <8 x i32> <i32 0, i32 4, i32 1, i32 5, i32 2, i32 6, i32 3, i32 7>
				// LE-NEXT: [[TMP2:%.*]] = trunc <8 x i32> [[TMP1]] to <8 x i16>
				// LE-NEXT: ret <8 x i16> [[TMP2]]
				//
				// BE-LABEL: @test_vmovntq_u32(
				// BE-NEXT: entry:
				// BE-NEXT: [[TMP0:%.*]] = call <4 x i32> @llvm.arm.mve.vreinterpretq.v4i32.v8i16(<8 x i16> [[A:%.*]])
				// BE-NEXT: [[TMP1:%.*]] = shufflevector <4 x i32> [[TMP0]], <4 x i32> [[B:%.*]], <8 x i32> <i32 0, i32 4, i32 1, i32 5, i32 2, i32 6, i32 3, i32 7>
				// BE-NEXT: [[TMP2:%.*]] = trunc <8 x i32> [[TMP1]] to <8 x i16>
				// BE-NEXT: ret <8 x i16> [[TMP2]]
				//
				uint16x8_t test_vmovntq_u32(uint16x8_t a, uint32x4_t b)
				{
				#ifdef POLYMORPHIC
				return vmovntq(a, b);
				#else /* POLYMORPHIC */
				return vmovntq_u32(a, b);
				#endif /* POLYMORPHIC */
				}

clang/utils/TableGen/MveEmitter.cpp

Show First 20 Lines • Show All 1,182 Lines • ▼ Show 20 Lines	if (Op->getName() == "seq") {
if (!TypeRec->isSubClassOf("Type"))		if (!TypeRec->isSubClassOf("Type"))
PrintFatalError("unsignedflag's argument should be a type");		PrintFatalError("unsignedflag's argument should be a type");
if (const auto *ST = dyn_cast<ScalarType>(getType(TypeRec, Param))) {		if (const auto *ST = dyn_cast<ScalarType>(getType(TypeRec, Param))) {
return std::make_shared<IntLiteralResult>(		return std::make_shared<IntLiteralResult>(
getScalarType("u32"), ST->kind() == ScalarTypeKind::UnsignedInt);		getScalarType("u32"), ST->kind() == ScalarTypeKind::UnsignedInt);
} else {		} else {
PrintFatalError("unsignedflag's argument should be a scalar type");		PrintFatalError("unsignedflag's argument should be a scalar type");
}		}
		} else if (Op->getName() == "bitsize") {
		if (D->getNumArgs() != 1)
		PrintFatalError("bitsize should have exactly one argument");
		Record *TypeRec = cast<DefInit>(D->getArg(0))->getDef();
		if (!TypeRec->isSubClassOf("Type"))
		PrintFatalError("bitsize's argument should be a type");
		if (const auto *ST = dyn_cast<ScalarType>(getType(TypeRec, Param))) {
		return std::make_shared<IntLiteralResult>(getScalarType("u32"),
		ST->sizeInBits());
		} else {
		PrintFatalError("bitsize's argument should be a scalar type");
		}
} else {		} else {
std::vector<Result::Ptr> Args;		std::vector<Result::Ptr> Args;
for (unsigned i = 0, e = D->getNumArgs(); i < e; ++i)		for (unsigned i = 0, e = D->getNumArgs(); i < e; ++i)
Args.push_back(getCodeForDagArg(D, i, Scope, Param));		Args.push_back(getCodeForDagArg(D, i, Scope, Param));
if (Op->isSubClassOf("IRBuilderBase")) {		if (Op->isSubClassOf("IRBuilderBase")) {
std::set<unsigned> AddressArgs;		std::set<unsigned> AddressArgs;
std::map<unsigned, std::string> IntegerArgs;		std::map<unsigned, std::string> IntegerArgs;
for (Record *sp : Op->getValueAsListOfDefs("special_params")) {		for (Record *sp : Op->getValueAsListOfDefs("special_params")) {
▲ Show 20 Lines • Show All 741 Lines • Show Last 20 Lines

llvm/lib/Target/ARM/ARMInstrMVE.td

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 4,316 Lines • ▼ Show 20 Lines	let Predicates = [HasMVEInt] in {
def : Pat<(v8i16 (MVEvmovn (v8i16 MQPR:$Qd_src), (v8i16 MQPR:$Qm), (i32 0))),		def : Pat<(v8i16 (MVEvmovn (v8i16 MQPR:$Qd_src), (v8i16 MQPR:$Qm), (i32 0))),
(v8i16 (MVE_VMOVNi32bh (v8i16 MQPR:$Qd_src), (v8i16 MQPR:$Qm)))>;		(v8i16 (MVE_VMOVNi32bh (v8i16 MQPR:$Qd_src), (v8i16 MQPR:$Qm)))>;
def : Pat<(v8i16 (MVEvmovn (v8i16 MQPR:$Qd_src), (v8i16 MQPR:$Qm), (i32 1))),		def : Pat<(v8i16 (MVEvmovn (v8i16 MQPR:$Qd_src), (v8i16 MQPR:$Qm), (i32 1))),
(v8i16 (MVE_VMOVNi32th (v8i16 MQPR:$Qd_src), (v8i16 MQPR:$Qm)))>;		(v8i16 (MVE_VMOVNi32th (v8i16 MQPR:$Qd_src), (v8i16 MQPR:$Qm)))>;
def : Pat<(v16i8 (MVEvmovn (v16i8 MQPR:$Qd_src), (v16i8 MQPR:$Qm), (i32 0))),		def : Pat<(v16i8 (MVEvmovn (v16i8 MQPR:$Qd_src), (v16i8 MQPR:$Qm), (i32 0))),
(v16i8 (MVE_VMOVNi16bh (v16i8 MQPR:$Qd_src), (v16i8 MQPR:$Qm)))>;		(v16i8 (MVE_VMOVNi16bh (v16i8 MQPR:$Qd_src), (v16i8 MQPR:$Qm)))>;
def : Pat<(v16i8 (MVEvmovn (v16i8 MQPR:$Qd_src), (v16i8 MQPR:$Qm), (i32 1))),		def : Pat<(v16i8 (MVEvmovn (v16i8 MQPR:$Qd_src), (v16i8 MQPR:$Qm), (i32 1))),
(v16i8 (MVE_VMOVNi16th (v16i8 MQPR:$Qd_src), (v16i8 MQPR:$Qm)))>;		(v16i8 (MVE_VMOVNi16th (v16i8 MQPR:$Qd_src), (v16i8 MQPR:$Qm)))>;

		// Match an MVEvmovn with selector 1 (the value the patterns above map to
		// the 'th' instructions) whose operands are swapped, with $Qm first and an
		// ARMvrev32 / ARMvrev16 of $Qd_src second, and select it as the
		// corresponding 'bh' instruction on ($Qd_src, $Qm).
		// NOTE(review): presumably this is the DAG shape produced by the IR that
		// the vmovnbq intrinsic generates -- confirm against the lowering code.
		def : Pat<(v8i16 (MVEvmovn (v8i16 MQPR:$Qm),
		(v8i16 (ARMvrev32 MQPR:$Qd_src)), (i32 1))),
		(v8i16 (MVE_VMOVNi32bh (v8i16 MQPR:$Qd_src), (v8i16 MQPR:$Qm)))>;
		def : Pat<(v16i8 (MVEvmovn (v16i8 MQPR:$Qm),
		(v16i8 (ARMvrev16 MQPR:$Qd_src)), (i32 1))),
		(v16i8 (MVE_VMOVNi16bh (v16i8 MQPR:$Qd_src), (v16i8 MQPR:$Qm)))>;
}		}


class MVE_VCVT_ff<string iname, string suffix, bit op, bit T,		class MVE_VCVT_ff<string iname, string suffix, bit op, bit T,
list<dag> pattern=[]>		list<dag> pattern=[]>
: MVE_qDest_qSrc<iname, suffix, (outs MQPR:$Qd), (ins MQPR:$Qd_src, MQPR:$Qm),		: MVE_qDest_qSrc<iname, suffix, (outs MQPR:$Qd), (ins MQPR:$Qd_src, MQPR:$Qm),
"$Qd, $Qm", vpred_n, "$Qd = $Qd_src", pattern> {		"$Qd, $Qm", vpred_n, "$Qd = $Qd_src", pattern> {
let Inst{28} = op;		let Inst{28} = op;
let Inst{21-16} = 0b111111;		let Inst{21-16} = 0b111111;
let Inst{12} = T;		let Inst{12} = T;
let Inst{8-7} = 0b00;		let Inst{8-7} = 0b00;
▲ Show 20 Lines • Show All 2,287 Lines • Show Last 20 Lines

llvm/test/CodeGen/Thumb2/mve-intrinsics/vmovn.ll

This file was added.

				; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
				; RUN: llc -mtriple=thumbv8.1m.main -mattr=+mve -verify-machineinstrs -o - %s \| FileCheck --check-prefix=LE %s
				; RUN: llc -mtriple=thumbebv8.1m.main -mattr=+mve -verify-machineinstrs -o - %s \| FileCheck --check-prefix=BE %s

				define arm_aapcs_vfpcc <16 x i8> @test_vmovnbq_s16(<16 x i8> %a, <8 x i16> %b) {
				; LE-LABEL: test_vmovnbq_s16:
				; LE: @ %bb.0: @ %entry
				; LE-NEXT: vmovnb.i16 q0, q1
				; LE-NEXT: bx lr
				;
				; BE-LABEL: test_vmovnbq_s16:
				; BE: @ %bb.0: @ %entry
				; BE-NEXT: vrev64.16 q2, q1
				; BE-NEXT: vrev64.8 q1, q0
				; BE-NEXT: vmovnb.i16 q1, q2
				; BE-NEXT: vrev64.8 q0, q1
				; BE-NEXT: bx lr
				entry:
				%0 = shufflevector <16 x i8> %a, <16 x i8> undef, <16 x i32> <i32 1, i32 0, i32 3, i32 2, i32 5, i32 4, i32 7, i32 6, i32 9, i32 8, i32 11, i32 10, i32 13, i32 12, i32 15, i32 14>
				%1 = tail call <8 x i16> @llvm.arm.mve.vreinterpretq.v8i16.v16i8(<16 x i8> %0)
				%2 = shufflevector <8 x i16> %b, <8 x i16> %1, <16 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11, i32 4, i32 12, i32 5, i32 13, i32 6, i32 14, i32 7, i32 15>
				%3 = trunc <16 x i16> %2 to <16 x i8>
				ret <16 x i8> %3
				}

				define arm_aapcs_vfpcc <8 x i16> @test_vmovnbq_s32(<8 x i16> %a, <4 x i32> %b) {
				; LE-LABEL: test_vmovnbq_s32:
				; LE: @ %bb.0: @ %entry
				; LE-NEXT: vmovnb.i32 q0, q1
				; LE-NEXT: bx lr
				;
				; BE-LABEL: test_vmovnbq_s32:
				; BE: @ %bb.0: @ %entry
				; BE-NEXT: vrev64.32 q2, q1
				; BE-NEXT: vrev64.16 q1, q0
				; BE-NEXT: vmovnb.i32 q1, q2
				; BE-NEXT: vrev64.16 q0, q1
				; BE-NEXT: bx lr
				entry:
				%0 = shufflevector <8 x i16> %a, <8 x i16> undef, <8 x i32> <i32 1, i32 0, i32 3, i32 2, i32 5, i32 4, i32 7, i32 6>
				%1 = tail call <4 x i32> @llvm.arm.mve.vreinterpretq.v4i32.v8i16(<8 x i16> %0)
				%2 = shufflevector <4 x i32> %b, <4 x i32> %1, <8 x i32> <i32 0, i32 4, i32 1, i32 5, i32 2, i32 6, i32 3, i32 7>
				%3 = trunc <8 x i32> %2 to <8 x i16>
				ret <8 x i16> %3
				}

				define arm_aapcs_vfpcc <16 x i8> @test_vmovnbq_u16(<16 x i8> %a, <8 x i16> %b) {
				; LE-LABEL: test_vmovnbq_u16:
				; LE: @ %bb.0: @ %entry
				; LE-NEXT: vmovnb.i16 q0, q1
				; LE-NEXT: bx lr
				;
				; BE-LABEL: test_vmovnbq_u16:
				; BE: @ %bb.0: @ %entry
				; BE-NEXT: vrev64.16 q2, q1
				; BE-NEXT: vrev64.8 q1, q0
				; BE-NEXT: vmovnb.i16 q1, q2
				; BE-NEXT: vrev64.8 q0, q1
				; BE-NEXT: bx lr
				entry:
				%0 = shufflevector <16 x i8> %a, <16 x i8> undef, <16 x i32> <i32 1, i32 0, i32 3, i32 2, i32 5, i32 4, i32 7, i32 6, i32 9, i32 8, i32 11, i32 10, i32 13, i32 12, i32 15, i32 14>
				%1 = tail call <8 x i16> @llvm.arm.mve.vreinterpretq.v8i16.v16i8(<16 x i8> %0)
				%2 = shufflevector <8 x i16> %b, <8 x i16> %1, <16 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11, i32 4, i32 12, i32 5, i32 13, i32 6, i32 14, i32 7, i32 15>
				%3 = trunc <16 x i16> %2 to <16 x i8>
				ret <16 x i8> %3
				}

				define arm_aapcs_vfpcc <8 x i16> @test_vmovnbq_u32(<8 x i16> %a, <4 x i32> %b) {
				; LE-LABEL: test_vmovnbq_u32:
				; LE: @ %bb.0: @ %entry
				; LE-NEXT: vmovnb.i32 q0, q1
				; LE-NEXT: bx lr
				;
				; BE-LABEL: test_vmovnbq_u32:
				; BE: @ %bb.0: @ %entry
				; BE-NEXT: vrev64.32 q2, q1
				; BE-NEXT: vrev64.16 q1, q0
				; BE-NEXT: vmovnb.i32 q1, q2
				; BE-NEXT: vrev64.16 q0, q1
				; BE-NEXT: bx lr
				entry:
				%0 = shufflevector <8 x i16> %a, <8 x i16> undef, <8 x i32> <i32 1, i32 0, i32 3, i32 2, i32 5, i32 4, i32 7, i32 6>
				%1 = tail call <4 x i32> @llvm.arm.mve.vreinterpretq.v4i32.v8i16(<8 x i16> %0)
				%2 = shufflevector <4 x i32> %b, <4 x i32> %1, <8 x i32> <i32 0, i32 4, i32 1, i32 5, i32 2, i32 6, i32 3, i32 7>
				%3 = trunc <8 x i32> %2 to <8 x i16>
				ret <8 x i16> %3
				}

				define arm_aapcs_vfpcc <16 x i8> @test_vmovntq_s16(<16 x i8> %a, <8 x i16> %b) {
				; LE-LABEL: test_vmovntq_s16:
				; LE: @ %bb.0: @ %entry
				; LE-NEXT: vmovnt.i16 q0, q1
				; LE-NEXT: bx lr
				;
				; BE-LABEL: test_vmovntq_s16:
				; BE: @ %bb.0: @ %entry
				; BE-NEXT: vrev64.16 q2, q1
				; BE-NEXT: vrev64.8 q1, q0
				; BE-NEXT: vmovnt.i16 q1, q2
				; BE-NEXT: vrev64.8 q0, q1
				; BE-NEXT: bx lr
				entry:
				%0 = tail call <8 x i16> @llvm.arm.mve.vreinterpretq.v8i16.v16i8(<16 x i8> %a)
				%1 = shufflevector <8 x i16> %0, <8 x i16> %b, <16 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11, i32 4, i32 12, i32 5, i32 13, i32 6, i32 14, i32 7, i32 15>
				%2 = trunc <16 x i16> %1 to <16 x i8>
				ret <16 x i8> %2
				}

				define arm_aapcs_vfpcc <8 x i16> @test_vmovntq_s32(<8 x i16> %a, <4 x i32> %b) {
				; LE-LABEL: test_vmovntq_s32:
				; LE: @ %bb.0: @ %entry
				; LE-NEXT: vmovnt.i32 q0, q1
				; LE-NEXT: bx lr
				;
				; BE-LABEL: test_vmovntq_s32:
				; BE: @ %bb.0: @ %entry
				; BE-NEXT: vrev64.32 q2, q1
				; BE-NEXT: vrev64.16 q1, q0
				; BE-NEXT: vmovnt.i32 q1, q2
				; BE-NEXT: vrev64.16 q0, q1
				; BE-NEXT: bx lr
				entry:
				%0 = tail call <4 x i32> @llvm.arm.mve.vreinterpretq.v4i32.v8i16(<8 x i16> %a)
				%1 = shufflevector <4 x i32> %0, <4 x i32> %b, <8 x i32> <i32 0, i32 4, i32 1, i32 5, i32 2, i32 6, i32 3, i32 7>
				%2 = trunc <8 x i32> %1 to <8 x i16>
				ret <8 x i16> %2
				}

				define arm_aapcs_vfpcc <16 x i8> @test_vmovntq_u16(<16 x i8> %a, <8 x i16> %b) {
				; LE-LABEL: test_vmovntq_u16:
				; LE: @ %bb.0: @ %entry
				; LE-NEXT: vmovnt.i16 q0, q1
				; LE-NEXT: bx lr
				;
				; BE-LABEL: test_vmovntq_u16:
				; BE: @ %bb.0: @ %entry
				; BE-NEXT: vrev64.16 q2, q1
				; BE-NEXT: vrev64.8 q1, q0
				; BE-NEXT: vmovnt.i16 q1, q2
				; BE-NEXT: vrev64.8 q0, q1
				; BE-NEXT: bx lr
				entry:
				%0 = tail call <8 x i16> @llvm.arm.mve.vreinterpretq.v8i16.v16i8(<16 x i8> %a)
				%1 = shufflevector <8 x i16> %0, <8 x i16> %b, <16 x i32> <i32 0, i32 8, i32 1, i32 9, i32 2, i32 10, i32 3, i32 11, i32 4, i32 12, i32 5, i32 13, i32 6, i32 14, i32 7, i32 15>
				%2 = trunc <16 x i16> %1 to <16 x i8>
				ret <16 x i8> %2
				}

				define arm_aapcs_vfpcc <8 x i16> @test_vmovntq_u32(<8 x i16> %a, <4 x i32> %b) {
				; LE-LABEL: test_vmovntq_u32:
				; LE: @ %bb.0: @ %entry
				; LE-NEXT: vmovnt.i32 q0, q1
				; LE-NEXT: bx lr
				;
				; BE-LABEL: test_vmovntq_u32:
				; BE: @ %bb.0: @ %entry
				; BE-NEXT: vrev64.32 q2, q1
				; BE-NEXT: vrev64.16 q1, q0
				; BE-NEXT: vmovnt.i32 q1, q2
				; BE-NEXT: vrev64.16 q0, q1
				; BE-NEXT: bx lr
				entry:
				%0 = tail call <4 x i32> @llvm.arm.mve.vreinterpretq.v4i32.v8i16(<8 x i16> %a)
				%1 = shufflevector <4 x i32> %0, <4 x i32> %b, <8 x i32> <i32 0, i32 4, i32 1, i32 5, i32 2, i32 6, i32 3, i32 7>
				%2 = trunc <8 x i32> %1 to <8 x i16>
				ret <8 x i16> %2
				}

				declare <8 x i16> @llvm.arm.mve.vreinterpretq.v8i16.v16i8(<16 x i8>)
				declare <4 x i32> @llvm.arm.mve.vreinterpretq.v4i32.v8i16(<8 x i16>)

This is an archive of the discontinued LLVM Phabricator instance.

[ARM,MVE] Add the vmovnbq,vmovntq intrinsic family.
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 245105

clang/include/clang/Basic/arm_mve.td

clang/include/clang/Basic/arm_mve_defs.td

clang/lib/CodeGen/CGBuiltin.cpp

clang/test/CodeGen/arm-mve-intrinsics/vmovn.c

clang/utils/TableGen/MveEmitter.cpp

llvm/lib/Target/ARM/ARMInstrMVE.td

llvm/test/CodeGen/Thumb2/mve-intrinsics/vmovn.ll

This is an archive of the discontinued LLVM Phabricator instance.

[ARM,MVE] Add the vmovnbq,vmovntq intrinsic family.ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 245105

clang/include/clang/Basic/arm_mve.td

clang/include/clang/Basic/arm_mve_defs.td

clang/lib/CodeGen/CGBuiltin.cpp

clang/test/CodeGen/arm-mve-intrinsics/vmovn.c

clang/utils/TableGen/MveEmitter.cpp

llvm/lib/Target/ARM/ARMInstrMVE.td

llvm/test/CodeGen/Thumb2/mve-intrinsics/vmovn.ll

[ARM,MVE] Add the vmovnbq,vmovntq intrinsic family.
ClosedPublic