Diff 273974

mlir/lib/Conversion/SPIRVToLLVM/ConvertSPIRVToLLVM.cpp

Show First 20 Lines • Show All 47 Lines • ▼ Show 20 Lines	if (type.isIntOrFloat())
return type.getIntOrFloatBitWidth();		return type.getIntOrFloatBitWidth();
auto vecType = type.dyn_cast<VectorType>();		auto vecType = type.dyn_cast<VectorType>();
auto elementType = vecType.getElementType();		auto elementType = vecType.getElementType();
assert(elementType.isIntOrFloat() &&		assert(elementType.isIntOrFloat() &&
"only integers and floats have a bitwidth");		"only integers and floats have a bitwidth");
return elementType.getIntOrFloatBitWidth();		return elementType.getIntOrFloatBitWidth();
}		}

		/// Returns the bit width of LLVMType integer or vector.
		static unsigned getLLVMTypeBitWidth(LLVM::LLVMType type) {
		return type.isVectorTy() ? type.getVectorElementType()
		.getUnderlyingType()
		->getIntegerBitWidth()
		: type.getUnderlyingType()->getIntegerBitWidth();
		}

/// Creates `IntegerAttribute` with all bits set for given type		/// Creates `IntegerAttribute` with all bits set for given type
IntegerAttr minusOneIntegerAttribute(Type type, Builder builder) {		IntegerAttr minusOneIntegerAttribute(Type type, Builder builder) {
if (auto vecType = type.dyn_cast<VectorType>()) {		if (auto vecType = type.dyn_cast<VectorType>()) {
auto integerType = vecType.getElementType().cast<IntegerType>();		auto integerType = vecType.getElementType().cast<IntegerType>();
return builder.getIntegerAttr(integerType, -1);		return builder.getIntegerAttr(integerType, -1);
}		}
auto integerType = type.cast<IntegerType>();		auto integerType = type.cast<IntegerType>();
return builder.getIntegerAttr(integerType, -1);		return builder.getIntegerAttr(integerType, -1);
}		}

		/// Creates `llvm.mlir.constant` with all bits set for the given type.
		static Value createConstantAllBitsSet(Location loc, Type srcType, Type dstType,
		ConversionPatternRewriter &rewriter) {
		antiagainstUnsubmitted Done Reply Inline Actions We can just use `PatternRewriter` here unless we need functionality from the `ConversionPatternRewriter` subclass. This makes the function more widely applicable, so if you later need to call it somewhere else there is no need to change it again. antiagainst: We can just use `PatternRewriter` here unless we need functionality from the…
		if (srcType.isa<VectorType>())
		rriddleUnsubmitted Done Reply Inline Actions nit: Please add braces here, the body isn't really "trivial" rriddle: nit: Please add braces here, the body isn't really "trivial"
		return rewriter.create<LLVM::ConstantOp>(
		loc, dstType,
		SplatElementsAttr::get(srcType.cast<ShapedType>(),
		minusOneIntegerAttribute(srcType, rewriter)));
		return rewriter.create<LLVM::ConstantOp>(
		loc, dstType, minusOneIntegerAttribute(srcType, rewriter));
		}

		/// Truncates or extends the value. If the bitwidth of the value is the same
		/// as `dstType` bitwidth, the value remains unchanged.
		ftynseUnsubmitted Done Reply Inline Actions Couldn't parse this sentence ftynse: Couldn't parse this sentence
		static Value optionallyTruncateOrExtend(Location loc, Value value, Type dstType,
		ConversionPatternRewriter &rewriter) {
		ftynseUnsubmitted Done Reply Inline Actions Nit: this could use a more descriptive name, something like `optionallyTruncateOrExtend`. There are many other types of casting. ftynse: Nit: this could use a more descriptive name, something like `optionallyTruncateOrExtend`. There…
		auto srcType = value.getType();
		auto llvmType = dstType.cast<LLVM::LLVMType>();
		unsigned targetBitWidth = getLLVMTypeBitWidth(llvmType);
		unsigned valueBitWidth =
		ftynseUnsubmitted Done Reply Inline Actions Would it be possible to factor this out into `getLLVMTypeBitWidth()`, and call it here and inside `getValueBitWidth` ? ftynse: Would it be possible to factor this out into `getLLVMTypeBitWidth()`, and call it here and…
		srcType.isa<LLVM::LLVMType>()
		? getLLVMTypeBitWidth(srcType.cast<LLVM::LLVMType>())
		: getBitWidth(srcType);

		if (valueBitWidth < targetBitWidth)
		return rewriter.create<LLVM::ZExtOp>(loc, llvmType, value);
		// If the bit widths of `Count` and `Offset` are greater than the bit width
		antiagainstUnsubmitted Done Reply Inline Actions It seems this comment should not be placed here. This is a generic utility function and we can document its contract as "unconditionally truncate without checking the value". This comment should be placed at the call site in the bitfield insert pattern. antiagainst: It seems this comment should not be placed here. This is a generic utility function and we can…
		antiagainstUnsubmitted Done Reply Inline Actions Or actually make the comment of this function explicit that this is for bitfield ops, which I think is the case for the next patch. antiagainst: Or actually make the comment of this function explicit that this is for bitfield ops, which I…
		// of the target type, they are truncated. Truncation is safe since `Count`
		// and `Offset` must be no more than 64 for op behaviour to be defined. Hence,
		// both values can be expressed in 8 bits.
		if (valueBitWidth > targetBitWidth)
		return rewriter.create<LLVM::TruncOp>(loc, llvmType, value);
		return value;
		}

		/// Broadcasts the value to vector with `numElements` number of elements
		static void broadcast(Location loc, Value toBroadcast, Value &broadcasted,
		antiagainstUnsubmitted Done Reply Inline Actions Why not use the function return value for `broadcasted`? antiagainst: Why not use the function return value for `broadcasted`?
		unsigned numElements, LLVMTypeConverter &typeConverter,
		ConversionPatternRewriter &rewriter) {
		auto vectorType = VectorType::get(numElements, toBroadcast.getType());
		auto llvmVectorType = typeConverter.convertType(vectorType);
		auto llvmI32Type = typeConverter.convertType(rewriter.getIntegerType(32));
		broadcasted = rewriter.create<LLVM::UndefOp>(loc, llvmVectorType);
		for (unsigned i = 0; i < numElements; ++i) {
		auto index = rewriter.create<LLVM::ConstantOp>(
		ftynseUnsubmitted Done Reply Inline Actions Don't evaluate the upper bound on each iteration. We routinely use the idiom `for (unsigned i = 0, e = vectorType.getNumElements(); i < e; ++i)` for this reason. Also, MLIR and LLVM overwhelmingly use `unsigned` for sizes and loops around them. ftynse: Don't evaluate the upper bound on each iteration. We routinely use the idiom `for (unsigned i =…
		loc, llvmI32Type, rewriter.getI32IntegerAttr(i));
		broadcasted = rewriter.create<LLVM::InsertElementOp>(
		ftynseUnsubmitted Done Reply Inline Actions Can we cache the result of converting the type in a local variable? ftynse: Can we cache the result of converting the type in a local variable?
		loc, llvmVectorType, broadcasted, toBroadcast, index);
		}
		}

//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//
// Operation conversion		// Operation conversion
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//

namespace {		namespace {

		class BitFieldInsertPattern
		: public SPIRVToLLVMConversion<spirv::BitFieldInsertOp> {
		public:
		using SPIRVToLLVMConversion<spirv::BitFieldInsertOp>::SPIRVToLLVMConversion;

		LogicalResult
		matchAndRewrite(spirv::BitFieldInsertOp op, ArrayRef<Value> operands,
		ConversionPatternRewriter &rewriter) const override {
		auto srcType = op.getType();
		auto dstType = this->typeConverter.convertType(srcType);
		rriddleUnsubmitted Done Reply Inline Actions nit: `this->` shouldn't be necessary unless you are inside of a template. rriddle: nit: `this->` shouldn't be necessary unless you are inside of a template.
		if (!dstType)
		return failure();
		Location loc = op.getLoc();

		// Broadcast `Offset` and `Count` to match the type of `Base` and `Insert`.
		// If `Base` is of a vector type, construct a vector that has:
		// - same number of elements as `Base`
		// - each element has the type that is the same as the type of `Offset` or
		// `Count`
		antiagainstUnsubmitted Done Reply Inline Actions Super nit: align `Count` with `each` antiagainst: Super nit: align `Count` with `each`
		// - each element has the same value as `Offset` or `Count`
		Value offset;
		Value count;
		if (auto vectorType = srcType.dyn_cast<VectorType>()) {
		unsigned numElements = vectorType.getNumElements();
		broadcast(loc, op.offset(), offset, numElements, typeConverter, rewriter);
		broadcast(loc, op.count(), count, numElements, typeConverter, rewriter);
		} else {
		offset = op.offset();
		count = op.count();
		}

		// Create a mask with all bits set of the same type as `srcType`
		Value minusOne = createConstantAllBitsSet(loc, srcType, dstType, rewriter);

		// Need to cast `Offset` and `Count` if their bit width is different
		// from `Base` bit width.
		Value optionallyCastedCount =
		optionallyTruncateOrExtend(loc, count, dstType, rewriter);
		Value optionallyCastedOffset =
		optionallyTruncateOrExtend(loc, offset, dstType, rewriter);

		// Create a mask with bits set outside [Offset, Offset + Count - 1].
		Value maskShiftedByCount = rewriter.create<LLVM::ShlOp>(
		loc, dstType, minusOne, optionallyCastedCount);
		Value negated = rewriter.create<LLVM::XOrOp>(loc, dstType,
		maskShiftedByCount, minusOne);
		Value maskShiftedByCountAndOffset = rewriter.create<LLVM::ShlOp>(
		loc, dstType, negated, optionallyCastedOffset);
		Value mask = rewriter.create<LLVM::XOrOp>(
		loc, dstType, maskShiftedByCountAndOffset, minusOne);

		// Extract unchanged bits from the `Base` that are outside of
		// [Offset, Offset + Count - 1]. Then `or` with shifted `Insert`.
		Value baseAndMask =
		rewriter.create<LLVM::AndOp>(loc, dstType, op.base(), mask);
		Value insertShiftedByOffset = rewriter.create<LLVM::ShlOp>(
		loc, dstType, op.insert(), optionallyCastedOffset);
		rewriter.replaceOpWithNewOp<LLVM::OrOp>(op, dstType, baseAndMask,
		insertShiftedByOffset);
		ftynseUnsubmitted Done Reply Inline Actions I think this needs to replace the uses of `op` with the results of the newly created OrOp ftynse: I think this needs to replace the uses of `op` with the results of the newly created OrOp
		return success();
		}
		};

/// Converts SPIR-V operations that have straightforward LLVM equivalent		/// Converts SPIR-V operations that have straightforward LLVM equivalent
/// into LLVM dialect operations.		/// into LLVM dialect operations.
template <typename SPIRVOp, typename LLVMOp>		template <typename SPIRVOp, typename LLVMOp>
class DirectConversionPattern : public SPIRVToLLVMConversion<SPIRVOp> {		class DirectConversionPattern : public SPIRVToLLVMConversion<SPIRVOp> {
public:		public:
using SPIRVToLLVMConversion<SPIRVOp>::SPIRVToLLVMConversion;		using SPIRVToLLVMConversion<SPIRVOp>::SPIRVToLLVMConversion;

LogicalResult		LogicalResult
▲ Show 20 Lines • Show All 294 Lines • ▼ Show 20 Lines	patterns.insert<
DirectConversionPattern<spirv::FRemOp, LLVM::FRemOp>,		DirectConversionPattern<spirv::FRemOp, LLVM::FRemOp>,
DirectConversionPattern<spirv::FSubOp, LLVM::FSubOp>,		DirectConversionPattern<spirv::FSubOp, LLVM::FSubOp>,
DirectConversionPattern<spirv::SDivOp, LLVM::SDivOp>,		DirectConversionPattern<spirv::SDivOp, LLVM::SDivOp>,
DirectConversionPattern<spirv::SRemOp, LLVM::SRemOp>,		DirectConversionPattern<spirv::SRemOp, LLVM::SRemOp>,
DirectConversionPattern<spirv::UDivOp, LLVM::UDivOp>,		DirectConversionPattern<spirv::UDivOp, LLVM::UDivOp>,
DirectConversionPattern<spirv::UModOp, LLVM::URemOp>,		DirectConversionPattern<spirv::UModOp, LLVM::URemOp>,

// Bitwise ops		// Bitwise ops
		BitFieldInsertPattern,
DirectConversionPattern<spirv::BitwiseAndOp, LLVM::AndOp>,		DirectConversionPattern<spirv::BitwiseAndOp, LLVM::AndOp>,
DirectConversionPattern<spirv::BitwiseOrOp, LLVM::OrOp>,		DirectConversionPattern<spirv::BitwiseOrOp, LLVM::OrOp>,
DirectConversionPattern<spirv::BitwiseXorOp, LLVM::XOrOp>,		DirectConversionPattern<spirv::BitwiseXorOp, LLVM::XOrOp>,
NotPattern<spirv::NotOp>,		NotPattern<spirv::NotOp>,

// Cast ops		// Cast ops
DirectConversionPattern<spirv::ConvertFToSOp, LLVM::FPToSIOp>,		DirectConversionPattern<spirv::ConvertFToSOp, LLVM::FPToSIOp>,
DirectConversionPattern<spirv::ConvertFToUOp, LLVM::FPToUIOp>,		DirectConversionPattern<spirv::ConvertFToUOp, LLVM::FPToUIOp>,
▲ Show 20 Lines • Show All 59 Lines • Show Last 20 Lines

mlir/test/Conversion/SPIRVToLLVM/bitwise-ops-to-llvm.mlir

	// RUN: mlir-opt -convert-spirv-to-llvm %s \| FileCheck %s			// RUN: mlir-opt -convert-spirv-to-llvm %s \| FileCheck %s

	//===----------------------------------------------------------------------===//			//===----------------------------------------------------------------------===//
				// spv.BitFieldInsert
				//===----------------------------------------------------------------------===//

				// CHECK-LABEL: func @bitfield_insert_scalar_same_bit_width
				// CHECK-SAME: %[[BASE:.]]: !llvm.i32, %[[INSERT:.]]: !llvm.i32, %[[OFFSET:.]]: !llvm.i32, %[[COUNT:.]]: !llvm.i32
				func @bitfield_insert_scalar_same_bit_width(%base: i32, %insert: i32, %offset: i32, %count: i32) {
				// CHECK: %[[MINUS_ONE:.*]] = llvm.mlir.constant(-1 : i32) : !llvm.i32
				// CHECK: %[[T0:.*]] = llvm.shl %[[MINUS_ONE]], %[[COUNT]] : !llvm.i32
				// CHECK: %[[T1:.*]] = llvm.xor %[[T0]], %[[MINUS_ONE]] : !llvm.i32
				// CHECK: %[[T2:.*]] = llvm.shl %[[T1]], %[[OFFSET]] : !llvm.i32
				// CHECK: %[[MASK:.*]] = llvm.xor %[[T2]], %[[MINUS_ONE]] : !llvm.i32
				// CHECK: %[[NEW_BASE:.*]] = llvm.and %[[BASE]], %[[MASK]] : !llvm.i32
				// CHECK: %[[SHIFTED_INSERT:.*]] = llvm.shl %[[INSERT]], %[[OFFSET]] : !llvm.i32
				// CHECK: %{{.*}} = llvm.or %[[NEW_BASE]], %[[SHIFTED_INSERT]] : !llvm.i32
				%0 = spv.BitFieldInsert %base, %insert, %offset, %count : i32, i32, i32
				return
				}

				// CHECK-LABEL: func @bitfield_insert_scalar_smaller_bit_width
				// CHECK-SAME: %[[BASE:.]]: !llvm.i64, %[[INSERT:.]]: !llvm.i64, %[[OFFSET:.]]: !llvm.i8, %[[COUNT:.]]: !llvm.i8
				func @bitfield_insert_scalar_smaller_bit_width(%base: i64, %insert: i64, %offset: i8, %count: i8) {
				// CHECK: %[[MINUS_ONE:.*]] = llvm.mlir.constant(-1 : i64) : !llvm.i64
				// CHECK: %[[EXT_COUNT:.*]] = llvm.zext %[[COUNT]] : !llvm.i8 to !llvm.i64
				// CHECK: %[[EXT_OFFSET:.*]] = llvm.zext %[[OFFSET]] : !llvm.i8 to !llvm.i64
				// CHECK: %[[T0:.*]] = llvm.shl %[[MINUS_ONE]], %[[EXT_COUNT]] : !llvm.i64
				// CHECK: %[[T1:.*]] = llvm.xor %[[T0]], %[[MINUS_ONE]] : !llvm.i64
				// CHECK: %[[T2:.*]] = llvm.shl %[[T1]], %[[EXT_OFFSET]] : !llvm.i64
				// CHECK: %[[MASK:.*]] = llvm.xor %[[T2]], %[[MINUS_ONE]] : !llvm.i64
				// CHECK: %[[NEW_BASE:.*]] = llvm.and %[[BASE]], %[[MASK]] : !llvm.i64
				// CHECK: %[[SHIFTED_INSERT:.*]] = llvm.shl %[[INSERT]], %[[EXT_OFFSET]] : !llvm.i64
				// CHECK: %{{.*}} = llvm.or %[[NEW_BASE]], %[[SHIFTED_INSERT]] : !llvm.i64
				%0 = spv.BitFieldInsert %base, %insert, %offset, %count : i64, i8, i8
				return
				}

				// CHECK-LABEL: func @bitfield_insert_scalar_greater_bit_width
				// CHECK-SAME: %[[BASE:.]]: !llvm.i16, %[[INSERT:.]]: !llvm.i16, %[[OFFSET:.]]: !llvm.i32, %[[COUNT:.]]: !llvm.i64
				func @bitfield_insert_scalar_greater_bit_width(%base: i16, %insert: i16, %offset: i32, %count: i64) {
				// CHECK: %[[MINUS_ONE:.*]] = llvm.mlir.constant(-1 : i16) : !llvm.i16
				// CHECK: %[[TRUNC_COUNT:.*]] = llvm.trunc %[[COUNT]] : !llvm.i64 to !llvm.i16
				// CHECK: %[[TRUNC_OFFSET:.*]] = llvm.trunc %[[OFFSET]] : !llvm.i32 to !llvm.i16
				// CHECK: %[[T0:.*]] = llvm.shl %[[MINUS_ONE]], %[[TRUNC_COUNT]] : !llvm.i16
				// CHECK: %[[T1:.*]] = llvm.xor %[[T0]], %[[MINUS_ONE]] : !llvm.i16
				// CHECK: %[[T2:.*]] = llvm.shl %[[T1]], %[[TRUNC_OFFSET]] : !llvm.i16
				// CHECK: %[[MASK:.*]] = llvm.xor %[[T2]], %[[MINUS_ONE]] : !llvm.i16
				// CHECK: %[[NEW_BASE:.*]] = llvm.and %[[BASE]], %[[MASK]] : !llvm.i16
				// CHECK: %[[SHIFTED_INSERT:.*]] = llvm.shl %[[INSERT]], %[[TRUNC_OFFSET]] : !llvm.i16
				// CHECK: %{{.*}} = llvm.or %[[NEW_BASE]], %[[SHIFTED_INSERT]] : !llvm.i16
				%0 = spv.BitFieldInsert %base, %insert, %offset, %count : i16, i32, i64
				return
				}

				// CHECK-LABEL: func @bitfield_insert_vector_same_bit_width
				// CHECK-SAME: %[[BASE:.]]: !llvm<"<2 x i32>">, %[[INSERT:.]]: !llvm<"<2 x i32>">, %[[OFFSET:.]]: !llvm.i32, %[[COUNT:.]]: !llvm.i32
				func @bitfield_insert_vector_same_bit_width(%base: vector<2xi32>, %insert: vector<2xi32>, %offset: i32, %count: i32) {
				// CHECK: %[[OFFSET_V0:.*]] = llvm.mlir.undef : !llvm<"<2 x i32>">
				// CHECK: %[[ZERO:.*]] = llvm.mlir.constant(0 : i32) : !llvm.i32
				// CHECK: %[[OFFSET_V1:.*]] = llvm.insertelement %[[OFFSET]], %[[OFFSET_V0]][%[[ZERO]] : !llvm.i32] : !llvm<"<2 x i32>">
				// CHECK: %[[ONE:.*]] = llvm.mlir.constant(1 : i32) : !llvm.i32
				// CHECK: %[[OFFSET_V2:.*]] = llvm.insertelement %[[OFFSET]], %[[OFFSET_V1]][%[[ONE]] : !llvm.i32] : !llvm<"<2 x i32>">
				// CHECK: %[[COUNT_V0:.*]] = llvm.mlir.undef : !llvm<"<2 x i32>">
				// CHECK: %[[ZERO:.*]] = llvm.mlir.constant(0 : i32) : !llvm.i32
				// CHECK: %[[COUNT_V1:.*]] = llvm.insertelement %[[COUNT]], %[[COUNT_V0]][%[[ZERO]] : !llvm.i32] : !llvm<"<2 x i32>">
				// CHECK: %[[ONE:.*]] = llvm.mlir.constant(1 : i32) : !llvm.i32
				// CHECK: %[[COUNT_V2:.*]] = llvm.insertelement %[[COUNT]], %[[COUNT_V1]][%[[ONE]] : !llvm.i32] : !llvm<"<2 x i32>">
				// CHECK: %[[MINUS_ONE:.*]] = llvm.mlir.constant(dense<-1> : vector<2xi32>) : !llvm<"<2 x i32>">
				// CHECK: %[[T0:.*]] = llvm.shl %[[MINUS_ONE]], %[[COUNT_V2]] : !llvm<"<2 x i32>">
				// CHECK: %[[T1:.*]] = llvm.xor %[[T0]], %[[MINUS_ONE]] : !llvm<"<2 x i32>">
				// CHECK: %[[T2:.*]] = llvm.shl %[[T1]], %[[OFFSET_V2]] : !llvm<"<2 x i32>">
				// CHECK: %[[MASK:.*]] = llvm.xor %[[T2]], %[[MINUS_ONE]] : !llvm<"<2 x i32>">
				// CHECK: %[[NEW_BASE:.*]] = llvm.and %[[BASE]], %[[MASK]] : !llvm<"<2 x i32>">
				// CHECK: %[[SHIFTED_INSERT:.*]] = llvm.shl %[[INSERT]], %[[OFFSET_V2]] : !llvm<"<2 x i32>">
				// CHECK: %{{.*}} = llvm.or %[[NEW_BASE]], %[[SHIFTED_INSERT]] : !llvm<"<2 x i32>">
				%0 = spv.BitFieldInsert %base, %insert, %offset, %count : vector<2xi32>, i32, i32
				return
				}

				// CHECK-LABEL: func @bitfield_insert_vector_smaller_bit_width
				antiagainstUnsubmitted Done Reply Inline Actions We don't really need this test and the following one. The purpose of tests is certainly not to enumerate all possible combinations, and there are many, many cases. :) We just need to make sure different "dimensions" are covered here: integer vs. vector, and bitwidth difference. Bitwidth difference is already covered in the scalar cases, so it's fine to omit it for the vector cases. Less code means less maintenance burden. What do you think? antiagainst: We don't really need this test and the following one. The purpose of tests is certainly not…
				// CHECK-SAME: %[[BASE:.]]: !llvm<"<2 x i32>">, %[[INSERT:.]]: !llvm<"<2 x i32>">, %[[OFFSET:.]]: !llvm.i8, %[[COUNT:.]]: !llvm.i8
				func @bitfield_insert_vector_smaller_bit_width(%base: vector<2xi32>, %insert: vector<2xi32>, %offset: i8, %count: i8) {
				// CHECK: %[[OFFSET_V0:.*]] = llvm.mlir.undef : !llvm<"<2 x i8>">
				// CHECK: %[[ZERO:.*]] = llvm.mlir.constant(0 : i32) : !llvm.i32
				// CHECK: %[[OFFSET_V1:.*]] = llvm.insertelement %[[OFFSET]], %[[OFFSET_V0]][%[[ZERO]] : !llvm.i32] : !llvm<"<2 x i8>">
				// CHECK: %[[ONE:.*]] = llvm.mlir.constant(1 : i32) : !llvm.i32
				// CHECK: %[[OFFSET_V2:.*]] = llvm.insertelement %[[OFFSET]], %[[OFFSET_V1]][%[[ONE]] : !llvm.i32] : !llvm<"<2 x i8>">
				// CHECK: %[[COUNT_V0:.*]] = llvm.mlir.undef : !llvm<"<2 x i8>">
				// CHECK: %[[ZERO:.*]] = llvm.mlir.constant(0 : i32) : !llvm.i32
				// CHECK: %[[COUNT_V1:.*]] = llvm.insertelement %[[COUNT]], %[[COUNT_V0]][%[[ZERO]] : !llvm.i32] : !llvm<"<2 x i8>">
				// CHECK: %[[ONE:.*]] = llvm.mlir.constant(1 : i32) : !llvm.i32
				// CHECK: %[[COUNT_V2:.*]] = llvm.insertelement %[[COUNT]], %[[COUNT_V1]][%[[ONE]] : !llvm.i32] : !llvm<"<2 x i8>">
				// CHECK: %[[MINUS_ONE:.*]] = llvm.mlir.constant(dense<-1> : vector<2xi32>) : !llvm<"<2 x i32>">
				// CHECK: %[[EXT_COUNT:.*]] = llvm.zext %[[COUNT_V2]] : !llvm<"<2 x i8>"> to !llvm<"<2 x i32>">
				// CHECK: %[[EXT_OFFSET:.*]] = llvm.zext %[[OFFSET_V2]] : !llvm<"<2 x i8>"> to !llvm<"<2 x i32>">
				// CHECK: %[[T0:.*]] = llvm.shl %[[MINUS_ONE]], %[[EXT_COUNT]] : !llvm<"<2 x i32>">
				// CHECK: %[[T1:.*]] = llvm.xor %[[T0]], %[[MINUS_ONE]] : !llvm<"<2 x i32>">
				// CHECK: %[[T2:.*]] = llvm.shl %[[T1]], %[[EXT_OFFSET]] : !llvm<"<2 x i32>">
				// CHECK: %[[MASK:.*]] = llvm.xor %[[T2]], %[[MINUS_ONE]] : !llvm<"<2 x i32>">
				// CHECK: %[[NEW_BASE:.*]] = llvm.and %[[BASE]], %[[MASK]] : !llvm<"<2 x i32>">
				// CHECK: %[[SHIFTED_INSERT:.*]] = llvm.shl %[[INSERT]], %[[EXT_OFFSET]] : !llvm<"<2 x i32>">
				// CHECK: %{{.*}} = llvm.or %[[NEW_BASE]], %[[SHIFTED_INSERT]] : !llvm<"<2 x i32>">
				%0 = spv.BitFieldInsert %base, %insert, %offset, %count : vector<2xi32>, i8, i8
				return
				}

				// CHECK-LABEL: func @bitfield_insert_vector_greater_bit_width
				// CHECK-SAME: %[[BASE:.]]: !llvm<"<2 x i32>">, %[[INSERT:.]]: !llvm<"<2 x i32>">, %[[OFFSET:.]]: !llvm.i64, %[[COUNT:.]]: !llvm.i64
				func @bitfield_insert_vector_greater_bit_width(%base: vector<2xi32>, %insert: vector<2xi32>, %offset: i64, %count: i64) {
				// CHECK: %[[OFFSET_V0:.*]] = llvm.mlir.undef : !llvm<"<2 x i64>">
				// CHECK: %[[ZERO:.*]] = llvm.mlir.constant(0 : i32) : !llvm.i32
				// CHECK: %[[OFFSET_V1:.*]] = llvm.insertelement %[[OFFSET]], %[[OFFSET_V0]][%[[ZERO]] : !llvm.i32] : !llvm<"<2 x i64>">
				// CHECK: %[[ONE:.*]] = llvm.mlir.constant(1 : i32) : !llvm.i32
				// CHECK: %[[OFFSET_V2:.*]] = llvm.insertelement %[[OFFSET]], %[[OFFSET_V1]][%[[ONE]] : !llvm.i32] : !llvm<"<2 x i64>">
				// CHECK: %[[COUNT_V0:.*]] = llvm.mlir.undef : !llvm<"<2 x i64>">
				// CHECK: %[[ZERO:.*]] = llvm.mlir.constant(0 : i32) : !llvm.i32
				// CHECK: %[[COUNT_V1:.*]] = llvm.insertelement %[[COUNT]], %[[COUNT_V0]][%[[ZERO]] : !llvm.i32] : !llvm<"<2 x i64>">
				// CHECK: %[[ONE:.*]] = llvm.mlir.constant(1 : i32) : !llvm.i32
				// CHECK: %[[COUNT_V2:.*]] = llvm.insertelement %[[COUNT]], %[[COUNT_V1]][%[[ONE]] : !llvm.i32] : !llvm<"<2 x i64>">
				// CHECK: %[[MINUS_ONE:.*]] = llvm.mlir.constant(dense<-1> : vector<2xi32>) : !llvm<"<2 x i32>">
				// CHECK: %[[TRUNC_COUNT:.*]] = llvm.trunc %[[COUNT_V2]] : !llvm<"<2 x i64>"> to !llvm<"<2 x i32>">
				// CHECK: %[[TRUNC_OFFSET:.*]] = llvm.trunc %[[OFFSET_V2]] : !llvm<"<2 x i64>"> to !llvm<"<2 x i32>">
				// CHECK: %[[T0:.*]] = llvm.shl %[[MINUS_ONE]], %[[TRUNC_COUNT]] : !llvm<"<2 x i32>">
				// CHECK: %[[T1:.*]] = llvm.xor %[[T0]], %[[MINUS_ONE]] : !llvm<"<2 x i32>">
				// CHECK: %[[T2:.*]] = llvm.shl %[[T1]], %[[TRUNC_OFFSET]] : !llvm<"<2 x i32>">
				// CHECK: %[[MASK:.*]] = llvm.xor %[[T2]], %[[MINUS_ONE]] : !llvm<"<2 x i32>">
				// CHECK: %[[NEW_BASE:.*]] = llvm.and %[[BASE]], %[[MASK]] : !llvm<"<2 x i32>">
				// CHECK: %[[SHIFTED_INSERT:.*]] = llvm.shl %[[INSERT]], %[[TRUNC_OFFSET]] : !llvm<"<2 x i32>">
				// CHECK: %{{.*}} = llvm.or %[[NEW_BASE]], %[[SHIFTED_INSERT]] : !llvm<"<2 x i32>">
				%0 = spv.BitFieldInsert %base, %insert, %offset, %count : vector<2xi32>, i64, i64
				return
				}

				//===----------------------------------------------------------------------===//
	// spv.BitwiseAnd			// spv.BitwiseAnd
	//===----------------------------------------------------------------------===//			//===----------------------------------------------------------------------===//

	func @bitwise_and_scalar(%arg0: i32, %arg1: i32) {			func @bitwise_and_scalar(%arg0: i32, %arg1: i32) {
	// CHECK: %{{.}} = llvm.and %{{.}}, %{{.*}} : !llvm.i32			// CHECK: %{{.}} = llvm.and %{{.}}, %{{.*}} : !llvm.i32
	%0 = spv.BitwiseAnd %arg0, %arg1 : i32			%0 = spv.BitwiseAnd %arg0, %arg1 : i32
	return			return
	}			}
	▲ Show 20 Lines • Show All 56 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[MLIR][SPIRVToLLVM] Implementation of spv.BitFieldInsert pattern
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 273974

mlir/lib/Conversion/SPIRVToLLVM/ConvertSPIRVToLLVM.cpp

mlir/test/Conversion/SPIRVToLLVM/bitwise-ops-to-llvm.mlir

This is an archive of the discontinued LLVM Phabricator instance.

[MLIR][SPIRVToLLVM] Implementation of spv.BitFieldInsert pattern ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 273974

mlir/lib/Conversion/SPIRVToLLVM/ConvertSPIRVToLLVM.cpp

mlir/test/Conversion/SPIRVToLLVM/bitwise-ops-to-llvm.mlir

[MLIR][SPIRVToLLVM] Implementation of spv.BitFieldInsert pattern
ClosedPublic