This is an archive of the discontinued LLVM Phabricator instance.

[mlir][sparse] first version of "truly" dynamic sparse tensors as outputs of kernels
ClosedPublic

Authored by aartbik on Nov 11 2021, 12:00 PM.

Details

Summary

This revision contains all the "sparsification" ops and rewriting rules necessary to support sparse output tensors when the kernel has no reduction (viz. insertions occur in lexicographic order and are "injective"). This will later be generalized to allow reductions too. Also, this first revision only supports sparse 1-d tensors (viz. vectors) as outputs in the runtime support library; this will be generalized to n-d tensors shortly. But this way, the revision is kept to a manageable size.
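The "lexicographic and injective" invariant described above can be illustrated with a small sketch. This is not the actual SparseTensorUtils.cpp API; the class and method names below (`SparseVector`, `lex_insert`) are hypothetical, and the point is only that each insertion must arrive at a strictly greater coordinate than the last, so the storage can be built by pure appends with no sorting or merging:

```python
# Hypothetical sketch of lexicographic, injective insertion into a
# sparse 1-d output tensor (names are illustrative, not the real API).

class SparseVector:
    def __init__(self, size):
        self.size = size
        self.indices = []   # coordinates of stored entries
        self.values = []    # corresponding nonzero values

    def lex_insert(self, index, value):
        # Each new coordinate must be strictly greater than the previous
        # one, which is what "lexicographic order" means in 1-d.
        assert 0 <= index < self.size
        assert not self.indices or index > self.indices[-1], \
            "insertions must arrive in strictly increasing order"
        self.indices.append(index)
        self.values.append(value)

v = SparseVector(10)
for i, x in [(1, 2.0), (4, 3.0), (7, 5.0)]:
    v.lex_insert(i, x)
print(v.indices)  # [1, 4, 7]
```

Under this invariant the kernel never revisits an earlier coordinate, which is why reductions (which would update a previously inserted value) are deferred to a later generalization.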

Diff Detail

Event Timeline

aartbik created this revision.Nov 11 2021, 12:00 PM
aartbik requested review of this revision.Nov 11 2021, 12:00 PM
aartbik updated this revision to Diff 386653.Nov 11 2021, 1:41 PM

rebased against main branch

aartbik updated this revision to Diff 386670.Nov 11 2021, 2:32 PM

fixed few inconsistencies in comments

aartbik updated this revision to Diff 386675.Nov 11 2021, 3:32 PM

windows build

I still need to take a closer look at the logic in Sparsification.cpp and at sparse_vector_ops.mlir, but other than that things look good modulo my comments.

mlir/include/mlir/Dialect/SparseTensor/IR/SparseTensorOps.td
246–261

If this op is just for codegen / progressive-bufferization, then shouldn't we know this operand statically whenever we generate the load op? That's certainly the case for Sparsification.cpp:1464 (and conversion.mlir:427, roundtrip.mlir:121, etc). So, are there actually any cases where we need this to be dataflow-dependent, and if not then why not make it an attribute rather than an operand?

258

This description is a bit uninformative, since the reader won't necessarily know which conversions count as "non-trivial" for the purpose of being released. So we should explicate which conversions this includes, either here or at the convert op description (with a comment here that says to look there).

mlir/lib/Dialect/SparseTensor/Transforms/SparseTensorConversion.cpp
876

You're missing an "I"

mlir/lib/Dialect/SparseTensor/Transforms/Sparsification.cpp
292

Add a short description of this out-parameter to the doxygen

543

rename to memTp for consistency with the rest of the code

mlir/lib/ExecutionEngine/SparseTensorUtils.cpp
283

Why a pointer instead of a reference? If the pointer is for extern-C reasons, then we should assert non-null before dereferencing it.

mlir/test/Dialect/SparseTensor/conversion.mlir
417–419

Why the removal of #DenseVector, is that test no longer valid for LoadOp?

mlir/test/Dialect/SparseTensor/roundtrip.mlir
137

reindent/align

aartbik marked 7 inline comments as done.Nov 12 2021, 2:25 PM
aartbik added inline comments.
mlir/include/mlir/Dialect/SparseTensor/IR/SparseTensorOps.td
246–261

Note that it *is* an attribute, but indeed I parse it as an extra operand. So I guess you are proposing to parse the value in a more attribute-like manner ;-)

258

Good point. Added the "non-trivial" definition.

mlir/lib/Dialect/SparseTensor/Transforms/SparseTensorConversion.cpp
876

oh, good catch! we really need to add more "test generators" so we can just iterate over all data types more easily than writing tests by hand ;-)

mlir/lib/ExecutionEngine/SparseTensorUtils.cpp
283

Yeah, similar to all the other strided memrefs that are passed between code and lib.
I added the assert to IMPL_LEXINSERT, similar to the other macros' tests for non-null.
Good suggestion!

mlir/test/Dialect/SparseTensor/conversion.mlir
417–419

The reconstruct op (was .tensor, now .load to be more consistent with the tensor equivalent) used to depend on the sparsity structure (so I tested both a sparse and a dense one). I opted for side-effect impureness for the time being; otherwise we get a lot of SSA spaghetti dependencies in intermediate, very short-lived code that adds no value. We may refine as needed.

aartbik updated this revision to Diff 386981.Nov 12 2021, 4:19 PM
aartbik marked 4 inline comments as done.

Thanks Wren! Good feedback.

bixia accepted this revision.Nov 15 2021, 2:31 PM
bixia added inline comments.
mlir/lib/Dialect/SparseTensor/Transforms/SparseTensorConversion.cpp
871–876

We have two other places that use similar if-branches, genAddEltCall and genGetNextCall.
Can we avoid duplicating such logic by having a getFuncNameSuffix(eltType), e.g.:

lexInsert + getFuncNameSuffix(eltType)
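The suggested refactoring can be sketched as follows. This is a hypothetical illustration, not the actual conversion-pass code: the suffix table and the function names (`get_func_name_suffix`, `lex_insert_func_name`) are assumptions standing in for the C++ helpers, and the point is simply that one type-to-suffix lookup replaces the per-call-site if-branches:

```python
# Hypothetical sketch: one element-type -> suffix table shared by all the
# runtime-call generators, instead of duplicated if-branches per call site.

_SUFFIX = {
    "f64": "F64",
    "f32": "F32",
    "i64": "I64",
    "i32": "I32",
    "i16": "I16",
    "i8":  "I8",
}

def get_func_name_suffix(elt_type):
    # Centralized mapping; unsupported types fail loudly in one place.
    try:
        return _SUFFIX[elt_type]
    except KeyError:
        raise ValueError(f"unsupported element type: {elt_type}")

def lex_insert_func_name(elt_type):
    # genAddEltCall and genGetNextCall could build names the same way.
    return "lexInsert" + get_func_name_suffix(elt_type)

print(lex_insert_func_name("f32"))  # lexInsertF32
```

The design benefit is that adding a new element type then touches one table rather than every generator.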
This revision is now accepted and ready to land.Nov 15 2021, 2:31 PM
aartbik updated this revision to Diff 387415.Nov 15 2021, 3:02 PM
aartbik marked an inline comment as done.

swap template order

aartbik added inline comments.Nov 15 2021, 3:03 PM
mlir/lib/Dialect/SparseTensor/Transforms/SparseTensorConversion.cpp
871–876

I like that suggestion! Will do in a followup CL