diff --git a/mlir/test/Integration/Dialect/SparseTensor/CPU/sparse_spmm.mlir b/mlir/test/Integration/Dialect/SparseTensor/CPU/sparse_spmm.mlir new file mode 100644 --- /dev/null +++ b/mlir/test/Integration/Dialect/SparseTensor/CPU/sparse_spmm.mlir @@ -0,0 +1,108 @@ +// RUN: mlir-opt %s \ +// RUN: --sparsification --sparse-tensor-conversion \ +// RUN: --convert-linalg-to-loops --convert-vector-to-scf --convert-scf-to-std \ +// RUN: --func-bufferize --tensor-constant-bufferize --tensor-bufferize \ +// RUN: --std-bufferize --finalizing-bufferize \ +// RUN: --convert-vector-to-llvm --convert-std-to-llvm | \ +// RUN: TENSOR0="%mlir_integration_test_dir/data/wide.mtx" \ +// RUN: mlir-cpu-runner \ +// RUN: -e entry -entry-point-result=void \ +// RUN: -shared-libs=%mlir_integration_test_dir/libmlir_c_runner_utils%shlibext | \ +// RUN: FileCheck %s + +!Filename = type !llvm.ptr + +#SparseMatrix = #sparse_tensor.encoding<{ + dimLevelType = [ "dense", "compressed" ], + pointerBitWidth = 8, + indexBitWidth = 8 +}> + +#spmm = { + indexing_maps = [ + affine_map<(i,j,k) -> (i,j)>, // A + affine_map<(i,j,k) -> (j,k)>, // B + affine_map<(i,j,k) -> (i,k)> // X (out) + ], + iterator_types = ["parallel", "reduction", "parallel"], + doc = "X(i,k) += A(i,j) * B(j,k)" +} + +// +// Integration test that lowers a kernel annotated as sparse to +// actual sparse code, initializes a matching sparse storage scheme +// from file, and runs the resulting code with the JIT compiler. +// +module { + // + // A kernel that multiplies a sparse matrix A with a dense matrix B + // into a dense matrix X. + // + func @kernel_spmm(%arga: tensor, + %argb: tensor, + %argx: tensor) -> tensor { + %0 = linalg.generic #spmm + ins(%arga, %argb: tensor, tensor) + outs(%argx: tensor) { + ^bb(%a: i32, %b: i32, %x: i32): + %0 = muli %a, %b : i32 + %1 = addi %x, %0 : i32 + linalg.yield %1 : i32 + } -> tensor + return %0 : tensor + } + + func private @getTensorFilename(index) -> (!Filename) + + // + // Main driver that reads matrix from file and calls the sparse kernel. + // + func @entry() { + %i0 = constant 0 : i32 + %c0 = constant 0 : index + %c1 = constant 1 : index + %c4 = constant 4 : index + %c256 = constant 256 : index + + // Read the sparse matrix from file, construct sparse storage. + %fileName = call @getTensorFilename(%c0) : (index) -> (!Filename) + %a = sparse_tensor.new %fileName : !llvm.ptr to tensor + + // Initialize dense vectors. + %bdata = memref.alloc(%c256, %c4) : memref + %xdata = memref.alloc(%c4, %c4) : memref + scf.for %i = %c0 to %c256 step %c1 { + scf.for %j = %c0 to %c4 step %c1 { + %k0 = muli %i, %c4 : index + %k1 = addi %j, %k0 : index + %k = index_cast %k1 : index to i32 + memref.store %k, %bdata[%i, %j] : memref + } + } + scf.for %i = %c0 to %c4 step %c1 { + scf.for %j = %c0 to %c4 step %c1 { + memref.store %i0, %xdata[%i, %j] : memref + } + } + %b = memref.tensor_load %bdata : memref + %x = memref.tensor_load %xdata : memref + + // Call kernel. + %0 = call @kernel_spmm(%a, %b, %x) + : (tensor, tensor, tensor) -> tensor + + // Print the result for verification. + // + // CHECK: ( ( 3548, 3550, 3552, 3554 ), ( 6052, 6053, 6054, 6055 ), ( -56, -63, -70, -77 ), ( -13704, -13709, -13714, -13719 ) ) + // + %m = memref.buffer_cast %0 : memref + %v = vector.transfer_read %m[%c0, %c0], %i0: memref, vector<4x4xi32> + vector.print %v : vector<4x4xi32> + + // Release the resources. + memref.dealloc %bdata : memref + memref.dealloc %xdata : memref + + return + } +}