diff --git a/mlir/lib/Dialect/Vector/VectorOps.cpp b/mlir/lib/Dialect/Vector/VectorOps.cpp --- a/mlir/lib/Dialect/Vector/VectorOps.cpp +++ b/mlir/lib/Dialect/Vector/VectorOps.cpp @@ -1630,6 +1630,12 @@ int64_t dimB = 1; while (dimB < dimA && j < rankB) dimB *= b[j++]; + + // Handle the case when trailing dimensions are of size 1. + // Include them into the contiguous sequence. + while (dimB == dimA && j < rankB && b[j] == 1) + ++j; + if (dimA != dimB) break; ++i; diff --git a/mlir/test/Dialect/Vector/ops.mlir b/mlir/test/Dialect/Vector/ops.mlir --- a/mlir/test/Dialect/Vector/ops.mlir +++ b/mlir/test/Dialect/Vector/ops.mlir @@ -266,8 +266,10 @@ // CHECK-LABEL: @shape_cast func @shape_cast(%arg0 : vector<5x1x3x2xf32>, - %arg1 : tuple<vector<5x4x2xf32>, vector<3x4x2xf32>>) - -> (vector<15x2xf32>, tuple<vector<20x2xf32>, vector<12x2xf32>>) { + %arg1 : tuple<vector<5x4x2xf32>, vector<3x4x2xf32>>, + %arg2 : vector<8x1xf32>, + %arg3 : vector<16x1x1xf32>) + -> (vector<15x2xf32>, tuple<vector<20x2xf32>, vector<12x2xf32>>, vector<8xf32>, vector<16xf32>) { // CHECK: vector.shape_cast %{{.*}} : vector<5x1x3x2xf32> to vector<15x2xf32> %0 = vector.shape_cast %arg0 : vector<5x1x3x2xf32> to vector<15x2xf32> @@ -276,7 +278,13 @@ %1 = vector.shape_cast %arg1 : tuple<vector<5x4x2xf32>, vector<3x4x2xf32>> to tuple<vector<20x2xf32>, vector<12x2xf32>> - return %0, %1 : vector<15x2xf32>, tuple<vector<20x2xf32>, vector<12x2xf32>> + // CHECK-NEXT: vector.shape_cast %{{.*}} : vector<8x1xf32> to vector<8xf32> + %2 = vector.shape_cast %arg2 : vector<8x1xf32> to vector<8xf32> + + // CHECK-NEXT: vector.shape_cast %{{.*}} : vector<16x1x1xf32> to vector<16xf32> + %3 = vector.shape_cast %arg3 : vector<16x1x1xf32> to vector<16xf32> + + return %0, %1, %2, %3 : vector<15x2xf32>, tuple<vector<20x2xf32>, vector<12x2xf32>>, vector<8xf32>, vector<16xf32> } // CHECK-LABEL: @vector_fma