Skip to content

Commit 66347e5

Browse files
authored
[mlir][vector] Drop inner unit dims for transfer ops on dynamic shapes. (#79752)
1 parent 4a39d08 commit 66347e5

File tree

2 files changed

+57
-12
lines changed

2 files changed

+57
-12
lines changed

mlir/lib/Dialect/Vector/Transforms/VectorTransforms.cpp

Lines changed: 17 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -1236,7 +1236,7 @@ class DropInnerMostUnitDimsTransferRead
12361236
return failure();
12371237

12381238
auto srcType = dyn_cast<MemRefType>(readOp.getSource().getType());
1239-
if (!srcType || !srcType.hasStaticShape())
1239+
if (!srcType)
12401240
return failure();
12411241

12421242
if (!readOp.getPermutationMap().isMinorIdentity())
@@ -1260,19 +1260,21 @@ class DropInnerMostUnitDimsTransferRead
12601260
targetType.getElementType());
12611261

12621262
auto loc = readOp.getLoc();
1263+
SmallVector<OpFoldResult> sizes =
1264+
memref::getMixedSizes(rewriter, loc, readOp.getSource());
1265+
SmallVector<OpFoldResult> offsets(srcType.getRank(),
1266+
rewriter.getIndexAttr(0));
1267+
SmallVector<OpFoldResult> strides(srcType.getRank(),
1268+
rewriter.getIndexAttr(1));
12631269
MemRefType resultMemrefType =
12641270
getMemRefTypeWithDroppingInnerDims(rewriter, srcType, dimsToDrop);
1265-
SmallVector<int64_t> offsets(srcType.getRank(), 0);
1266-
SmallVector<int64_t> strides(srcType.getRank(), 1);
1267-
12681271
ArrayAttr inBoundsAttr =
12691272
readOp.getInBounds()
12701273
? rewriter.getArrayAttr(
12711274
readOp.getInBoundsAttr().getValue().drop_back(dimsToDrop))
12721275
: ArrayAttr();
12731276
Value rankedReducedView = rewriter.create<memref::SubViewOp>(
1274-
loc, resultMemrefType, readOp.getSource(), offsets, srcType.getShape(),
1275-
strides);
1277+
loc, resultMemrefType, readOp.getSource(), offsets, sizes, strides);
12761278
auto permMap = getTransferMinorIdentityMap(
12771279
cast<ShapedType>(rankedReducedView.getType()), resultTargetVecType);
12781280
Value result = rewriter.create<vector::TransferReadOp>(
@@ -1318,7 +1320,7 @@ class DropInnerMostUnitDimsTransferWrite
13181320
return failure();
13191321

13201322
auto srcType = dyn_cast<MemRefType>(writeOp.getSource().getType());
1321-
if (!srcType || !srcType.hasStaticShape())
1323+
if (!srcType)
13221324
return failure();
13231325

13241326
if (!writeOp.getPermutationMap().isMinorIdentity())
@@ -1341,20 +1343,23 @@ class DropInnerMostUnitDimsTransferWrite
13411343
VectorType::get(targetType.getShape().drop_back(dimsToDrop),
13421344
targetType.getElementType());
13431345

1346+
Location loc = writeOp.getLoc();
1347+
SmallVector<OpFoldResult> sizes =
1348+
memref::getMixedSizes(rewriter, loc, writeOp.getSource());
1349+
SmallVector<OpFoldResult> offsets(srcType.getRank(),
1350+
rewriter.getIndexAttr(0));
1351+
SmallVector<OpFoldResult> strides(srcType.getRank(),
1352+
rewriter.getIndexAttr(1));
13441353
MemRefType resultMemrefType =
13451354
getMemRefTypeWithDroppingInnerDims(rewriter, srcType, dimsToDrop);
1346-
SmallVector<int64_t> offsets(srcType.getRank(), 0);
1347-
SmallVector<int64_t> strides(srcType.getRank(), 1);
13481355
ArrayAttr inBoundsAttr =
13491356
writeOp.getInBounds()
13501357
? rewriter.getArrayAttr(
13511358
writeOp.getInBoundsAttr().getValue().drop_back(dimsToDrop))
13521359
: ArrayAttr();
13531360

1354-
Location loc = writeOp.getLoc();
13551361
Value rankedReducedView = rewriter.create<memref::SubViewOp>(
1356-
loc, resultMemrefType, writeOp.getSource(), offsets, srcType.getShape(),
1357-
strides);
1362+
loc, resultMemrefType, writeOp.getSource(), offsets, sizes, strides);
13581363
auto permMap = getTransferMinorIdentityMap(
13591364
cast<ShapedType>(rankedReducedView.getType()), resultTargetVecType);
13601365

mlir/test/Dialect/Vector/vector-transfer-collapse-inner-most-dims.mlir

Lines changed: 40 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -16,6 +16,25 @@ func.func @contiguous_inner_most_view(%in: memref<1x1x8x1xf32, strided<[3072, 8,
1616

1717
// -----
1818

19+
func.func @contiguous_outer_dyn_inner_most_view(%in: memref<?x1x8x1xf32, strided<[3072, 8, 1, 1], offset: ?>>) -> vector<1x8x1xf32>{
20+
%c0 = arith.constant 0 : index
21+
%cst = arith.constant 0.0 : f32
22+
%0 = vector.transfer_read %in[%c0, %c0, %c0, %c0], %cst {in_bounds = [true, true, true]} : memref<?x1x8x1xf32, strided<[3072, 8, 1, 1], offset: ?>>, vector<1x8x1xf32>
23+
return %0 : vector<1x8x1xf32>
24+
}
25+
// CHECK: func @contiguous_outer_dyn_inner_most_view(
26+
// CHECK-SAME: %[[SRC:[a-zA-Z0-9]+]]
27+
// CHECK-DAG: %[[C0:.+]] = arith.constant 0 : index
28+
// CHECK-DAG: %[[D0:.+]] = memref.dim %[[SRC]], %[[C0]]
29+
// CHECK: %[[SRC_0:.+]] = memref.subview %[[SRC]][0, 0, 0, 0] [%[[D0]], 1, 8, 1] [1, 1, 1, 1]
30+
// CHECK-SAME: memref<?x1x8x1xf32, strided<[3072, 8, 1, 1], offset: ?>> to memref<?x1x8xf32, strided<[3072, 8, 1], offset: ?>>
31+
// CHECK: %[[VEC:.+]] = vector.transfer_read %[[SRC_0]]
32+
// CHECK-SAME: memref<?x1x8xf32, strided<[3072, 8, 1], offset: ?>>, vector<1x8xf32>
33+
// CHECK: %[[RESULT:.+]] = vector.shape_cast %[[VEC]]
34+
// CHECK: return %[[RESULT]]
35+
36+
// -----
37+
1938
func.func @contiguous_inner_most_dim(%A: memref<16x1xf32>, %i:index, %j:index) -> (vector<8x1xf32>) {
2039
%c0 = arith.constant 0 : index
2140
%f0 = arith.constant 0.0 : f32
@@ -119,6 +138,27 @@ func.func @drop_inner_most_dim_for_transfer_write(%arg0: memref<1x512x16x1xf32,
119138

120139
// -----
121140

141+
func.func @outer_dyn_drop_inner_most_dim_for_transfer_write(%arg0: memref<?x512x16x1xf32, strided<[8192, 16, 1, 1], offset: ?>>, %arg1: vector<1x16x16x1xf32>, %arg2: index) {
142+
%c0 = arith.constant 0 : index
143+
vector.transfer_write %arg1, %arg0[%arg2, %c0, %c0, %c0]
144+
{in_bounds = [true, true, true, true]}
145+
: vector<1x16x16x1xf32>, memref<?x512x16x1xf32, strided<[8192, 16, 1, 1], offset: ?>>
146+
return
147+
}
148+
// CHECK: func.func @outer_dyn_drop_inner_most_dim_for_transfer_write
149+
// CHECK-SAME: %[[DEST:[a-zA-Z0-9]+]]
150+
// CHECK-SAME: %[[VEC:[a-zA-Z0-9]+]]
151+
// CHECK-SAME: %[[IDX:[a-zA-Z0-9]+]]
152+
// CHECK-DAG: %[[C0:.+]] = arith.constant 0 : index
153+
// CHECK-DAG: %[[D0:.+]] = memref.dim %[[DEST]], %[[C0]]
154+
// CHECK: %[[SUBVIEW:.+]] = memref.subview %[[DEST]][0, 0, 0, 0] [%[[D0]], 512, 16, 1]
155+
// CHECK-SAME: memref<?x512x16x1xf32, strided<[8192, 16, 1, 1], offset: ?>> to memref<?x512x16xf32, strided<[8192, 16, 1], offset: ?>>
156+
// CHECK: %[[CAST:.+]] = vector.shape_cast %[[VEC]] : vector<1x16x16x1xf32> to vector<1x16x16xf32>
157+
// CHECK: vector.transfer_write %[[CAST]], %[[SUBVIEW]]
158+
// CHECK-SAME: [%[[IDX]], %[[C0]], %[[C0]]]
159+
160+
// -----
161+
122162
func.func @non_unit_strides(%arg0: memref<512x16x1xf32, strided<[8192, 16, 4], offset: ?>>, %arg1: vector<16x16x1xf32>, %arg2: index) {
123163
%c0 = arith.constant 0 : index
124164
vector.transfer_write %arg1, %arg0[%arg2, %c0, %c0]

0 commit comments

Comments
 (0)