Skip to content

Commit 14c1450

Browse files
[mlir][Vector] Add vector to outerproduct lowering for the [reduction, parallel] case.
Differential Revision: https://reviews.llvm.org/D105373
1 parent 8b81524 commit 14c1450

File tree

2 files changed

+67
-8
lines changed

2 files changed

+67
-8
lines changed

mlir/lib/Dialect/Vector/VectorTransforms.cpp

Lines changed: 32 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -1324,15 +1324,14 @@ LogicalResult ContractionOpToOuterProductOpLowering::matchAndRewrite(
13241324
VectorType lhsType = op.getLhsType();
13251325
Value lhs = op.lhs(), rhs = op.rhs(), res = op.acc();
13261326

1327-
// Set up the parallel/reduction structure in right form.
1328-
AffineExpr m, n, k;
1329-
bindDims(rewriter.getContext(), m, n, k);
1330-
13311327
//
13321328
// Two outer parallel, one inner reduction (matmat flavor).
13331329
//
13341330
UnrolledOuterProductEmitter e(rewriter, op);
13351331
if (e.iters({Par(), Par(), Red()})) {
1332+
// Set up the parallel/reduction structure in the right form.
1333+
AffineExpr m, n, k;
1334+
bindDims(rewriter.getContext(), m, n, k);
13361335
// Classical row-major matmul: Just permute the lhs.
13371336
if (e.layout({{m, k}, {k, n}, {m, n}}))
13381337
return e.outer_prod(e.t(lhs), rhs, res, lhsType.getDimSize(1));
@@ -1367,17 +1366,42 @@ LogicalResult ContractionOpToOuterProductOpLowering::matchAndRewrite(
13671366
// One outer parallel, one inner reduction (matvec flavor)
13681367
//
13691368
if (e.iters({Par(), Red()})) {
1369+
AffineExpr m, k;
1370+
bindDims(rewriter.getContext(), m, k);
1371+
1372+
// Case mat-vec: transpose.
1373+
if (e.layout({{m, k}, {k}, {m}}))
1374+
return e.outer_prod(e.t(lhs), rhs, res, lhsType.getDimSize(1));
1375+
// Case mat-trans-vec: ready to go.
1376+
if (e.layout({{k, m}, {k}, {m}}))
1377+
return e.outer_prod(lhs, rhs, res, lhsType.getDimSize(0));
1378+
// Case vec-mat: swap and transpose.
1379+
if (e.layout({{k}, {m, k}, {m}}))
1380+
return e.outer_prod(e.t(rhs), lhs, res, lhsType.getDimSize(0));
1381+
// Case vec-mat-trans: swap and ready to go.
1382+
if (e.layout({{k}, {k, m}, {m}}))
1383+
return e.outer_prod(rhs, lhs, res, lhsType.getDimSize(0));
1384+
return failure();
1385+
}
1386+
1387+
//
1388+
// One outer reduction, one inner parallel (tmatvec flavor)
1389+
//
1390+
if (e.iters({Red(), Par()})) {
1391+
AffineExpr k, m;
1392+
bindDims(rewriter.getContext(), k, m);
1393+
13701394
// Case mat-vec: transpose.
1371-
if (e.layout({{m, n}, {n}, {m}}))
1395+
if (e.layout({{m, k}, {k}, {m}}))
13721396
return e.outer_prod(e.t(lhs), rhs, res, lhsType.getDimSize(1));
13731397
// Case mat-trans-vec: ready to go.
1374-
if (e.layout({{n, m}, {n}, {m}}))
1398+
if (e.layout({{k, m}, {k}, {m}}))
13751399
return e.outer_prod(lhs, rhs, res, lhsType.getDimSize(0));
13761400
// Case vec-mat: swap and transpose.
1377-
if (e.layout({{n}, {m, n}, {m}}))
1401+
if (e.layout({{k}, {m, k}, {m}}))
13781402
return e.outer_prod(e.t(rhs), lhs, res, lhsType.getDimSize(0));
13791403
// Case vec-mat-trans: swap and ready to go.
1380-
if (e.layout({{n}, {n, m}, {m}}))
1404+
if (e.layout({{k}, {k, m}, {m}}))
13811405
return e.outer_prod(rhs, lhs, res, lhsType.getDimSize(0));
13821406
return failure();
13831407
}

mlir/test/Dialect/Vector/vector-contract-matvec-transforms.mlir

Lines changed: 35 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -45,6 +45,16 @@
4545
iterator_types = ["parallel", "reduction"]
4646
}
4747

48+
#redpar_vecmattrans_accesses = [
49+
affine_map<(i, j) -> (i)>,
50+
affine_map<(i, j) -> (i, j)>,
51+
affine_map<(i, j) -> (j)>
52+
]
53+
#redpar_vecmattrans_trait = {
54+
indexing_maps = #redpar_vecmattrans_accesses,
55+
iterator_types = ["reduction", "parallel"]
56+
}
57+
4858
// CHECK-LABEL: func @matvec2x2
4959
// CHECK-SAME: %[[A:.*0]]: memref<vector<2x2xf32>>
5060
// CHECK-SAME: %[[B:.*1]]: memref<vector<2xf32>>
@@ -172,3 +182,28 @@ func @vecmattrans2x2(%arg0: memref<vector<2x2xf32>>, %arg1: memref<vector<2xf32>
172182
memref.store %0, %arg2[] : memref<vector<2xf32>>
173183
return
174184
}
185+
186+
// CHECK-LABEL: func @redpar_vecmattrans2x2
187+
// CHECK-SAME: %[[A:.*0]]: memref<vector<2x2xf32>>
188+
// CHECK-SAME: %[[B:.*1]]: memref<vector<2xf32>>
189+
// CHECK-SAME: %[[C:.*2]]: memref<vector<2xf32>>
190+
// CHECK: %[[T0:.*]] = memref.load %[[A]][] : memref<vector<2x2xf32>>
191+
// CHECK: %[[T1:.*]] = memref.load %[[B]][] : memref<vector<2xf32>>
192+
// CHECK: %[[T2:.*]] = memref.load %[[C]][] : memref<vector<2xf32>>
193+
// CHECK: %[[T3:.*]] = vector.extract %[[T0]][0] : vector<2x2xf32>
194+
// CHECK: %[[T4:.*]] = vector.extract %[[T1]][0] : vector<2xf32>
195+
// CHECK: %[[T5:.*]] = vector.outerproduct %[[T3]], %[[T4]], %[[T2]] {kind = #vector.kind<add>} : vector<2xf32>, f32
196+
// CHECK: %[[T6:.*]] = vector.extract %[[T0]][1] : vector<2x2xf32>
197+
// CHECK: %[[T7:.*]] = vector.extract %[[T1]][1] : vector<2xf32>
198+
// CHECK: %[[T8:.*]] = vector.outerproduct %[[T6]], %[[T7]], %[[T5]] {kind = #vector.kind<add>} : vector<2xf32>, f32
199+
// CHECK: memref.store %[[T8]], %[[C]][] : memref<vector<2xf32>>
200+
// CHECK: return
201+
func @redpar_vecmattrans2x2(%arg0: memref<vector<2x2xf32>>, %arg1: memref<vector<2xf32>>,
202+
%arg2: memref<vector<2xf32>>) {
203+
%A = memref.load %arg0[] : memref<vector<2x2xf32>>
204+
%x = memref.load %arg1[] : memref<vector<2xf32>>
205+
%b = memref.load %arg2[] : memref<vector<2xf32>>
206+
%0 = vector.contract #redpar_vecmattrans_trait %x, %A, %b : vector<2xf32>, vector<2x2xf32> into vector<2xf32>
207+
memref.store %0, %arg2[] : memref<vector<2xf32>>
208+
return
209+
}

0 commit comments

Comments
 (0)