Skip to content

Commit d51c46c

Browse files
Normalize reinterpret_cast op
Rewrites the memref defined by a reinterpret_cast op to have an identity layout map and updates all its indexing uses. Also extends the `replaceAllMemRefUsesWith` utility to work when there are multiple occurrences of `oldMemRef` in `op`'s operand list and `op` is non-dereferencing.
1 parent 4d1e4ef commit d51c46c

File tree

5 files changed

+199
-120
lines changed

5 files changed

+199
-120
lines changed

mlir/include/mlir/Dialect/Affine/Utils.h

Lines changed: 5 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -32,6 +32,7 @@ class FuncOp;
3232
namespace memref {
3333
class AllocOp;
3434
class AllocaOp;
35+
class ReinterpretCastOp;
3536
} // namespace memref
3637

3738
namespace affine {
@@ -243,15 +244,16 @@ LogicalResult replaceAllMemRefUsesWith(Value oldMemRef, Value newMemRef,
243244
ArrayRef<Value> symbolOperands = {},
244245
bool allowNonDereferencingOps = false);
245246

246-
/// Rewrites the memref defined by this alloc op to have an identity layout map
247-
/// and updates all its indexing uses. Returns failure if any of its uses
248-
/// escape (while leaving the IR in a valid state).
247+
/// Rewrites the memref defined by alloc or reinterpret_cast op to have an
248+
/// identity layout map and updates all its indexing uses. Returns failure if
249+
/// any of its uses escape (while leaving the IR in a valid state).
249250
template <typename AllocLikeOp>
250251
LogicalResult normalizeMemRef(AllocLikeOp op);
251252
extern template LogicalResult
252253
normalizeMemRef<memref::AllocaOp>(memref::AllocaOp op);
253254
extern template LogicalResult
254255
normalizeMemRef<memref::AllocOp>(memref::AllocOp op);
256+
LogicalResult normalizeMemRef(memref::ReinterpretCastOp op);
255257

256258
/// Normalizes `memrefType` so that the affine layout map of the memref is
257259
/// transformed to an identity map with a new shape being computed for the

mlir/lib/Dialect/Affine/Utils/Utils.cpp

Lines changed: 140 additions & 115 deletions
Original file line numberDiff line numberDiff line change
@@ -1098,90 +1098,12 @@ void mlir::affine::affineScalarReplace(func::FuncOp f, DominanceInfo &domInfo,
10981098
op->erase();
10991099
}
11001100

1101-
// Private helper function to transform memref.load with reduced rank.
1102-
// This function will modify the indices of the memref.load to match the
1103-
// newMemRef.
1104-
LogicalResult transformMemRefLoadWithReducedRank(
1105-
Operation *op, Value oldMemRef, Value newMemRef, unsigned memRefOperandPos,
1106-
ArrayRef<Value> extraIndices, ArrayRef<Value> extraOperands,
1107-
ArrayRef<Value> symbolOperands, AffineMap indexRemap) {
1108-
unsigned oldMemRefRank = cast<MemRefType>(oldMemRef.getType()).getRank();
1109-
unsigned newMemRefRank = cast<MemRefType>(newMemRef.getType()).getRank();
1110-
unsigned oldMapNumInputs = oldMemRefRank;
1111-
SmallVector<Value, 4> oldMapOperands(
1112-
op->operand_begin() + memRefOperandPos + 1,
1113-
op->operand_begin() + memRefOperandPos + 1 + oldMapNumInputs);
1114-
SmallVector<Value, 4> oldMemRefOperands;
1115-
oldMemRefOperands.assign(oldMapOperands.begin(), oldMapOperands.end());
1116-
SmallVector<Value, 4> remapOperands;
1117-
remapOperands.reserve(extraOperands.size() + oldMemRefRank +
1118-
symbolOperands.size());
1119-
remapOperands.append(extraOperands.begin(), extraOperands.end());
1120-
remapOperands.append(oldMemRefOperands.begin(), oldMemRefOperands.end());
1121-
remapOperands.append(symbolOperands.begin(), symbolOperands.end());
1122-
1123-
SmallVector<Value, 4> remapOutputs;
1124-
remapOutputs.reserve(oldMemRefRank);
1125-
SmallVector<Value, 4> affineApplyOps;
1126-
1127-
OpBuilder builder(op);
1128-
1129-
if (indexRemap &&
1130-
indexRemap != builder.getMultiDimIdentityMap(indexRemap.getNumDims())) {
1131-
// Remapped indices.
1132-
for (auto resultExpr : indexRemap.getResults()) {
1133-
auto singleResMap = AffineMap::get(
1134-
indexRemap.getNumDims(), indexRemap.getNumSymbols(), resultExpr);
1135-
auto afOp = builder.create<AffineApplyOp>(op->getLoc(), singleResMap,
1136-
remapOperands);
1137-
remapOutputs.push_back(afOp);
1138-
affineApplyOps.push_back(afOp);
1139-
}
1140-
} else {
1141-
// No remapping specified.
1142-
remapOutputs.assign(remapOperands.begin(), remapOperands.end());
1143-
}
1144-
1145-
SmallVector<Value, 4> newMapOperands;
1146-
newMapOperands.reserve(newMemRefRank);
1147-
1148-
// Prepend 'extraIndices' in 'newMapOperands'.
1149-
for (Value extraIndex : extraIndices) {
1150-
assert((isValidDim(extraIndex) || isValidSymbol(extraIndex)) &&
1151-
"invalid memory op index");
1152-
newMapOperands.push_back(extraIndex);
1153-
}
1154-
1155-
// Append 'remapOutputs' to 'newMapOperands'.
1156-
newMapOperands.append(remapOutputs.begin(), remapOutputs.end());
1157-
1158-
// Create new fully composed AffineMap for new op to be created.
1159-
assert(newMapOperands.size() == newMemRefRank);
1160-
1161-
OperationState state(op->getLoc(), op->getName());
1162-
// Construct the new operation using this memref.
1163-
state.operands.reserve(newMapOperands.size() + extraIndices.size());
1164-
state.operands.push_back(newMemRef);
1165-
1166-
// Insert the new memref map operands.
1167-
state.operands.append(newMapOperands.begin(), newMapOperands.end());
1168-
1169-
state.types.reserve(op->getNumResults());
1170-
for (auto result : op->getResults())
1171-
state.types.push_back(result.getType());
1172-
1173-
// Copy over the attributes from the old operation to the new operation.
1174-
for (auto namedAttr : op->getAttrs()) {
1175-
state.attributes.push_back(namedAttr);
1176-
}
1177-
1178-
// Create the new operation.
1179-
auto *repOp = builder.create(state);
1180-
op->replaceAllUsesWith(repOp);
1181-
op->erase();
1182-
1183-
return success();
1101+
// Checks if `op` is a dereferencing op.
1102+
// TODO: This hardcoded check will be removed once the right interface is added.
1103+
static bool isDereferencingOp(Operation *op) {
1104+
return isa<AffineMapAccessInterface, memref::LoadOp, memref::StoreOp>(op);
11841105
}
1106+
11851107
// Perform the replacement in `op`.
11861108
LogicalResult mlir::affine::replaceAllMemRefUsesWith(
11871109
Value oldMemRef, Value newMemRef, Operation *op,
@@ -1216,53 +1138,55 @@ LogicalResult mlir::affine::replaceAllMemRefUsesWith(
12161138
if (usePositions.empty())
12171139
return success();
12181140

1219-
if (usePositions.size() > 1) {
1220-
// TODO: extend it for this case when needed (rare).
1221-
assert(false && "multiple dereferencing uses in a single op not supported");
1222-
return failure();
1223-
}
1224-
12251141
unsigned memRefOperandPos = usePositions.front();
12261142

12271143
OpBuilder builder(op);
12281144
// The following checks if op is dereferencing memref and performs the access
12291145
// index rewrites.
12301146
auto affMapAccInterface = dyn_cast<AffineMapAccessInterface>(op);
1231-
if (!affMapAccInterface) {
1147+
if (!isDereferencingOp(op)) {
12321148
if (!allowNonDereferencingOps) {
12331149
// Failure: memref used in a non-dereferencing context (potentially
12341150
// escapes); no replacement in these cases unless allowNonDereferencingOps
12351151
// is set.
12361152
return failure();
12371153
}
1154+
for (unsigned pos : usePositions)
1155+
op->setOperand(pos, newMemRef);
1156+
return success();
1157+
}
12381158

1239-
// Check if it is a memref.load
1240-
auto memrefLoad = dyn_cast<memref::LoadOp>(op);
1241-
bool isReductionLike =
1242-
indexRemap.getNumResults() < indexRemap.getNumInputs();
1243-
if (!memrefLoad || !isReductionLike) {
1244-
op->setOperand(memRefOperandPos, newMemRef);
1245-
return success();
1246-
}
1159+
if (usePositions.size() > 1) {
1160+
// TODO: extend it for this case when needed (rare).
1161+
LLVM_DEBUG(llvm::dbgs()
1162+
<< "multiple dereferencing uses in a single op not supported");
1163+
return failure();
1164+
}
12471165

1248-
return transformMemRefLoadWithReducedRank(
1249-
op, oldMemRef, newMemRef, memRefOperandPos, extraIndices, extraOperands,
1250-
symbolOperands, indexRemap);
1166+
// Perform index rewrites for the dereferencing op and then replace the op.
1167+
SmallVector<Value, 4> oldMapOperands;
1168+
AffineMap oldMap;
1169+
unsigned oldMemRefNumIndices = oldMemRefRank;
1170+
auto startIdx = op->operand_begin() + memRefOperandPos + 1;
1171+
if (affMapAccInterface) {
1172+
// If `op` implements AffineMapAccessInterface, we can get the indices by
1173+
// querying the number of map operands from the operand list from a certain
1174+
// offset (`memRefOperandPos` in this case).
1175+
NamedAttribute oldMapAttrPair =
1176+
affMapAccInterface.getAffineMapAttrForMemRef(oldMemRef);
1177+
oldMap = cast<AffineMapAttr>(oldMapAttrPair.getValue()).getValue();
1178+
oldMemRefNumIndices = oldMap.getNumInputs();
1179+
oldMapOperands.assign(startIdx, startIdx + oldMemRefNumIndices);
1180+
} else {
1181+
oldMapOperands.assign(startIdx, startIdx + oldMemRefRank);
12511182
}
1252-
// Perform index rewrites for the dereferencing op and then replace the op
1253-
NamedAttribute oldMapAttrPair =
1254-
affMapAccInterface.getAffineMapAttrForMemRef(oldMemRef);
1255-
AffineMap oldMap = cast<AffineMapAttr>(oldMapAttrPair.getValue()).getValue();
1256-
unsigned oldMapNumInputs = oldMap.getNumInputs();
1257-
SmallVector<Value, 4> oldMapOperands(
1258-
op->operand_begin() + memRefOperandPos + 1,
1259-
op->operand_begin() + memRefOperandPos + 1 + oldMapNumInputs);
12601183

12611184
// Apply 'oldMemRefOperands = oldMap(oldMapOperands)'.
12621185
SmallVector<Value, 4> oldMemRefOperands;
12631186
SmallVector<Value, 4> affineApplyOps;
12641187
oldMemRefOperands.reserve(oldMemRefRank);
1265-
if (oldMap != builder.getMultiDimIdentityMap(oldMap.getNumDims())) {
1188+
if (affMapAccInterface &&
1189+
oldMap != builder.getMultiDimIdentityMap(oldMap.getNumDims())) {
12661190
for (auto resultExpr : oldMap.getResults()) {
12671191
auto singleResMap = AffineMap::get(oldMap.getNumDims(),
12681192
oldMap.getNumSymbols(), resultExpr);
@@ -1287,7 +1211,6 @@ LogicalResult mlir::affine::replaceAllMemRefUsesWith(
12871211

12881212
SmallVector<Value, 4> remapOutputs;
12891213
remapOutputs.reserve(oldMemRefRank);
1290-
12911214
if (indexRemap &&
12921215
indexRemap != builder.getMultiDimIdentityMap(indexRemap.getNumDims())) {
12931216
// Remapped indices.
@@ -1303,7 +1226,6 @@ LogicalResult mlir::affine::replaceAllMemRefUsesWith(
13031226
// No remapping specified.
13041227
remapOutputs.assign(remapOperands.begin(), remapOperands.end());
13051228
}
1306-
13071229
SmallVector<Value, 4> newMapOperands;
13081230
newMapOperands.reserve(newMemRefRank);
13091231

@@ -1338,13 +1260,25 @@ LogicalResult mlir::affine::replaceAllMemRefUsesWith(
13381260
state.operands.push_back(newMemRef);
13391261

13401262
// Insert the new memref map operands.
1341-
state.operands.append(newMapOperands.begin(), newMapOperands.end());
1263+
if (affMapAccInterface) {
1264+
state.operands.append(newMapOperands.begin(), newMapOperands.end());
1265+
} else {
1266+
// In the case of dereferencing ops not implementing
1267+
// AffineMapAccessInterface, we need to apply the values of `newMapOperands`
1268+
// to the `newMap` to get the correct indices.
1269+
for (unsigned i = 0; i < newMemRefRank; i++)
1270+
state.operands.push_back(builder.create<AffineApplyOp>(
1271+
op->getLoc(),
1272+
AffineMap::get(newMap.getNumDims(), newMap.getNumSymbols(),
1273+
newMap.getResult(i)),
1274+
newMapOperands));
1275+
}
13421276

13431277
// Insert the remaining operands unmodified.
1278+
unsigned oldMapNumInputs = oldMapOperands.size();
13441279
state.operands.append(op->operand_begin() + memRefOperandPos + 1 +
13451280
oldMapNumInputs,
13461281
op->operand_end());
1347-
13481282
// Result types don't change. Both memref's are of the same elemental type.
13491283
state.types.reserve(op->getNumResults());
13501284
for (auto result : op->getResults())
@@ -1353,7 +1287,9 @@ LogicalResult mlir::affine::replaceAllMemRefUsesWith(
13531287
// Add attribute for 'newMap', other Attributes do not change.
13541288
auto newMapAttr = AffineMapAttr::get(newMap);
13551289
for (auto namedAttr : op->getAttrs()) {
1356-
if (namedAttr.getName() == oldMapAttrPair.getName())
1290+
if (affMapAccInterface &&
1291+
namedAttr.getName() ==
1292+
affMapAccInterface.getAffineMapAttrForMemRef(oldMemRef).getName())
13571293
state.attributes.push_back({namedAttr.getName(), newMapAttr});
13581294
else
13591295
state.attributes.push_back(namedAttr);
@@ -1845,6 +1781,95 @@ LogicalResult mlir::affine::normalizeMemRef(AllocLikeOp allocOp) {
18451781
return success();
18461782
}
18471783

1784+
LogicalResult
1785+
mlir::affine::normalizeMemRef(memref::ReinterpretCastOp reinterpretCastOp) {
1786+
MemRefType memrefType = reinterpretCastOp.getType();
1787+
AffineMap oldLayoutMap = memrefType.getLayout().getAffineMap();
1788+
Value oldMemRef = reinterpretCastOp.getResult();
1789+
1790+
// If `oldLayoutMap` is identity, `memrefType` is already normalized.
1791+
if (oldLayoutMap.isIdentity())
1792+
return success();
1793+
1794+
// Fetch a new memref type after normalizing the old memref to have an
1795+
// identity map layout.
1796+
MemRefType newMemRefType = normalizeMemRefType(memrefType);
1797+
newMemRefType.dump();
1798+
if (newMemRefType == memrefType)
1799+
// `oldLayoutMap` couldn't be transformed to an identity map.
1800+
return failure();
1801+
1802+
uint64_t newRank = newMemRefType.getRank();
1803+
SmallVector<Value> mapOperands(oldLayoutMap.getNumDims() +
1804+
oldLayoutMap.getNumSymbols());
1805+
SmallVector<Value> oldStrides = reinterpretCastOp.getStrides();
1806+
Location loc = reinterpretCastOp.getLoc();
1807+
// As `newMemRefType` is normalized, it is unit strided.
1808+
SmallVector<int64_t> newStaticStrides(newRank, 1);
1809+
SmallVector<int64_t> newStaticOffsets(newRank, 0);
1810+
ArrayRef<int64_t> oldShape = memrefType.getShape();
1811+
mlir::ValueRange oldSizes = reinterpretCastOp.getSizes();
1812+
unsigned idx = 0;
1813+
SmallVector<int64_t> newStaticSizes;
1814+
OpBuilder b(reinterpretCastOp);
1815+
// Collect the map operands which will be used to compute the new normalized
1816+
// memref shape.
1817+
for (unsigned i = 0, e = memrefType.getRank(); i < e; i++) {
1818+
if (memrefType.isDynamicDim(i))
1819+
mapOperands[i] =
1820+
b.create<arith::SubIOp>(loc, oldSizes[0].getType(), oldSizes[idx++],
1821+
b.create<arith::ConstantIndexOp>(loc, 1));
1822+
else
1823+
mapOperands[i] = b.create<arith::ConstantIndexOp>(loc, oldShape[i] - 1);
1824+
}
1825+
for (unsigned i = 0, e = oldStrides.size(); i < e; i++)
1826+
mapOperands[memrefType.getRank() + i] = oldStrides[i];
1827+
SmallVector<Value> newSizes;
1828+
ArrayRef<int64_t> newShape = newMemRefType.getShape();
1829+
// Compute size along all the dimensions of the new normalized memref.
1830+
for (unsigned i = 0; i < newRank; i++) {
1831+
if (!newMemRefType.isDynamicDim(i))
1832+
continue;
1833+
newSizes.push_back(b.create<AffineApplyOp>(
1834+
loc,
1835+
AffineMap::get(oldLayoutMap.getNumDims(), oldLayoutMap.getNumSymbols(),
1836+
oldLayoutMap.getResult(i)),
1837+
mapOperands));
1838+
}
1839+
for (unsigned i = 0, e = newSizes.size(); i < e; i++)
1840+
newSizes[i] =
1841+
b.create<arith::AddIOp>(loc, newSizes[i].getType(), newSizes[i],
1842+
b.create<arith::ConstantIndexOp>(loc, 1));
1843+
// Create the new reinterpret_cast op.
1844+
memref::ReinterpretCastOp newReinterpretCast =
1845+
b.create<memref::ReinterpretCastOp>(
1846+
loc, newMemRefType, reinterpretCastOp.getSource(),
1847+
/*offsets=*/mlir::ValueRange(), newSizes,
1848+
/*strides=*/mlir::ValueRange(),
1849+
/*static_offsets=*/newStaticOffsets,
1850+
/*static_sizes=*/newShape,
1851+
/*static_strides=*/newStaticStrides);
1852+
1853+
// Replace all uses of the old memref.
1854+
if (failed(replaceAllMemRefUsesWith(oldMemRef,
1855+
/*newMemRef=*/newReinterpretCast,
1856+
/*extraIndices=*/{},
1857+
/*indexRemap=*/oldLayoutMap,
1858+
/*extraOperands=*/{},
1859+
/*symbolOperands=*/oldStrides,
1860+
/*domOpFilter=*/nullptr,
1861+
/*postDomOpFilter=*/nullptr,
1862+
/*allowNonDereferencingOps=*/true))) {
1863+
// If it failed (due to escapes for example), bail out.
1864+
newReinterpretCast.erase();
1865+
return failure();
1866+
}
1867+
1868+
oldMemRef.replaceAllUsesWith(newReinterpretCast);
1869+
reinterpretCastOp.erase();
1870+
return success();
1871+
}
1872+
18481873
template LogicalResult
18491874
mlir::affine::normalizeMemRef<memref::AllocaOp>(memref::AllocaOp op);
18501875
template LogicalResult

0 commit comments

Comments
 (0)