Skip to content

Commit 216dc73

Browse files
authored
Merge branch 'main' into fx-mul-libcalls
2 parents 2390373 + a7759fb commit 216dc73

File tree

3 files changed

+22
-23
lines changed

3 files changed

+22
-23
lines changed

mlir/lib/Dialect/MLProgram/IR/MLProgramOps.cpp

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -178,7 +178,7 @@ LogicalResult GlobalOp::verify() {
178178
//===----------------------------------------------------------------------===//
179179

180180
GlobalOp GlobalLoadOp::getGlobalOp(SymbolTableCollection &symbolTable) {
181-
for (auto parent = getOperation()->getParentOp(); parent;
181+
for (auto *parent = getOperation()->getParentOp(); parent;
182182
parent = parent->getParentOp()) {
183183
if (auto nearest = symbolTable.lookupNearestSymbolFrom<GlobalOp>(
184184
parent, getGlobalAttr())) {
@@ -259,7 +259,7 @@ GlobalLoadGraphOp::verifySymbolUses(SymbolTableCollection &symbolTable) {
259259
//===----------------------------------------------------------------------===//
260260

261261
GlobalOp GlobalStoreOp::getGlobalOp(SymbolTableCollection &symbolTable) {
262-
for (auto parent = getOperation()->getParentOp(); parent;) {
262+
for (auto *parent = getOperation()->getParentOp(); parent;) {
263263
if (auto nearest = symbolTable.lookupNearestSymbolFrom<GlobalOp>(
264264
parent, getGlobalAttr())) {
265265
return nearest;

mlir/lib/Dialect/MLProgram/Transforms/PipelineGlobalOps.cpp

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -29,7 +29,7 @@ class MLProgramPipelineGlobals
2929
private:
3030
LogicalResult buildGlobalMap(ModuleOp op);
3131

32-
void ProcessBlock(Block &block, llvm::DenseSet<SymbolRefAttr> &symbolLoad,
32+
void processBlock(Block &block, llvm::DenseSet<SymbolRefAttr> &symbolLoad,
3333
llvm::DenseSet<SymbolRefAttr> &symbolStore);
3434

3535
llvm::DenseMap<SymbolRefAttr, llvm::DenseSet<SymbolRefAttr>> loadSymbolsMap;
@@ -38,8 +38,8 @@ class MLProgramPipelineGlobals
3838

3939
// Traverses upwards searching for the operation mapped by the symbol.
4040
static Operation *getFromSymbol(Operation *baseOp, SymbolRefAttr symbol) {
41-
for (auto op = baseOp; op; op = op->getParentOp()) {
42-
auto lookup = SymbolTable::lookupNearestSymbolFrom(op, symbol);
41+
for (auto *op = baseOp; op; op = op->getParentOp()) {
42+
auto *lookup = SymbolTable::lookupNearestSymbolFrom(op, symbol);
4343
if (lookup)
4444
return lookup;
4545
}
@@ -59,7 +59,7 @@ LogicalResult MLProgramPipelineGlobals::buildGlobalMap(ModuleOp module) {
5959
}
6060

6161
auto symbol = mlir::dyn_cast<SymbolRefAttr>(callable);
62-
auto func = getFromSymbol(op, symbol);
62+
auto *func = getFromSymbol(op, symbol);
6363
callableMap[symbol] = func;
6464
}
6565
return WalkResult::advance();
@@ -122,7 +122,7 @@ LogicalResult MLProgramPipelineGlobals::buildGlobalMap(ModuleOp module) {
122122

123123
// Process each operation in the block deleting unneeded loads / stores,
124124
// recursing on subblocks and checking function calls.
125-
void MLProgramPipelineGlobals::ProcessBlock(
125+
void MLProgramPipelineGlobals::processBlock(
126126
Block &block, llvm::DenseSet<SymbolRefAttr> &symbolLoad,
127127
llvm::DenseSet<SymbolRefAttr> &symbolStore) {
128128

@@ -184,7 +184,7 @@ void MLProgramPipelineGlobals::ProcessBlock(
184184
llvm::DenseSet<SymbolRefAttr> opSymbolStore;
185185
for (auto &region : op.getRegions()) {
186186
for (auto &block : region) {
187-
ProcessBlock(block, opSymbolLoad, opSymbolStore);
187+
processBlock(block, opSymbolLoad, opSymbolStore);
188188
}
189189
}
190190

@@ -201,7 +201,7 @@ void MLProgramPipelineGlobals::ProcessBlock(
201201
}
202202
}
203203

204-
for (auto op : toDelete) {
204+
for (auto *op : toDelete) {
205205
op->erase();
206206
}
207207
}
@@ -217,7 +217,7 @@ void MLProgramPipelineGlobals::runOnOperation() {
217217
for (auto &block : region.getBlocks()) {
218218
llvm::DenseSet<SymbolRefAttr> symbolsLoaded;
219219
llvm::DenseSet<SymbolRefAttr> symbolsStored;
220-
ProcessBlock(block, symbolsLoaded, symbolsStored);
220+
processBlock(block, symbolsLoaded, symbolsStored);
221221
}
222222
}
223223
}

mlir/lib/Dialect/NVGPU/TransformOps/NVGPUTransformOps.cpp

Lines changed: 12 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -40,7 +40,7 @@ using namespace mlir::transform;
4040
#define DEBUG_TYPE "nvgpu-transforms"
4141
#define DBGS() (llvm::dbgs() << "[" DEBUG_TYPE "]: ")
4242
#define DBGSNL() (llvm::dbgs() << "\n")
43-
#define LDBG(X) LLVM_DEBUG(DBGS() << X << "\n")
43+
#define LDBG(X) LLVM_DEBUG(DBGS() << (X) << "\n")
4444

4545
//===----------------------------------------------------------------------===//
4646
// Apply...ConversionPatternsOp
@@ -606,7 +606,7 @@ struct MmaSyncBuilder {
606606
/// IndexCalculator callback.
607607
SmallVector<Value> buildMemRefLoads(OpBuilder &b, Location loc,
608608
OpFoldResult laneId, Value memref,
609-
IndexCalculator indexFn);
609+
const IndexCalculator &indexFn);
610610

611611
/// Perform a distributed load of a vector operand of `vectorShape` for a
612612
/// particular MMA instruction whose `(row, col)` indices are specified via
@@ -625,7 +625,7 @@ struct MmaSyncBuilder {
625625
SmallVector<Operation *> buildMemRefStores(OpBuilder &b, Location loc,
626626
ValueRange toStore,
627627
OpFoldResult laneId, Value memref,
628-
IndexCalculator indexFn);
628+
const IndexCalculator &indexFn);
629629

630630
/// Perform a distributed store of a vector operand of `vectorShape` for a
631631
/// particular MMA instruction whose `(row, col)` indices are specified via
@@ -660,10 +660,10 @@ static void foreachIndividualVectorElement(Value vector, ApplyFn applyFn,
660660
}
661661
}
662662

663-
SmallVector<Value> MmaSyncBuilder::buildMemRefLoads(OpBuilder &b, Location loc,
664-
OpFoldResult laneId,
665-
Value memref,
666-
IndexCalculator indexFn) {
663+
SmallVector<Value>
664+
MmaSyncBuilder::buildMemRefLoads(OpBuilder &b, Location loc,
665+
OpFoldResult laneId, Value memref,
666+
const IndexCalculator &indexFn) {
667667
auto aff = [&](AffineExpr e) {
668668
return affine::makeComposedFoldedAffineApply(b, loc, e, laneId);
669669
};
@@ -681,7 +681,7 @@ SmallVector<Value> MmaSyncBuilder::buildMemRefLoads(OpBuilder &b, Location loc,
681681
Value MmaSyncBuilder::buildMmaSyncMemRefLoadOperand(
682682
OpBuilder &b, Location loc, OpFoldResult laneId, Value memref,
683683
IndexCalculator indexFn, ArrayRef<int64_t> vectorShape) {
684-
auto loads = buildMemRefLoads(b, loc, laneId, memref, indexFn);
684+
auto loads = buildMemRefLoads(b, loc, laneId, memref, std::move(indexFn));
685685

686686
Type elementType = getElementTypeOrSelf(memref.getType());
687687
auto vt = VectorType::get(vectorShape, elementType);
@@ -700,10 +700,9 @@ Value MmaSyncBuilder::buildMmaSyncMemRefLoadOperand(
700700
return res;
701701
}
702702

703-
SmallVector<Operation *>
704-
MmaSyncBuilder::buildMemRefStores(OpBuilder &b, Location loc,
705-
ValueRange toStore, OpFoldResult laneId,
706-
Value memref, IndexCalculator indexFn) {
703+
SmallVector<Operation *> MmaSyncBuilder::buildMemRefStores(
704+
OpBuilder &b, Location loc, ValueRange toStore, OpFoldResult laneId,
705+
Value memref, const IndexCalculator &indexFn) {
707706
auto aff = [&](AffineExpr e) {
708707
return affine::makeComposedFoldedAffineApply(b, loc, e, laneId);
709708
};
@@ -734,7 +733,7 @@ SmallVector<Operation *> MmaSyncBuilder::buildMmaSyncMemRefStoreOperand(
734733
[&](Value v, int64_t linearIdx, ArrayRef<int64_t> indices) {
735734
toStore.push_back(v);
736735
});
737-
return buildMemRefStores(b, loc, toStore, laneId, memref, indexFn);
736+
return buildMemRefStores(b, loc, toStore, laneId, memref, std::move(indexFn));
738737
}
739738

740739
static std::tuple<SmallVector<int64_t>, SmallVector<int64_t>,

0 commit comments

Comments
 (0)