Skip to content

[ThinLTO] Use a set rather than a map to track exported ValueInfos. #97360

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Merged
merged 4 commits into from
Jul 3, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
11 changes: 4 additions & 7 deletions llvm/include/llvm/Transforms/IPO/FunctionImport.h
Original file line number Diff line number Diff line change
Expand Up @@ -104,13 +104,10 @@ class FunctionImporter {
/// index's module path string table).
using ImportMapTy = DenseMap<StringRef, FunctionsToImportTy>;

/// The map contains an entry for every global value the module exports.
/// The key is ValueInfo, and the value indicates whether the definition
/// or declaration is visible to another module. If a function's definition is
/// visible to other modules, the global values this function referenced are
/// visible and shouldn't be internalized.
/// TODO: Rename to `ExportMapTy`.
using ExportSetTy = DenseMap<ValueInfo, GlobalValueSummary::ImportKind>;
/// The set contains an entry for every global value that the module exports.
/// Depending on the user context, this container is allowed to contain
/// definitions, declarations or a mix of both.
using ExportSetTy = DenseSet<ValueInfo>;

/// A function of this type is used to load modules referenced by the index.
using ModuleLoaderTy =
Expand Down
14 changes: 6 additions & 8 deletions llvm/lib/LTO/LTO.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -161,19 +161,17 @@ void llvm::computeLTOCacheKey(
auto ModHash = Index.getModuleHash(ModuleID);
Hasher.update(ArrayRef<uint8_t>((uint8_t *)&ModHash[0], sizeof(ModHash)));

std::vector<std::pair<uint64_t, uint8_t>> ExportsGUID;
// TODO: `ExportList` is determined by `ImportList`. Since `ImportList` is
// used to compute cache key, we could omit hashing `ExportList` here.
std::vector<uint64_t> ExportsGUID;
ExportsGUID.reserve(ExportList.size());
for (const auto &[VI, ExportType] : ExportList)
ExportsGUID.push_back(
std::make_pair(VI.getGUID(), static_cast<uint8_t>(ExportType)));
for (const auto &VI : ExportList)
ExportsGUID.push_back(VI.getGUID());

// Sort the export list elements GUIDs.
llvm::sort(ExportsGUID);
for (auto [GUID, ExportType] : ExportsGUID) {
// The export list can impact the internalization, be conservative here
for (auto GUID : ExportsGUID)
Hasher.update(ArrayRef<uint8_t>((uint8_t *)&GUID, sizeof(GUID)));
AddUint8(ExportType);
}

// Include the hash for every module we import functions from. The set of
// imported symbols for each module may affect code generation and is
Expand Down
112 changes: 49 additions & 63 deletions llvm/lib/Transforms/IPO/FunctionImport.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -400,8 +400,7 @@ class GlobalsImporter final {
// later, in ComputeCrossModuleImport, after import decisions are
// complete, which is more efficient than adding them here.
if (ExportLists)
(*ExportLists)[RefSummary->modulePath()][VI] =
GlobalValueSummary::Definition;
(*ExportLists)[RefSummary->modulePath()].insert(VI);

// If variable is not writeonly we attempt to recursively analyze
// its references in order to import referenced constants.
Expand Down Expand Up @@ -582,7 +581,7 @@ class WorkloadImportsManager : public ModuleImportsManager {
GlobalValueSummary::Definition;
GVI.onImportingSummary(*GVS);
if (ExportLists)
(*ExportLists)[ExportingModule][VI] = GlobalValueSummary::Definition;
(*ExportLists)[ExportingModule].insert(VI);
}
LLVM_DEBUG(dbgs() << "[Workload] Done\n");
}
Expand Down Expand Up @@ -818,10 +817,8 @@ static void computeImportForFunction(
// Since definition takes precedence over declaration for the same VI,
// try emplace <VI, declaration> pair without checking insert result.
// If insert doesn't happen, there must be an existing entry keyed by
// VI.
if (ExportLists)
(*ExportLists)[DeclSourceModule].try_emplace(
VI, GlobalValueSummary::Declaration);
// VI. Note `ExportLists` only keeps track of exports due to imported
// definitions.
ImportList[DeclSourceModule].try_emplace(
VI.getGUID(), GlobalValueSummary::Declaration);
}
Expand Down Expand Up @@ -892,7 +889,7 @@ static void computeImportForFunction(
// later, in ComputeCrossModuleImport, after import decisions are
// complete, which is more efficient than adding them here.
if (ExportLists)
(*ExportLists)[ExportModulePath][VI] = GlobalValueSummary::Definition;
(*ExportLists)[ExportModulePath].insert(VI);
}

auto GetAdjustedThreshold = [](unsigned Threshold, bool IsHotCallsite) {
Expand Down Expand Up @@ -998,19 +995,29 @@ static bool isGlobalVarSummary(const ModuleSummaryIndex &Index,
return false;
}

template <class T>
static unsigned numGlobalVarSummaries(const ModuleSummaryIndex &Index, T &Cont,
unsigned &DefinedGVS,
unsigned &DefinedFS) {
// Return the number of global variable summaries in ExportSet.
static unsigned
numGlobalVarSummaries(const ModuleSummaryIndex &Index,
FunctionImporter::ExportSetTy &ExportSet) {
unsigned NumGVS = 0;
for (auto &VI : ExportSet)
if (isGlobalVarSummary(Index, VI.getGUID()))
++NumGVS;
return NumGVS;
}

// Given ImportMap, return the number of global variable summaries and record
// the number of defined function summaries as output parameter.
static unsigned
numGlobalVarSummaries(const ModuleSummaryIndex &Index,
FunctionImporter::FunctionsToImportTy &ImportMap,
unsigned &DefinedFS) {
unsigned NumGVS = 0;
DefinedGVS = 0;
DefinedFS = 0;
for (auto &[GUID, Type] : Cont) {
if (isGlobalVarSummary(Index, GUID)) {
if (Type == GlobalValueSummary::Definition)
++DefinedGVS;
for (auto &[GUID, Type] : ImportMap) {
if (isGlobalVarSummary(Index, GUID))
++NumGVS;
} else if (Type == GlobalValueSummary::Definition)
else if (Type == GlobalValueSummary::Definition)
++DefinedFS;
}
return NumGVS;
Expand Down Expand Up @@ -1046,7 +1053,7 @@ static bool checkVariableImport(
};

for (auto &ExportPerModule : ExportLists)
for (auto &[VI, Unused] : ExportPerModule.second)
for (auto &VI : ExportPerModule.second)
if (!FlattenedImports.count(VI.getGUID()) &&
IsReadOrWriteOnlyVarNeedingImporting(ExportPerModule.first, VI))
return false;
Expand Down Expand Up @@ -1079,14 +1086,12 @@ void llvm::ComputeCrossModuleImport(
// since we may import the same values multiple times into different modules
// during the import computation.
for (auto &ELI : ExportLists) {
// `NewExports` tracks the VI that gets exported because the full definition
// of its user/referencer gets exported.
FunctionImporter::ExportSetTy NewExports;
const auto &DefinedGVSummaries =
ModuleToDefinedGVSummaries.lookup(ELI.first);
for (auto &[EI, Type] : ELI.second) {
// If a variable is exported as a declaration, its 'refs' and 'calls' are
// not further exported.
if (Type == GlobalValueSummary::Declaration)
continue;
for (auto &EI : ELI.second) {
// Find the copy defined in the exporting module so that we can mark the
// values it references in that specific definition as exported.
// Below we will add all references and called values, without regard to
Expand All @@ -1105,31 +1110,22 @@ void llvm::ComputeCrossModuleImport(
// we convert such variables initializers to "zeroinitializer".
// See processGlobalForThinLTO.
if (!Index.isWriteOnly(GVS))
for (const auto &VI : GVS->refs()) {
// Try to emplace the declaration entry. If a definition entry
// already exists for key `VI`, this is a no-op.
NewExports.try_emplace(VI, GlobalValueSummary::Declaration);
}
for (const auto &VI : GVS->refs())
NewExports.insert(VI);
} else {
auto *FS = cast<FunctionSummary>(S);
for (const auto &Edge : FS->calls()) {
// Try to emplace the declaration entry. If a definition entry
// already exists for key `VI`, this is a no-op.
NewExports.try_emplace(Edge.first, GlobalValueSummary::Declaration);
}
for (const auto &Ref : FS->refs()) {
// Try to emplace the declaration entry. If a definition entry
// already exists for key `VI`, this is a no-op.
NewExports.try_emplace(Ref, GlobalValueSummary::Declaration);
}
for (const auto &Edge : FS->calls())
NewExports.insert(Edge.first);
for (const auto &Ref : FS->refs())
NewExports.insert(Ref);
}
}
// Prune list computed above to only include values defined in the
// exporting module. We do this after the above insertion since we may hit
// the same ref/call target multiple times in above loop, and it is more
// efficient to avoid a set lookup each time.
for (auto EI = NewExports.begin(); EI != NewExports.end();) {
if (!DefinedGVSummaries.count(EI->first.getGUID()))
if (!DefinedGVSummaries.count(EI->getGUID()))
NewExports.erase(EI++);
else
++EI;
Expand All @@ -1144,29 +1140,22 @@ void llvm::ComputeCrossModuleImport(
for (auto &ModuleImports : ImportLists) {
auto ModName = ModuleImports.first;
auto &Exports = ExportLists[ModName];
unsigned DefinedGVS = 0, DefinedFS = 0;
unsigned NumGVS =
numGlobalVarSummaries(Index, Exports, DefinedGVS, DefinedFS);
LLVM_DEBUG(dbgs() << "* Module " << ModName << " exports " << DefinedFS
<< " function as definitions, "
<< Exports.size() - NumGVS - DefinedFS
<< " functions as declarations, " << DefinedGVS
<< " var definitions and " << NumGVS - DefinedGVS
<< " var declarations. Imports from "
<< ModuleImports.second.size() << " modules.\n");
unsigned NumGVS = numGlobalVarSummaries(Index, Exports);
LLVM_DEBUG(dbgs() << "* Module " << ModName << " exports "
<< Exports.size() - NumGVS << " functions and " << NumGVS
<< " vars. Imports from " << ModuleImports.second.size()
<< " modules.\n");
for (auto &Src : ModuleImports.second) {
auto SrcModName = Src.first;
unsigned DefinedGVS = 0, DefinedFS = 0;
unsigned DefinedFS = 0;
unsigned NumGVSPerMod =
numGlobalVarSummaries(Index, Src.second, DefinedGVS, DefinedFS);
numGlobalVarSummaries(Index, Src.second, DefinedFS);
LLVM_DEBUG(dbgs() << " - " << DefinedFS << " function definitions and "
<< Src.second.size() - NumGVSPerMod - DefinedFS
<< " function declarations imported from " << SrcModName
<< "\n");
LLVM_DEBUG(dbgs() << " - " << DefinedGVS << " global vars definition and "
<< NumGVSPerMod - DefinedGVS
<< " global vars declaration imported from "
<< SrcModName << "\n");
LLVM_DEBUG(dbgs() << " - " << NumGVSPerMod
<< " global vars imported from " << SrcModName << "\n");
}
}
#endif
Expand All @@ -1180,17 +1169,14 @@ static void dumpImportListForModule(const ModuleSummaryIndex &Index,
<< ImportList.size() << " modules.\n");
for (auto &Src : ImportList) {
auto SrcModName = Src.first;
unsigned DefinedGVS = 0, DefinedFS = 0;
unsigned NumGVSPerMod =
numGlobalVarSummaries(Index, Src.second, DefinedGVS, DefinedFS);
unsigned DefinedFS = 0;
unsigned NumGVSPerMod = numGlobalVarSummaries(Index, Src.second, DefinedFS);
LLVM_DEBUG(dbgs() << " - " << DefinedFS << " function definitions and "
<< Src.second.size() - DefinedFS - NumGVSPerMod
<< " function declarations imported from " << SrcModName
<< "\n");
LLVM_DEBUG(dbgs() << " - " << DefinedGVS << " var definitions and "
<< NumGVSPerMod - DefinedGVS
<< " var declarations imported from " << SrcModName
<< "\n");
LLVM_DEBUG(dbgs() << " - " << NumGVSPerMod << " vars imported from "
<< SrcModName << "\n");
}
}
#endif
Expand Down
2 changes: 1 addition & 1 deletion llvm/test/ThinLTO/X86/funcimport-stats.ll
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@
; RUN: cat %t4 | FileCheck %s

; CHECK: - [[NUM_FUNCS:[0-9]+]] function definitions and 0 function declarations imported from
; CHECK-NEXT: - [[NUM_VARS:[0-9]+]] global vars definition and 0 global vars declaration imported from
; CHECK-NEXT: - [[NUM_VARS:[0-9]+]] global vars imported from

; CHECK: [[NUM_FUNCS]] function-import - Number of functions imported in backend
; CHECK-NEXT: [[NUM_FUNCS]] function-import - Number of functions thin link decided to import
Expand Down
2 changes: 1 addition & 1 deletion llvm/test/Transforms/FunctionImport/funcimport.ll
Original file line number Diff line number Diff line change
Expand Up @@ -167,7 +167,7 @@ declare void @variadic_va_start(...)

; DUMP: Module [[M1:.*]] imports from 1 module
; DUMP-NEXT: 15 function definitions and 0 function declarations imported from [[M2:.*]]
; DUMP-NEXT: 4 var definitions and 0 var declarations imported from [[M2]]
; DUMP-NEXT: 4 vars imported from [[M2]]

; DUMP: Imported 15 functions for Module [[M1]]
; DUMP-NEXT: Imported 4 global variables for Module [[M1]]
Loading