Skip to content

[CAS] Cache symbol graph outputs #77935

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Merged
merged 1 commit into from
Dec 4, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions include/swift/Basic/FileTypes.def
Original file line number Diff line number Diff line change
Expand Up @@ -98,6 +98,7 @@ TYPE("swiftoverlay", SwiftOverlayFile, "swiftoverlay", "")

// Misc types
TYPE("pcm", ClangModuleFile, "pcm", "")
TYPE("symbol-graph", SymbolGraphFile, "symbols.json", "")
TYPE("pch", PCH, "pch", "")
TYPE("none", Nothing, "", "")

Expand Down
1 change: 1 addition & 0 deletions include/swift/Frontend/CASOutputBackends.h
Original file line number Diff line number Diff line change
Expand Up @@ -46,6 +46,7 @@ class SwiftCASOutputBackend : public llvm::vfs::OutputBackend {
llvm::cas::ActionCache &Cache,
llvm::cas::ObjectRef BaseKey,
const FrontendInputsAndOutputs &InputsAndOutputs,
const FrontendOptions &Opts,
FrontendOptions::ActionType Action);
~SwiftCASOutputBackend();

Expand Down
2 changes: 1 addition & 1 deletion include/swift/Frontend/CachingUtils.h
Original file line number Diff line number Diff line change
Expand Up @@ -36,7 +36,7 @@ createSwiftCachingOutputBackend(
llvm::cas::ObjectStore &CAS, llvm::cas::ActionCache &Cache,
llvm::cas::ObjectRef BaseKey,
const FrontendInputsAndOutputs &InputsAndOutputs,
FrontendOptions::ActionType Action);
const FrontendOptions &Opts, FrontendOptions::ActionType Action);

/// Replay the output of the compilation from cache.
/// Return true if outputs are replayed, false otherwise.
Expand Down
4 changes: 4 additions & 0 deletions lib/Basic/FileTypes.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -116,6 +116,7 @@ bool file_types::isTextual(ID Id) {
case file_types::TY_SwiftABIDescriptor:
case file_types::TY_SwiftAPIDescriptor:
case file_types::TY_ConstValues:
case file_types::TY_SymbolGraphFile:
return true;
case file_types::TY_Image:
case file_types::TY_Object:
Expand Down Expand Up @@ -202,6 +203,7 @@ bool file_types::isAfterLLVM(ID Id) {
case file_types::TY_SwiftFixIt:
case file_types::TY_ModuleSemanticInfo:
case file_types::TY_CachedDiagnostics:
case file_types::TY_SymbolGraphFile:
return false;
case file_types::TY_INVALID:
llvm_unreachable("Invalid type ID.");
Expand Down Expand Up @@ -263,6 +265,7 @@ bool file_types::isPartOfSwiftCompilation(ID Id) {
case file_types::TY_SwiftFixIt:
case file_types::TY_ModuleSemanticInfo:
case file_types::TY_CachedDiagnostics:
case file_types::TY_SymbolGraphFile:
return false;
case file_types::TY_INVALID:
llvm_unreachable("Invalid type ID.");
Expand Down Expand Up @@ -324,6 +327,7 @@ bool file_types::isProducedFromDiagnostics(ID Id) {
case file_types::TY_SwiftAPIDescriptor:
case file_types::TY_ConstValues:
case file_types::TY_ModuleSemanticInfo:
case file_types::TY_SymbolGraphFile:
return false;
case file_types::TY_INVALID:
llvm_unreachable("Invalid type ID.");
Expand Down
1 change: 1 addition & 0 deletions lib/Driver/Driver.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -1708,6 +1708,7 @@ void Driver::buildActions(SmallVectorImpl<const Action *> &TopLevelActions,
case file_types::TY_SwiftFixIt:
case file_types::TY_ModuleSemanticInfo:
case file_types::TY_CachedDiagnostics:
case file_types::TY_SymbolGraphFile:
// We could in theory handle assembly or LLVM input, but let's not.
// FIXME: What about LTO?
Diags.diagnose(SourceLoc(), diag::error_unexpected_input_file,
Expand Down
2 changes: 2 additions & 0 deletions lib/Driver/ToolChains.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -782,6 +782,7 @@ const char *ToolChain::JobContext::computeFrontendModeForCompile() const {
case file_types::TY_SwiftFixIt:
case file_types::TY_ModuleSemanticInfo:
case file_types::TY_CachedDiagnostics:
case file_types::TY_SymbolGraphFile:
llvm_unreachable("Output type can never be primary output.");
case file_types::TY_INVALID:
llvm_unreachable("Invalid type ID");
Expand Down Expand Up @@ -1057,6 +1058,7 @@ ToolChain::constructInvocation(const BackendJobAction &job,
case file_types::TY_SwiftFixIt:
case file_types::TY_ModuleSemanticInfo:
case file_types::TY_CachedDiagnostics:
case file_types::TY_SymbolGraphFile:
llvm_unreachable("Output type can never be primary output.");
case file_types::TY_INVALID:
llvm_unreachable("Invalid type ID");
Expand Down
42 changes: 38 additions & 4 deletions lib/Frontend/CASOutputBackends.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -57,16 +57,39 @@ class SwiftCASOutputBackend::Implementation {
public:
Implementation(ObjectStore &CAS, ActionCache &Cache, ObjectRef BaseKey,
const FrontendInputsAndOutputs &InputsAndOutputs,
const FrontendOptions &Opts,
FrontendOptions::ActionType Action)
: CAS(CAS), Cache(Cache), BaseKey(BaseKey),
InputsAndOutputs(InputsAndOutputs), Action(Action) {
InputsAndOutputs(InputsAndOutputs), Opts(Opts), Action(Action) {
initBackend(InputsAndOutputs);
}

llvm::Expected<std::unique_ptr<llvm::vfs::OutputFileImpl>>
createFileImpl(llvm::StringRef ResolvedPath,
std::optional<llvm::vfs::OutputConfig> Config) {
auto ProducingInput = OutputToInputMap.find(ResolvedPath);
if (ProducingInput == OutputToInputMap.end() &&
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Instead of doing this special condition, I prefer add symbol graph to SupplementaryOutputPaths and compute the path in ArgsToFrontendOutputsConverter.cpp.

Hope it is not too bad to pass the output path to the location where the file is generated.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I prefer add symbol graph to SupplementaryOutputPaths and compute the path in ArgsToFrontendOutputsConverter.cpp.

The symbol graph contains an arbitrary number of files, and I think you can't know how many files there will be until you typecheck, because if you have module A that contains import B; extension B.Foo { public func bar() {} } there will be A.symbols.json and [email protected]. That's why I didn't model it as a "normal" output.

ResolvedPath.starts_with(Opts.SymbolGraphOutputDir)) {
return std::make_unique<SwiftCASOutputFile>(
ResolvedPath, [this](StringRef Path, StringRef Bytes) -> Error {
bool Shortened = Path.consume_front(Opts.SymbolGraphOutputDir);
assert(Shortened && "symbol graph path outside output dir");
(void)Shortened;
std::optional<ObjectRef> PathRef;
if (Error E =
CAS.storeFromString(std::nullopt, Path).moveInto(PathRef))
return E;
std::optional<ObjectRef> BytesRef;
if (Error E =
CAS.storeFromString(std::nullopt, Bytes).moveInto(BytesRef))
return E;
auto Ref = CAS.store({*PathRef, *BytesRef}, {});
if (!Ref)
return Ref.takeError();
SymbolGraphOutputRefs.push_back(*Ref);
return Error::success();
});
}
assert(ProducingInput != OutputToInputMap.end() && "Unknown output file");

unsigned InputIndex = ProducingInput->second.first;
Expand Down Expand Up @@ -97,21 +120,24 @@ class SwiftCASOutputBackend::Implementation {
ActionCache &Cache;
ObjectRef BaseKey;
const FrontendInputsAndOutputs &InputsAndOutputs;
const FrontendOptions &Opts;
FrontendOptions::ActionType Action;

// Map from output path to the input index and output kind.
StringMap<std::pair<unsigned, file_types::ID>> OutputToInputMap;

// A vector of output refs where the index is the input index.
SmallVector<DenseMap<file_types::ID, ObjectRef>> OutputRefs;

SmallVector<ObjectRef> SymbolGraphOutputRefs;
};

SwiftCASOutputBackend::SwiftCASOutputBackend(
ObjectStore &CAS, ActionCache &Cache, ObjectRef BaseKey,
const FrontendInputsAndOutputs &InputsAndOutputs,
FrontendOptions::ActionType Action)
const FrontendOptions &Opts, FrontendOptions::ActionType Action)
: Impl(*new SwiftCASOutputBackend::Implementation(
CAS, Cache, BaseKey, InputsAndOutputs, Action)) {}
CAS, Cache, BaseKey, InputsAndOutputs, Opts, Action)) {}

SwiftCASOutputBackend::~SwiftCASOutputBackend() { delete &Impl; }

Expand All @@ -122,7 +148,8 @@ bool SwiftCASOutputBackend::isStoredDirectly(file_types::ID Kind) {

IntrusiveRefCntPtr<OutputBackend> SwiftCASOutputBackend::cloneImpl() const {
return makeIntrusiveRefCnt<SwiftCASOutputBackend>(
Impl.CAS, Impl.Cache, Impl.BaseKey, Impl.InputsAndOutputs, Impl.Action);
Impl.CAS, Impl.Cache, Impl.BaseKey, Impl.InputsAndOutputs, Impl.Opts,
Impl.Action);
}

Expected<std::unique_ptr<OutputFileImpl>>
Expand Down Expand Up @@ -243,6 +270,13 @@ Error SwiftCASOutputBackend::Implementation::finalizeCacheKeysFor(
llvm::for_each(ProducedOutputs, [&OutputsForInput](auto E) {
OutputsForInput.emplace_back(E.first, E.second);
});
if (InputIndex == InputsAndOutputs.getIndexOfFirstOutputProducingInput() &&
!SymbolGraphOutputRefs.empty()) {
auto SGRef = CAS.store(SymbolGraphOutputRefs, {});
if (!SGRef)
return SGRef.takeError();
OutputsForInput.emplace_back(file_types::ID::TY_SymbolGraphFile, *SGRef);
}
// Sort to a stable ordering for deterministic output cache object.
llvm::sort(OutputsForInput,
[](auto &LHS, auto &RHS) { return LHS.first < RHS.first; });
Expand Down
37 changes: 32 additions & 5 deletions lib/Frontend/CachingUtils.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -54,14 +54,13 @@ using namespace llvm::vfs;

namespace swift {

llvm::IntrusiveRefCntPtr<SwiftCASOutputBackend>
createSwiftCachingOutputBackend(
llvm::IntrusiveRefCntPtr<SwiftCASOutputBackend> createSwiftCachingOutputBackend(
llvm::cas::ObjectStore &CAS, llvm::cas::ActionCache &Cache,
llvm::cas::ObjectRef BaseKey,
const FrontendInputsAndOutputs &InputsAndOutputs,
FrontendOptions::ActionType Action) {
return makeIntrusiveRefCnt<SwiftCASOutputBackend>(CAS, Cache, BaseKey,
InputsAndOutputs, Action);
const FrontendOptions &Opts, FrontendOptions::ActionType Action) {
return makeIntrusiveRefCnt<SwiftCASOutputBackend>(
CAS, Cache, BaseKey, InputsAndOutputs, Opts, Action);
}

Error cas::CachedResultLoader::replay(CallbackTy Callback) {
Expand Down Expand Up @@ -197,6 +196,31 @@ bool replayCachedCompilerOutputs(
assert(!DiagnosticsOutput && "more than 1 diagnotics found");
DiagnosticsOutput.emplace(
OutputEntry{OutputPath->second, OutID, Kind, Input, *Proxy});
} else if (Kind == file_types::ID::TY_SymbolGraphFile &&
!Opts.SymbolGraphOutputDir.empty()) {
auto Err = Proxy->forEachReference([&](ObjectRef Ref) -> Error {
auto Proxy = CAS.getProxy(Ref);
if (!Proxy)
return Proxy.takeError();
auto PathRef = Proxy->getReference(0);
auto ContentRef = Proxy->getReference(1);
auto Path = CAS.getProxy(PathRef);
auto Content = CAS.getProxy(ContentRef);
if (!Path)
return Path.takeError();
if (!Content)
return Content.takeError();

SmallString<128> OutputPath(Opts.SymbolGraphOutputDir);
llvm::sys::path::append(OutputPath, Path->getData());

OutputProxies.emplace_back(OutputEntry{
std::string(OutputPath), OutID, Kind, Input, *Content});

return Error::success();
});
if (Err)
return Err;
} else
OutputProxies.emplace_back(
OutputEntry{OutputPath->second, OutID, Kind, Input, *Proxy});
Expand Down Expand Up @@ -234,6 +258,9 @@ bool replayCachedCompilerOutputs(
Outputs.try_emplace(file_types::ID::TY_CachedDiagnostics,
"<cached-diagnostics>");

// Add symbol graph entry for lookup. Output path doesn't matter here.
Outputs.try_emplace(file_types::ID::TY_SymbolGraphFile, "<symbol-graph>");

return replayOutputsForInputFile(Input, InputPath, InputIndex, Outputs);
};

Expand Down
1 change: 1 addition & 0 deletions lib/Frontend/Frontend.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -486,6 +486,7 @@ void CompilerInstance::setupOutputBackend() {
auto &InAndOuts = Invocation.getFrontendOptions().InputsAndOutputs;
CASOutputBackend = createSwiftCachingOutputBackend(
*CAS, *ResultCache, *CompileJobBaseKey, InAndOuts,
Invocation.getFrontendOptions(),
Invocation.getFrontendOptions().RequestedAction);

if (Invocation.getIRGenOptions().UseCASBackend) {
Expand Down
46 changes: 46 additions & 0 deletions test/CAS/symbol-graph.swift
Original file line number Diff line number Diff line change
@@ -0,0 +1,46 @@
// RUN: %empty-directory(%t)
// RUN: split-file %s %t

// RUN: %target-swift-frontend -scan-dependencies -module-name Test -module-cache-path %t/clang-module-cache -O \
// RUN: -parse-stdlib -disable-implicit-string-processing-module-import -disable-implicit-concurrency-module-import \
// RUN: %t/main.swift -o %t/deps.json -swift-version 5 -cache-compile-job -cas-path %t/cas -I %t/include \
// RUN: -emit-symbol-graph -emit-symbol-graph-dir %t/symbol-graph1

// RUN: %{python} %S/Inputs/BuildCommandExtractor.py %t/deps.json A > %t/A.cmd
// RUN: %swift_frontend_plain @%t/A.cmd

// RUN: %{python} %S/Inputs/BuildCommandExtractor.py %t/deps.json Test > %t/Test.cmd
// RUN: %target-swift-frontend -module-name Test -module-cache-path %t/clang-module-cache -O \
// RUN: -parse-stdlib -disable-implicit-string-processing-module-import -disable-implicit-concurrency-module-import \
// RUN: %t/main.swift -o %t/Test.swiftmodule -swift-version 5 -cache-compile-job -cas-path %t/cas -I %t/include \
// RUN: -emit-symbol-graph -emit-symbol-graph-dir %t/symbol-graph1 \
// RUN: -emit-module @%t/Test.cmd -Rcache-compile-job 2>&1 | %FileCheck %s --check-prefix=CACHE-MISS

// CACHE-MISS: remark: cache miss for input

// RUN: %{python} %S/Inputs/BuildCommandExtractor.py %t/deps.json Test > %t/Test.cmd
// RUN: %target-swift-frontend -module-name Test -module-cache-path %t/clang-module-cache -O \
// RUN: -parse-stdlib -disable-implicit-string-processing-module-import -disable-implicit-concurrency-module-import \
// RUN: %t/main.swift -o %t/Test.swiftmodule -swift-version 5 -cache-compile-job -cas-path %t/cas -I %t/include \
// RUN: -emit-symbol-graph -emit-symbol-graph-dir %t/symbol-graph2 \
// RUN: -emit-module @%t/Test.cmd -Rcache-compile-job 2>&1 | %FileCheck %s --check-prefix=CACHE-MISS

// CACHE-HIT: remark: replay output file '{{.*}}{{/|\\}}symbol-graph2{{/|\\}}Test.symbols.json': key 'llvmcas://{{.*}}'
// CACHE-HIT: remark: replay output file '{{.*}}{{/|\\}}symbol-graph2{{/|\\}}[email protected]': key 'llvmcas://{{.*}}'

// RUN: diff -r -u %t/symbol-graph1 %t/symbol-graph2

//--- include/A.swiftinterface
// swift-interface-format-version: 1.0
// swift-module-flags: -module-name A -O -disable-implicit-string-processing-module-import -disable-implicit-concurrency-module-import -parse-stdlib -user-module-version 1.0

public struct A {}

//--- main.swift
import A

public struct Foo {}

extension A {
public func bar() {}
}