Files
swift-mirror/lib/Frontend/CASOutputBackends.cpp
Steven Wu 76bde39ee7 [Caching] Encoding cache key for input file with index instead of path
Avoid path encoding difference (for example, real_path vs. path from
symlink) by eliminating the path from cache key. Cache key is now
encoded with the index of the input file from all the input files from
the command-line, reguardless if those inputs will produce output or
not. This is to ensure stable ordering even the batching is different.

Add a new cache computation API that is preferred for using input index
directly. Old API for cache key is deprecated but still updated to
fallback to real_path comparsion if needed.

As a result of swift scan API change, rename the feature in JSON file to
avoid version confusion between swift-driver and libSwiftScan.

rdar://119387650
2023-12-18 14:06:00 -08:00

265 lines
9.7 KiB
C++

//===--- CASOutputBackends.cpp ----------------------------------*- C++ -*-===//
//
// This source file is part of the Swift.org open source project
//
// Copyright (c) 2014 - 2018 Apple Inc. and the Swift project authors
// Licensed under Apache License v2.0 with Runtime Library Exception
//
// See https://swift.org/LICENSE.txt for license information
// See https://swift.org/CONTRIBUTORS.txt for the list of Swift project authors
//
//===----------------------------------------------------------------------===//
#include "swift/Frontend/CASOutputBackends.h"
#include "swift/Basic/FileTypes.h"
#include "swift/Frontend/CachingUtils.h"
#include "swift/Frontend/CompileJobCacheKey.h"
#include "swift/Frontend/CompileJobCacheResult.h"
#include "clang/Frontend/CompileJobCacheResult.h"
#include "llvm/ADT/STLExtras.h"
#include "llvm/CAS/HierarchicalTreeBuilder.h"
#include "llvm/CAS/ObjectStore.h"
#include "llvm/Support/Debug.h"
#include <optional>
#define DEBUG_TYPE "swift-cas-backend"
using namespace swift;
using namespace llvm;
using namespace llvm::cas;
using namespace llvm::vfs;
namespace {
class SwiftCASOutputFile final : public OutputFileImpl {
public:
Error keep() override { return OnKeep(Path, Bytes); }
Error discard() override { return Error::success(); }
raw_pwrite_stream &getOS() override { return OS; }
using OnKeepType = llvm::unique_function<Error(StringRef, StringRef)>;
SwiftCASOutputFile(StringRef Path, OnKeepType OnKeep)
: Path(Path.str()), OS(Bytes), OnKeep(std::move(OnKeep)) {}
private:
std::string Path;
SmallString<16> Bytes;
raw_svector_ostream OS;
OnKeepType OnKeep;
};
} // namespace
namespace swift::cas {
void SwiftCASOutputBackend::anchor() {}
class SwiftCASOutputBackend::Implementation {
public:
Implementation(ObjectStore &CAS, ActionCache &Cache, ObjectRef BaseKey,
const FrontendInputsAndOutputs &InputsAndOutputs,
FrontendOptions::ActionType Action)
: CAS(CAS), Cache(Cache), BaseKey(BaseKey),
InputsAndOutputs(InputsAndOutputs), Action(Action) {
initBackend(InputsAndOutputs);
}
llvm::Expected<std::unique_ptr<llvm::vfs::OutputFileImpl>>
createFileImpl(llvm::StringRef ResolvedPath,
llvm::Optional<llvm::vfs::OutputConfig> Config) {
auto ProducingInput = OutputToInputMap.find(ResolvedPath);
assert(ProducingInput != OutputToInputMap.end() && "Unknown output file");
unsigned InputIndex = ProducingInput->second.first;
auto OutputType = ProducingInput->second.second;
// Uncached output kind.
if (file_types::isProducedFromDiagnostics(OutputType))
return std::make_unique<llvm::vfs::NullOutputFileImpl>();
return std::make_unique<SwiftCASOutputFile>(
ResolvedPath,
[this, InputIndex, OutputType](StringRef Path,
StringRef Bytes) -> Error {
return storeImpl(Path, Bytes, InputIndex, OutputType);
});
}
void initBackend(const FrontendInputsAndOutputs &InputsAndOutputs);
Error storeImpl(StringRef Path, StringRef Bytes, unsigned InputIndex,
file_types::ID OutputKind);
Error finalizeCacheKeysFor(unsigned InputIndex);
private:
friend class SwiftCASOutputBackend;
ObjectStore &CAS;
ActionCache &Cache;
ObjectRef BaseKey;
const FrontendInputsAndOutputs &InputsAndOutputs;
FrontendOptions::ActionType Action;
// Map from output path to the input index and output kind.
StringMap<std::pair<unsigned, file_types::ID>> OutputToInputMap;
// A vector of output refs where the index is the input index.
SmallVector<DenseMap<file_types::ID, ObjectRef>> OutputRefs;
};
SwiftCASOutputBackend::SwiftCASOutputBackend(
ObjectStore &CAS, ActionCache &Cache, ObjectRef BaseKey,
const FrontendInputsAndOutputs &InputsAndOutputs,
FrontendOptions::ActionType Action)
: Impl(*new SwiftCASOutputBackend::Implementation(
CAS, Cache, BaseKey, InputsAndOutputs, Action)) {}
SwiftCASOutputBackend::~SwiftCASOutputBackend() { delete &Impl; }
IntrusiveRefCntPtr<OutputBackend> SwiftCASOutputBackend::cloneImpl() const {
return makeIntrusiveRefCnt<SwiftCASOutputBackend>(
Impl.CAS, Impl.Cache, Impl.BaseKey, Impl.InputsAndOutputs, Impl.Action);
}
Expected<std::unique_ptr<OutputFileImpl>>
SwiftCASOutputBackend::createFileImpl(StringRef ResolvedPath,
Optional<OutputConfig> Config) {
return Impl.createFileImpl(ResolvedPath, Config);
}
file_types::ID SwiftCASOutputBackend::getOutputFileType(StringRef Path) const {
return file_types::lookupTypeForExtension(llvm::sys::path::extension(Path));
}
Error SwiftCASOutputBackend::storeImpl(StringRef Path, StringRef Bytes,
unsigned InputIndex,
file_types::ID OutputKind) {
return Impl.storeImpl(Path, Bytes, InputIndex, OutputKind);
}
Error SwiftCASOutputBackend::storeCachedDiagnostics(unsigned InputIndex,
StringRef Bytes) {
return storeImpl("<cached-diagnostics>", Bytes, InputIndex,
file_types::ID::TY_CachedDiagnostics);
}
void SwiftCASOutputBackend::Implementation::initBackend(
const FrontendInputsAndOutputs &InputsAndOutputs) {
// FIXME: The output to input map might not be enough for example all the
// outputs can be written to `-`, but the backend cannot distinguish which
// input it actually comes from. Maybe the solution is just not to cache
// any commands write output to `-`.
file_types::ID mainOutputType = InputsAndOutputs.getPrincipalOutputType();
auto addInput = [&](const InputFile &Input, unsigned Index) {
if (!Input.outputFilename().empty())
OutputToInputMap.insert(
{Input.outputFilename(), {Index, mainOutputType}});
Input.getPrimarySpecificPaths()
.SupplementaryOutputs.forEachSetOutputAndType(
[&](const std::string &Out, file_types::ID ID) {
if (!file_types::isProducedFromDiagnostics(ID))
OutputToInputMap.insert({Out, {Index, ID}});
});
};
for (unsigned idx = 0; idx < InputsAndOutputs.getAllInputs().size(); ++idx)
addInput(InputsAndOutputs.getAllInputs()[idx], idx);
// FIXME: Cached diagnostics is associated with the first output producing
// input file.
OutputToInputMap.insert(
{"<cached-diagnostics>",
{InputsAndOutputs.getIndexOfFirstOutputProducingInput(),
file_types::TY_CachedDiagnostics}});
// Resize the output refs to hold all inputs.
OutputRefs.resize(InputsAndOutputs.getAllInputs().size());
}
Error SwiftCASOutputBackend::Implementation::storeImpl(
StringRef Path, StringRef Bytes, unsigned InputIndex,
file_types::ID OutputKind) {
Optional<ObjectRef> BytesRef;
if (Error E = CAS.storeFromString(None, Bytes).moveInto(BytesRef))
return E;
LLVM_DEBUG(llvm::dbgs() << "DEBUG: producing CAS output of type \'"
<< file_types::getTypeName(OutputKind)
<< "\' for input \'" << InputIndex << "\': \'"
<< CAS.getID(*BytesRef).toString() << "\'\n";);
OutputRefs[InputIndex].insert({OutputKind, *BytesRef});
return finalizeCacheKeysFor(InputIndex);
}
Error SwiftCASOutputBackend::Implementation::finalizeCacheKeysFor(
unsigned InputIndex) {
auto ProducedOutputs = OutputRefs[InputIndex];
assert(!ProducedOutputs.empty() && "Expect outputs for this input");
// If not all outputs for the input are emitted, return.
if (!llvm::all_of(OutputToInputMap, [&](auto &E) {
return (E.second.first != InputIndex ||
ProducedOutputs.count(E.second.second));
}))
return Error::success();
std::vector<std::pair<file_types::ID, ObjectRef>> OutputsForInput;
llvm::for_each(ProducedOutputs, [&OutputsForInput](auto E) {
OutputsForInput.emplace_back(E.first, E.second);
});
// Sort to a stable ordering for deterministic output cache object.
llvm::sort(OutputsForInput,
[](auto &LHS, auto &RHS) { return LHS.first < RHS.first; });
Optional<ObjectRef> Result;
// Use a clang compatible result CAS object schema when emiting PCM.
if (Action == FrontendOptions::ActionType::EmitPCM) {
clang::cas::CompileJobCacheResult::Builder Builder;
for (auto &Outs : OutputsForInput) {
if (Outs.first == file_types::ID::TY_ClangModuleFile)
Builder.addOutput(
clang::cas::CompileJobCacheResult::OutputKind::MainOutput,
Outs.second);
else if (Outs.first == file_types::ID::TY_CachedDiagnostics)
Builder.addOutput(clang::cas::CompileJobCacheResult::OutputKind::
SerializedDiagnostics,
Outs.second);
else if (Outs.first == file_types::ID::TY_Dependencies)
Builder.addOutput(
clang::cas::CompileJobCacheResult::OutputKind::Dependencies,
Outs.second);
else
llvm_unreachable("Unexpected output when compiling clang module");
}
if (auto Err = Builder.build(CAS).moveInto(Result))
return Err;
} else {
swift::cas::CompileJobCacheResult::Builder Builder;
for (auto &Outs : OutputsForInput)
Builder.addOutput(Outs.first, Outs.second);
if (auto Err = Builder.build(CAS).moveInto(Result))
return Err;
}
auto CacheKey = createCompileJobCacheKeyForOutput(CAS, BaseKey, InputIndex);
if (!CacheKey)
return CacheKey.takeError();
LLVM_DEBUG(llvm::dbgs() << "DEBUG: writing cache entry for input \'"
<< InputIndex << "\': \'"
<< CAS.getID(*CacheKey).toString() << "\' => \'"
<< CAS.getID(*Result).toString() << "\'\n";);
if (auto E = Cache.put(CAS.getID(*CacheKey), CAS.getID(*Result)))
return E;
return Error::success();
}
} // end namespace swift::cas