mirror of
https://github.com/apple/swift.git
synced 2025-12-14 20:36:38 +01:00
When we miss the in-memory (libcache-based) code completion cache, we can now chain to an on-disk code completion cache. This drastically improves the time and peak memory usage of the first code completion (i.e. before the in-memory cache is warm) if we've done the same lookup before. The on-disk cache, like the in-memory cache, is tied to the specific compiled Swift and Clang module files (.swiftmodule and .pcm), and will consider itself out of date if they are modified. Responsibility for deleting completely dead/unreachable cache files falls to the client. Most of this commit adds simple serialization and deserialization for CodeCompletionResults and CodeCompletionStrings. The format is very simple: an array of fixed-size CodeCompletionResults, with offsets into two blobs, one for CodeCompletionString::Chunks and one for strings. Currently that gives us about 5.8 MB for all the results in Cocoa, but it's very compressible if we decide we want to reduce it (gzipped, it is ~1.2 MB for the same data). Swift SVN r28369
448 lines
15 KiB
C++
448 lines
15 KiB
C++
#include "swift/IDE/CodeCompletionCache.h"
|
|
#include "swift/Basic/Cache.h"
|
|
#include "llvm/ADT/APInt.h"
|
|
#include "llvm/ADT/Hashing.h"
|
|
#include "llvm/Support/EndianStream.h"
|
|
#include "llvm/Support/FileSystem.h"
|
|
#include "llvm/Support/MemoryBuffer.h"
|
|
#include "llvm/Support/Path.h"
|
|
|
|
using namespace swift;
|
|
using namespace ide;
|
|
|
|
namespace swift {
|
|
namespace ide {
|
|
struct CodeCompletionCacheImpl {
|
|
using Key = CodeCompletionCache::Key;
|
|
using Value = CodeCompletionCache::Value;
|
|
using ValueRefCntPtr = CodeCompletionCache::ValueRefCntPtr;
|
|
sys::Cache<Key, ValueRefCntPtr> TheCache{"swift.libIDE.CodeCompletionCache"};
|
|
};
|
|
} // end namespace ide
|
|
} // end namespace swift
|
|
|
|
namespace swift {
|
|
namespace sys {
|
|
template<>
|
|
struct CacheValueCostInfo<swift::ide::CodeCompletionCacheImpl::Value> {
|
|
static size_t
|
|
getCost(const swift::ide::CodeCompletionCacheImpl::Value &V) {
|
|
return V.Sink.Allocator->getTotalMemory();
|
|
}
|
|
};
|
|
} // namespace sys
|
|
} // namespace swift
|
|
|
|
/// Allocates a new, empty Value and hands it back wrapped in a
/// reference-counting pointer.
CodeCompletionCache::ValueRefCntPtr CodeCompletionCache::createValue() {
  ValueRefCntPtr fresh(new Value);
  return fresh;
}
|
|
|
|
/// Looks up \p K in the in-memory cache, falling back to the chained cache
/// (if there is one) on a miss.
///
/// An in-memory hit is only returned if the module file named by the key can
/// still be stat'ed and its modification time equals the one recorded in the
/// cached value; otherwise the entry is evicted and None is returned. A hit in
/// the chained cache is copied into the in-memory cache before it is returned.
Optional<CodeCompletionCache::ValueRefCntPtr>
CodeCompletionCache::get(const Key &K) {
  auto &memoryCache = Impl->TheCache;
  llvm::Optional<ValueRefCntPtr> cached = memoryCache.get(K);

  if (!cached) {
    // In-memory miss: consult the chained cache, if any.
    if (nextCache) {
      cached = nextCache->get(K);
      if (cached) {
        // Hit the chained cache. Update our own cache to match, without
        // writing the value back to the cache it just came from.
        setImpl(K, *cached, /*setChain*/ false);
      }
    }
    return cached;
  }

  // In-memory hit: check whether the entry is still up to date.
  llvm::sys::fs::file_status moduleInfo;
  const bool isStale =
      llvm::sys::fs::status(K.ModuleFilename, moduleInfo) ||
      cached.getValue()->ModuleModificationTime !=
          moduleInfo.getLastModificationTime();
  if (isStale) {
    cached = None;
    memoryCache.remove(K);
  }
  return cached;
}
|
|
|
|
void CodeCompletionCache::setImpl(const Key &K, ValueRefCntPtr V,
|
|
bool setChain) {
|
|
{
|
|
assert(!K.ModuleFilename.empty());
|
|
|
|
llvm::sys::fs::file_status ModuleStatus;
|
|
if (llvm::sys::fs::status(K.ModuleFilename, ModuleStatus)) {
|
|
V->ModuleModificationTime = llvm::sys::TimeValue::now();
|
|
return;
|
|
} else {
|
|
V->ModuleModificationTime = ModuleStatus.getLastModificationTime();
|
|
}
|
|
}
|
|
Impl->TheCache.set(K, V);
|
|
|
|
// FIXME: we could write the results to disk in the background, since they're
|
|
// immutable at this point.
|
|
if (nextCache && setChain)
|
|
nextCache->set(K, V);
|
|
}
|
|
|
|
/// Creates a cache with fresh in-memory state that chains to \p nextCache.
/// Other members of this class test \p nextCache for null before using it.
CodeCompletionCache::CodeCompletionCache(OnDiskCodeCompletionCache *nextCache)
    : Impl(new CodeCompletionCacheImpl()),
      nextCache(nextCache) {
}
|
|
|
|
/// Destructor, defined out of line in this file with an empty body.
// NOTE(review): presumably defined here so that CodeCompletionCacheImpl is a
// complete type where Impl is destroyed; confirm against the header.
CodeCompletionCache::~CodeCompletionCache() {}
|
|
|
|
/// Format version of the serialized code completion results.
///
/// Bump this whenever a committed change alters the layout of the cached
/// results; that is not expected to happen often. The writer stores this value
/// at the start of every cache file, and the reader rejects any file whose
/// stored version differs.
static constexpr uint32_t onDiskCompletionCacheVersion = 0;
|
|
|
|
/// Copies the bytes of \p Str into memory obtained from \p Allocator and
/// returns a StringRef over the copy. No terminator is appended.
static StringRef copyString(llvm::BumpPtrAllocator &Allocator, StringRef Str) {
  const size_t length = Str.size();
  char *storage = Allocator.Allocate<char>(length);
  std::copy(Str.begin(), Str.end(), storage);
  return StringRef(storage, length);
}
|
|
|
|
/// Copies the StringRef elements of \p Arr into an array obtained from
/// \p Allocator and returns a view of that array.
///
/// Only the StringRef objects are copied; the character data they refer to is
/// not duplicated.
static ArrayRef<StringRef> copyStringArray(llvm::BumpPtrAllocator &Allocator,
                                           ArrayRef<StringRef> Arr) {
  const size_t count = Arr.size();
  StringRef *storage = Allocator.Allocate<StringRef>(count);
  std::copy(Arr.begin(), Arr.end(), storage);
  return ArrayRef<StringRef>(storage, count);
}
|
|
|
|
/// Deserializes CodeCompletionResults from \p in and stores them in \p V.
|
|
/// \see writeCacheModule.
|
|
static bool readCachedModule(llvm::MemoryBuffer *in,
|
|
const CodeCompletionCache::Key &K,
|
|
CodeCompletionCache::Value &V,
|
|
bool allowOutOfDate = false) {
|
|
const char *cursor = in->getBufferStart();
|
|
const char *end = in->getBufferEnd();
|
|
|
|
auto read32le = [end](const char *&cursor) {
|
|
auto result = llvm::support::endian::read32le(cursor);
|
|
cursor += sizeof(result);
|
|
assert(cursor <= end);
|
|
return result;
|
|
};
|
|
|
|
// HEADER
|
|
{
|
|
auto version = read32le(cursor);
|
|
if (version != onDiskCompletionCacheVersion)
|
|
return false; // File written with different format.
|
|
|
|
auto mtime = llvm::support::endian::read64le(cursor);
|
|
cursor += sizeof(mtime);
|
|
|
|
// Check the module file's last modification time.
|
|
if (!allowOutOfDate) {
|
|
llvm::sys::fs::file_status status;
|
|
if (llvm::sys::fs::status(K.ModuleFilename, status) ||
|
|
status.getLastModificationTime().toEpochTime() != mtime) {
|
|
return false; // Out of date, or doesn't exist.
|
|
}
|
|
}
|
|
}
|
|
|
|
// DEBUG INFO
|
|
cursor += read32le(cursor); // Skip the whole debug section.
|
|
|
|
// Get the size of the various sections.
|
|
auto resultSize = read32le(cursor);
|
|
const char *resultEnd = cursor + resultSize;
|
|
const char *chunks = resultEnd;
|
|
auto chunkSize = read32le(chunks);
|
|
const char *strings = chunks + chunkSize;
|
|
auto stringCount = read32le(strings);
|
|
assert(strings + stringCount == end && "incorrect file size");
|
|
|
|
// STRINGS
|
|
auto getString = [&](uint32_t index) -> StringRef {
|
|
if (index == ~0u)
|
|
return "";
|
|
|
|
const char *p = strings + index;
|
|
auto size = read32le(p);
|
|
return copyString(*V.Sink.Allocator, StringRef(p, size));
|
|
};
|
|
|
|
// CHUNKS
|
|
auto getCompletionString = [&](uint32_t chunkIndex) {
|
|
const char *p = chunks + chunkIndex;
|
|
auto len = read32le(p);
|
|
using Chunk = CodeCompletionString::Chunk;
|
|
SmallVector<Chunk, 32> chunkList;
|
|
for (unsigned j = 0; j < len; ++j) {
|
|
auto kind = static_cast<Chunk::ChunkKind>(*p++);
|
|
auto nest = *p++;
|
|
auto isAnnotation = static_cast<bool>(*p++);
|
|
auto textIndex = read32le(p);
|
|
auto text = getString(textIndex);
|
|
|
|
if (Chunk::chunkHasText(kind)) {
|
|
chunkList.push_back(
|
|
Chunk::createWithText(kind, nest, text, isAnnotation));
|
|
} else {
|
|
chunkList.push_back(Chunk::createSimple(kind, nest, isAnnotation));
|
|
}
|
|
}
|
|
|
|
return CodeCompletionString::create(*V.Sink.Allocator, chunkList);
|
|
};
|
|
|
|
// RESULTS
|
|
while (cursor != resultEnd) {
|
|
auto kind = static_cast<CodeCompletionResult::ResultKind>(*cursor++);
|
|
auto declKind = static_cast<CodeCompletionDeclKind>(*cursor++);
|
|
auto context = static_cast<SemanticContextKind>(*cursor++);
|
|
auto notRecommended = static_cast<bool>(*cursor++);
|
|
auto numBytesToErase = static_cast<unsigned>(*cursor++);
|
|
auto chunkIndex = read32le(cursor);
|
|
auto moduleIndex = read32le(cursor);
|
|
auto briefDocIndex = read32le(cursor);
|
|
auto assocUSRCount = read32le(cursor);
|
|
auto assocUSRsIndex = read32le(cursor);
|
|
|
|
CodeCompletionString *string = getCompletionString(chunkIndex);
|
|
auto moduleName = getString(moduleIndex);
|
|
auto briefDocComment = getString(briefDocIndex);
|
|
SmallVector<StringRef, 4> assocUSRs;
|
|
for (unsigned i = 0; i < assocUSRCount; ++i) {
|
|
auto usr = getString(assocUSRsIndex);
|
|
assocUSRs.push_back(usr);
|
|
assocUSRsIndex += usr.size();
|
|
}
|
|
|
|
CodeCompletionResult *result = nullptr;
|
|
if (kind == CodeCompletionResult::Declaration) {
|
|
result = new (*V.Sink.Allocator)
|
|
CodeCompletionResult(context, numBytesToErase, string, declKind,
|
|
moduleName, notRecommended, briefDocComment,
|
|
copyStringArray(*V.Sink.Allocator, assocUSRs));
|
|
} else {
|
|
result = new (*V.Sink.Allocator)
|
|
CodeCompletionResult(kind, context, numBytesToErase, string);
|
|
}
|
|
|
|
V.Sink.Results.push_back(result);
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
/// Writes the code completion results from the sink for \p V to \p out.
|
|
///
|
|
/// The high-level format is:
|
|
///
|
|
/// HEADER
|
|
/// * version, which **must be bumped** if we change the format!
|
|
/// * mtime for the module file
|
|
///
|
|
/// KEY
|
|
/// * the original CodeCompletionCache::Key, used for debugging the cache.
|
|
///
|
|
/// RESULTS
|
|
/// * A length-prefixed array of fixed size CodeCompletionResults.
|
|
/// * Contains offsets into CHUNKS and STRINGS.
|
|
///
|
|
/// CHUNKS
|
|
/// * A length-prefixed array of CodeCompletionStrings.
|
|
/// * Each CodeCompletionString is a length-prefixed array of fixed size
|
|
/// CodeCompletionString::Chunks.
|
|
///
|
|
/// STRINGS
|
|
/// * A blob of length-prefixed strings referred to in CHUNKS or RESULTS.
|
|
static void writeCachedModule(llvm::raw_ostream &out,
|
|
const CodeCompletionCache::Key &K,
|
|
CodeCompletionCache::Value &V) {
|
|
using namespace llvm::support;
|
|
endian::Writer<little> LE(out);
|
|
|
|
// HEADER
|
|
// Metadata required for reading the completions.
|
|
LE.write(onDiskCompletionCacheVersion); // Version
|
|
LE.write(V.ModuleModificationTime.toEpochTime()); // Mtime for module file
|
|
|
|
// KEY
|
|
// We don't need the stored key to load the results, but it is useful if we
|
|
// want to debug the cache itself.
|
|
{
|
|
SmallString<256> scratch;
|
|
llvm::raw_svector_ostream OSS(scratch);
|
|
OSS << K.ModuleFilename << "\0";
|
|
OSS << K.ModuleName << "\0";
|
|
endian::Writer<little> OSSLE(OSS);
|
|
OSSLE.write(K.AccessPath.size());
|
|
for (StringRef p : K.AccessPath)
|
|
OSS << p << "\0";
|
|
OSSLE.write(K.ResultsHaveLeadingDot);
|
|
OSSLE.write(K.ForTestableLookup);
|
|
LE.write(static_cast<uint32_t>(OSS.tell())); // Size of debug info
|
|
out.write(OSS.str().data(), OSS.str().size()); // Debug info blob
|
|
}
|
|
|
|
// String streams for writing to the CHUNKS and STRINGS sections.
|
|
std::string results_;
|
|
llvm::raw_string_ostream results(results_);
|
|
std::string chunks_;
|
|
llvm::raw_string_ostream chunks(chunks_);
|
|
endian::Writer<little> chunksLE(chunks);
|
|
std::string strings_;
|
|
llvm::raw_string_ostream strings(strings_);
|
|
|
|
auto addString = [&strings](StringRef str) {
|
|
if (str.empty())
|
|
return ~0u;
|
|
auto size = strings.tell();
|
|
endian::Writer<little> LE(strings);
|
|
LE.write(static_cast<uint32_t>(str.size()));
|
|
strings << str;
|
|
return static_cast<uint32_t>(size);
|
|
};
|
|
|
|
auto addCompletionString = [&](const CodeCompletionString *str) {
|
|
auto size = chunks.tell();
|
|
chunksLE.write(static_cast<uint32_t>(str->getChunks().size()));
|
|
for (auto chunk : str->getChunks()) {
|
|
chunksLE.write(static_cast<uint8_t>(chunk.getKind()));
|
|
chunksLE.write(static_cast<uint8_t>(chunk.getNestingLevel()));
|
|
chunksLE.write(static_cast<uint8_t>(chunk.isAnnotation()));
|
|
if (chunk.hasText()) {
|
|
chunksLE.write(addString(chunk.getText()));
|
|
} else {
|
|
chunksLE.write(static_cast<uint32_t>(~0u));
|
|
}
|
|
}
|
|
return static_cast<uint32_t>(size);
|
|
};
|
|
|
|
// RESULTS
|
|
{
|
|
endian::Writer<little> LE(results);
|
|
for (CodeCompletionResult *R : V.Sink.Results) {
|
|
// FIXME: compress bitfield
|
|
LE.write(static_cast<uint8_t>(R->getKind()));
|
|
if (R->getKind() == CodeCompletionResult::Declaration)
|
|
LE.write(static_cast<uint8_t>(R->getAssociatedDeclKind()));
|
|
else
|
|
LE.write(static_cast<uint8_t>(~0u));
|
|
LE.write(static_cast<uint8_t>(R->getSemanticContext()));
|
|
LE.write(static_cast<uint8_t>(R->isNotRecommended()));
|
|
LE.write(static_cast<uint8_t>(R->getNumBytesToErase()));
|
|
LE.write(
|
|
static_cast<uint32_t>(addCompletionString(R->getCompletionString())));
|
|
LE.write(addString(R->getModuleName())); // index into strings
|
|
LE.write(addString(R->getBriefDocComment())); // index into strings
|
|
LE.write(static_cast<uint32_t>(R->getAssociatedUSRs().size()));
|
|
if (R->getAssociatedUSRs().empty()) {
|
|
LE.write(static_cast<uint32_t>(~0u));
|
|
} else {
|
|
LE.write(addString(R->getAssociatedUSRs()[0]));
|
|
for (unsigned i = 1; i < R->getAssociatedUSRs().size(); ++i) {
|
|
addString(R->getAssociatedUSRs()[i]); // ignore result
|
|
}
|
|
}
|
|
}
|
|
}
|
|
LE.write(static_cast<uint32_t>(results.tell()));
|
|
out << results.str();
|
|
|
|
// CHUNKS
|
|
LE.write(static_cast<uint32_t>(chunks.tell()));
|
|
out << chunks.str();
|
|
|
|
// STRINGS
|
|
LE.write(static_cast<uint32_t>(strings.tell()));
|
|
out << strings.str();
|
|
}
|
|
|
|
/// Get the name for the cached code completion results for a given key \p K in
|
|
/// \p cacheDirectory.
|
|
///
|
|
/// This name is unique (modulo hash collisions) to the key \p K.
|
|
static std::string getName(StringRef cacheDirectory,
|
|
const CodeCompletionCache::Key &K) {
|
|
SmallString<128> name(cacheDirectory);
|
|
|
|
// cacheDirectory/ModuleName
|
|
llvm::sys::path::append(name, K.ModuleName);
|
|
llvm::raw_svector_ostream OSS(name);
|
|
|
|
// name[-dot][-testable]
|
|
OSS << (K.ResultsHaveLeadingDot ? "-dot" : "")
|
|
<< (K.ForTestableLookup ? "-testable" : "");
|
|
|
|
// name[-access-path-components]
|
|
for (StringRef component : K.AccessPath)
|
|
OSS << "-" << component;
|
|
|
|
// name-<hash of module filename>
|
|
auto hash = llvm::hash_value(K.ModuleFilename);
|
|
SmallString<16> hashStr;
|
|
llvm::APInt(64, uint64_t(hash)).toStringUnsigned(hashStr, /*Radix*/ 36);
|
|
OSS << "-" << hashStr << ".completions";
|
|
|
|
OSS.flush();
|
|
return name.str();
|
|
}
|
|
|
|
/// Loads the cached results for \p K from the cache directory.
///
/// \returns None if the cache file cannot be opened or if readCachedModule
///          rejects it (for example because it is out of date); otherwise the
///          deserialized value.
Optional<CodeCompletionCache::ValueRefCntPtr>
OnDiskCodeCompletionCache::get(const Key &K) {
  // Try to find the cached file.
  const std::string path = getName(cacheDirectory, K);
  auto fileContents = llvm::MemoryBuffer::getFile(path);
  if (!fileContents)
    return None;

  // Read the cached results, failing if they are out of date.
  auto loadedValue = CodeCompletionCache::createValue();
  const bool loaded =
      readCachedModule(fileContents.get().get(), K, *loadedValue);
  if (loaded)
    return loadedValue;

  return None;
}
|
|
|
|
std::error_code OnDiskCodeCompletionCache::set(const Key &K, ValueRefCntPtr V) {
|
|
if (K.ModuleFilename.empty())
|
|
return std::make_error_code(std::errc::no_such_file_or_directory);
|
|
|
|
// Create the cache directory if it doesn't exist.
|
|
if (auto err = llvm::sys::fs::create_directories(cacheDirectory))
|
|
return err;
|
|
|
|
std::string name = getName(cacheDirectory, K);
|
|
|
|
// Create a temporary file to write the results into.
|
|
SmallString<128> tmpName(name + "-%%%%%%");
|
|
int tmpFD;
|
|
if (auto err = llvm::sys::fs::createUniqueFile(tmpName.str(), tmpFD, tmpName))
|
|
return err;
|
|
|
|
// Write the contents of the buffer.
|
|
llvm::raw_fd_ostream out(tmpFD, /*shouldClose=*/true);
|
|
writeCachedModule(out, K, *V);
|
|
out.flush();
|
|
if (out.has_error())
|
|
return std::make_error_code(std::errc::io_error);
|
|
|
|
// Atomically rename the file into its final location.
|
|
return llvm::sys::fs::rename(tmpName.str(), name);
|
|
}
|
|
|
|
/// Loads cached results directly from the cache file \p filename, without
/// checking whether they are out of date.
///
/// \returns None if the file cannot be opened or if readCachedModule rejects
///          it; otherwise the deserialized value.
Optional<CodeCompletionCache::ValueRefCntPtr>
OnDiskCodeCompletionCache::getFromFile(StringRef filename) {
  // Try to find the cached file.
  auto fileContents = llvm::MemoryBuffer::getFile(filename);
  if (!fileContents)
    return None;

  // Make up a key for readCachedModule. It is passed allowOutOfDate, so the
  // module filename stored in this key is not used for a freshness check.
  CodeCompletionCache::Key K{filename, "<module-name>", {}, false, false};

  // Read the cached results.
  auto loadedValue = CodeCompletionCache::createValue();
  const bool loaded = readCachedModule(fileContents.get().get(), K,
                                       *loadedValue, /*allowOutOfDate*/ true);
  if (loaded)
    return loadedValue;

  return None;
}
|
|
|
|
/// Creates an on-disk cache rooted at \p cacheDirectory. The path is stored as
/// a string; nothing is touched on disk here.
OnDiskCodeCompletionCache::OnDiskCodeCompletionCache(Twine cacheDirectory)
    : cacheDirectory(cacheDirectory.str()) {
}
|
|
|
|
/// Destructor, defined out of line in this file with an empty body. It does
/// not remove any cache files.
OnDiskCodeCompletionCache::~OnDiskCodeCompletionCache() {}
|