Files
swift-mirror/include/swift/Basic/SourceManager.h
Doug Gregor 5c217bd17c Add source buffers pretty-printed for diagnostics to serialized diagnostics
When emitting a diagnostic that references a declaration that does not
itself have a source location (e.g., because it was synthesized or
deserialized), the diagnostics engine pretty-prints the declaration
into a buffer so it can provide caret diagnostics pointing to that
declaration.

Start marking those buffers as "generated source buffers", so that we
emit their contents into serialized diagnostics files. This will allow
tools that make use of serialized diagnostics to also show caret
information.
2023-01-06 11:17:29 -08:00

383 lines
14 KiB
C++

//===--- SourceManager.h - Manager for Source Buffers -----------*- C++ -*-===//
//
// This source file is part of the Swift.org open source project
//
// Copyright (c) 2014 - 2017 Apple Inc. and the Swift project authors
// Licensed under Apache License v2.0 with Runtime Library Exception
//
// See https://swift.org/LICENSE.txt for license information
// See https://swift.org/CONTRIBUTORS.txt for the list of Swift project authors
//
//===----------------------------------------------------------------------===//
#ifndef SWIFT_BASIC_SOURCEMANAGER_H
#define SWIFT_BASIC_SOURCEMANAGER_H
#include "swift/Basic/FileSystem.h"
#include "swift/Basic/SourceLoc.h"
#include "clang/Basic/FileManager.h"
#include "llvm/ADT/DenseSet.h"
#include "llvm/ADT/Optional.h"
#include "llvm/Support/SourceMgr.h"
#include <map>
namespace swift {
class DeclContext;
/// Augments a buffer that was created specifically to hold generated source
/// code with the reasons for it being generated.
class GeneratedSourceInfo {
public:
/// The kind of generated source code.
enum Kind {
/// The expansion of a macro.
MacroExpansion,
/// A new function body that is replacing an existing function body.
ReplacedFunctionBody,
/// Pretty-printed declarations that have no source location.
PrettyPrinted,
} kind;
/// The buffer ID for the enclosing buffer, in which originalSourceRange
/// resides.
unsigned originalBufferID;
/// The source range in the enclosing buffer where this source was generated.
///
/// This could point at a macro expansion or at the implicit location at
/// which source code was generated. Conceptually, one can think of the
/// buffer described by a \c GeneratedSource instance as replacing the
/// code in the \c originalSourceRange.
SourceRange originalSourceRange;
/// The source range in the generated-source buffer where the generated
/// code exists. This might be a subrange of the buffer containing the
/// generated source, but it will never be from a different buffer.
SourceRange generatedSourceRange;
/// The opaque pointer for an ASTNode for which this buffer was generated.
void *astNode;
/// The declaration context in which this buffer logically resides.
DeclContext *declContext;
};
/// This class manages and owns source buffers.
class SourceManager {
public:
/// A \c #sourceLocation-defined virtual file region, representing the source
/// source after a \c #sourceLocation (or between two). It provides a
/// filename and line offset to be applied to \c SourceLoc's within its
/// \c Range.
struct VirtualFile {
CharSourceRange Range;
std::string Name;
int LineOffset;
};
private:
llvm::SourceMgr LLVMSourceMgr;
llvm::IntrusiveRefCntPtr<llvm::vfs::FileSystem> FileSystem;
unsigned IDEInspectionTargetBufferID = 0U;
unsigned IDEInspectionTargetOffset;
/// Associates buffer identifiers to buffer IDs.
llvm::DenseMap<StringRef, unsigned> BufIdentIDMap;
/// A cache mapping buffer identifiers to vfs Status entries.
///
/// This is as much a hack to prolong the lifetime of status objects as it is
/// to speed up stats.
mutable llvm::DenseMap<StringRef, llvm::vfs::Status> StatusCache;
/// Holds generated source information, indexed by the buffer ID.
llvm::DenseMap<unsigned, GeneratedSourceInfo> GeneratedSourceInfos;
/// Holds replaced ranges. Keys are original ranges, and values are new ranges
/// in different buffers. This is used for code completion and ASTContext
/// reusing compilation.
llvm::DenseMap<SourceRange, SourceRange> ReplacedRanges;
/// The starting source locations of regex literals written in source. This
/// is an unfortunate hack needed to allow for correct re-lexing.
llvm::DenseSet<SourceLoc> RegexLiteralStartLocs;
std::map<const char *, VirtualFile> VirtualFiles;
mutable std::pair<const char *, const VirtualFile*> CachedVFile = {nullptr, nullptr};
Optional<unsigned> findBufferContainingLocInternal(SourceLoc Loc) const;
public:
SourceManager(llvm::IntrusiveRefCntPtr<llvm::vfs::FileSystem> FS =
llvm::vfs::getRealFileSystem())
: FileSystem(FS) {}
llvm::SourceMgr &getLLVMSourceMgr() {
return LLVMSourceMgr;
}
const llvm::SourceMgr &getLLVMSourceMgr() const {
return LLVMSourceMgr;
}
void setFileSystem(llvm::IntrusiveRefCntPtr<llvm::vfs::FileSystem> FS) {
FileSystem = FS;
}
llvm::IntrusiveRefCntPtr<llvm::vfs::FileSystem> getFileSystem() const {
return FileSystem;
}
void setIDEInspectionTarget(unsigned BufferID, unsigned Offset) {
assert(BufferID != 0U && "Buffer should be valid");
IDEInspectionTargetBufferID = BufferID;
IDEInspectionTargetOffset = Offset;
}
bool hasIDEInspectionTargetBuffer() const {
return IDEInspectionTargetBufferID != 0U;
}
unsigned getIDEInspectionTargetBufferID() const {
return IDEInspectionTargetBufferID;
}
unsigned getIDEInspectionTargetOffset() const {
return IDEInspectionTargetOffset;
}
SourceLoc getIDEInspectionTargetLoc() const;
const llvm::DenseMap<SourceRange, SourceRange> &getReplacedRanges() const {
return ReplacedRanges;
}
/// Set the generated source information associated with a given buffer.
void setGeneratedSourceInfo(unsigned bufferID, GeneratedSourceInfo);
/// Retrieve the generated source information for the given buffer.
Optional<GeneratedSourceInfo> getGeneratedSourceInfo(unsigned bufferID) const;
/// Record the starting source location of a regex literal.
void recordRegexLiteralStartLoc(SourceLoc loc) {
RegexLiteralStartLocs.insert(loc);
}
/// Checks whether a given source location is for the start of a regex
/// literal.
bool isRegexLiteralStart(SourceLoc loc) const {
return RegexLiteralStartLocs.contains(loc);
}
/// Returns true if \c LHS is before \c RHS in the source buffer.
bool isBeforeInBuffer(SourceLoc LHS, SourceLoc RHS) const {
return LHS.Value.getPointer() < RHS.Value.getPointer();
}
/// Returns true if range \c R contains the location \c Loc. The location
/// \c Loc should point at the beginning of the token.
bool rangeContainsTokenLoc(SourceRange R, SourceLoc Loc) const {
return Loc == R.Start || Loc == R.End ||
(isBeforeInBuffer(R.Start, Loc) && isBeforeInBuffer(Loc, R.End));
}
/// Returns true if range \c Enclosing contains the range \c Inner.
bool rangeContains(SourceRange Enclosing, SourceRange Inner) const {
return rangeContainsTokenLoc(Enclosing, Inner.Start) &&
rangeContainsTokenLoc(Enclosing, Inner.End);
}
/// Returns true if range \p R contains the code-completion location, if any.
bool rangeContainsIDEInspectionTarget(SourceRange R) const {
return IDEInspectionTargetBufferID
? rangeContainsTokenLoc(R, getIDEInspectionTargetLoc())
: false;
}
/// Returns the buffer ID for the specified *valid* location.
///
/// Because a valid source location always corresponds to a source buffer,
/// this routine always returns a valid buffer ID.
unsigned findBufferContainingLoc(SourceLoc Loc) const;
/// Whether the source location is pointing to any buffer owned by the SourceManager.
bool isOwning(SourceLoc Loc) const;
/// Adds a memory buffer to the SourceManager, taking ownership of it.
unsigned addNewSourceBuffer(std::unique_ptr<llvm::MemoryBuffer> Buffer);
/// Add a \c #sourceLocation-defined virtual file region of \p Length.
void createVirtualFile(SourceLoc Loc, StringRef Name, int LineOffset,
unsigned Length);
/// Add a \c #sourceLocation-defined virtual file region.
///
/// By default, this region continues to the end of the buffer.
///
/// \returns True if the new file was added, false if the file already exists.
/// The name and line offset must match exactly in that case.
///
/// \sa closeVirtualFile
bool openVirtualFile(SourceLoc loc, StringRef name, int lineOffset);
/// Close a \c #sourceLocation-defined virtual file region.
void closeVirtualFile(SourceLoc end);
/// Creates a copy of a \c MemoryBuffer and adds it to the \c SourceManager,
/// taking ownership of the copy.
unsigned addMemBufferCopy(llvm::MemoryBuffer *Buffer);
/// Creates and adds a memory buffer to the \c SourceManager, taking
/// ownership of the newly created copy.
///
/// \p InputData and \p BufIdentifier are copied, so that this memory can go
/// away as soon as this function returns.
unsigned addMemBufferCopy(StringRef InputData, StringRef BufIdentifier = "");
/// Returns a buffer ID for a previously added buffer with the given
/// buffer identifier, or None if there is no such buffer.
Optional<unsigned> getIDForBufferIdentifier(StringRef BufIdentifier) const;
/// Returns the identifier for the buffer with the given ID.
///
/// \p BufferID must be a valid buffer ID.
///
/// This should not be used for displaying information about the \e contents
/// of a buffer, since lines within the buffer may be marked as coming from
/// other files using \c #sourceLocation. Use #getDisplayNameForLoc instead
/// in that case.
StringRef getIdentifierForBuffer(unsigned BufferID) const;
/// Returns a SourceRange covering the entire specified buffer.
///
/// Note that the start location might not point at the first token: it
/// might point at whitespace or a comment.
CharSourceRange getRangeForBuffer(unsigned BufferID) const;
/// Returns the SourceLoc for the beginning of the specified buffer
/// (at offset zero).
///
/// Note that the resulting location might not point at the first token: it
/// might point at whitespace or a comment.
SourceLoc getLocForBufferStart(unsigned BufferID) const {
return getRangeForBuffer(BufferID).getStart();
}
/// Returns the offset in bytes for the given valid source location.
unsigned getLocOffsetInBuffer(SourceLoc Loc, unsigned BufferID) const;
/// Returns the distance in bytes between the given valid source
/// locations.
unsigned getByteDistance(SourceLoc Start, SourceLoc End) const;
/// Returns the SourceLoc for the byte offset in the specified buffer.
SourceLoc getLocForOffset(unsigned BufferID, unsigned Offset) const {
return getLocForBufferStart(BufferID).getAdvancedLoc(Offset);
}
/// Returns a buffer identifier suitable for display to the user containing
/// the given source location.
///
/// This respects \c #sourceLocation directives and the 'use-external-names'
/// directive in VFS overlay files. If you need an on-disk file name, use
/// #getIdentifierForBuffer instead.
StringRef getDisplayNameForLoc(SourceLoc Loc) const;
/// Returns the line and column represented by the given source location.
///
/// If \p BufferID is provided, \p Loc must come from that source buffer.
///
/// This respects \c #sourceLocation directives.
std::pair<unsigned, unsigned>
getPresumedLineAndColumnForLoc(SourceLoc Loc, unsigned BufferID = 0) const {
assert(Loc.isValid());
int LineOffset = getLineOffset(Loc);
int l, c;
std::tie(l, c) = LLVMSourceMgr.getLineAndColumn(Loc.Value, BufferID);
assert(LineOffset+l > 0 && "bogus line offset");
return { LineOffset + l, c };
}
/// Returns the real line and column for a source location.
///
/// If \p BufferID is provided, \p Loc must come from that source buffer.
///
/// This does not respect \c #sourceLocation directives.
std::pair<unsigned, unsigned>
getLineAndColumnInBuffer(SourceLoc Loc, unsigned BufferID = 0) const {
assert(Loc.isValid());
return LLVMSourceMgr.getLineAndColumn(Loc.Value, BufferID);
}
/// Returns the column for the given source location in the given buffer.
unsigned getColumnInBuffer(SourceLoc Loc, unsigned BufferID) const;
StringRef getEntireTextForBuffer(unsigned BufferID) const;
StringRef extractText(CharSourceRange Range,
Optional<unsigned> BufferID = None) const;
llvm::SMDiagnostic GetMessage(SourceLoc Loc, llvm::SourceMgr::DiagKind Kind,
const Twine &Msg,
ArrayRef<llvm::SMRange> Ranges,
ArrayRef<llvm::SMFixIt> FixIts) const;
/// Verifies that all buffers are still valid.
void verifyAllBuffers() const;
/// Translate line and column pair to the offset.
/// If the column number is the maximum unsinged int, return the offset of the end of the line.
llvm::Optional<unsigned> resolveFromLineCol(unsigned BufferId, unsigned Line,
unsigned Col) const;
/// Translate the end position of the given line to the offset.
llvm::Optional<unsigned> resolveOffsetForEndOfLine(unsigned BufferId,
unsigned Line) const;
/// Get the length of the line
llvm::Optional<unsigned> getLineLength(unsigned BufferId, unsigned Line) const;
SourceLoc getLocForLineCol(unsigned BufferId, unsigned Line, unsigned Col) const {
auto Offset = resolveFromLineCol(BufferId, Line, Col);
return Offset.has_value() ? getLocForOffset(BufferId, Offset.value()) :
SourceLoc();
}
std::string getLineString(unsigned BufferID, unsigned LineNumber);
/// Retrieve the buffer ID for \p Path, loading if necessary.
unsigned getExternalSourceBufferID(StringRef Path);
SourceLoc getLocFromExternalSource(StringRef Path, unsigned Line, unsigned Col);
/// Retrieve the virtual file for the given \p Loc, or nullptr if none exists.
const VirtualFile *getVirtualFile(SourceLoc Loc) const;
/// Whether or not \p Loc is after a \c #sourceLocation directive, ie. its
/// file, line, and column should be reported using the information in the
/// directive.
bool isLocInVirtualFile(SourceLoc Loc) const {
return getVirtualFile(Loc) != nullptr;
}
/// Return a SourceLoc in \c this corresponding to \p otherLoc, which must be
/// owned by \p otherManager. Returns an invalid SourceLoc if it cannot be
/// translated.
SourceLoc getLocForForeignLoc(SourceLoc otherLoc, SourceManager &otherMgr);
private:
int getLineOffset(SourceLoc Loc) const {
if (auto VFile = getVirtualFile(Loc))
return VFile->LineOffset;
else
return 0;
}
};
} // end namespace swift
#endif // SWIFT_BASIC_SOURCEMANAGER_H