//===--- Demangle.h - Interface to Swift symbol demangling ------*- C++ -*-===// // // This source file is part of the Swift.org open source project // // Copyright (c) 2014 - 2017 Apple Inc. and the Swift project authors // Licensed under Apache License v2.0 with Runtime Library Exception // // See https://swift.org/LICENSE.txt for license information // See https://swift.org/CONTRIBUTORS.txt for the list of Swift project authors // //===----------------------------------------------------------------------===// // // This file is the public API of the demangler library. // Tools which use the demangler library (like lldb) must include this - and // only this - header file. // //===----------------------------------------------------------------------===// #ifndef SWIFT_DEMANGLING_DEMANGLE_H #define SWIFT_DEMANGLING_DEMANGLE_H #include #include #include #include #include "llvm/ADT/StringRef.h" namespace llvm { class raw_ostream; } namespace swift { namespace Demangle { struct DemangleOptions { bool SynthesizeSugarOnTypes = false; bool DisplayDebuggerGeneratedModule = true; bool QualifyEntities = true; bool DisplayExtensionContexts = true; bool DisplayUnmangledSuffix = true; bool DisplayModuleNames = true; bool DisplayGenericSpecializations = true; bool DisplayProtocolConformances = true; bool DisplayWhereClauses = true; bool DisplayEntityTypes = true; bool ShortenPartialApply = false; bool ShortenThunk = false; bool ShortenValueWitness = false; bool ShortenArchetype = false; bool ShowPrivateDiscriminators = true; bool ShowFunctionArgumentTypes = true; DemangleOptions() {} static DemangleOptions SimplifiedUIDemangleOptions() { auto Opt = DemangleOptions(); Opt.SynthesizeSugarOnTypes = true; Opt.QualifyEntities = true; Opt.DisplayExtensionContexts = false; Opt.DisplayUnmangledSuffix = false; Opt.DisplayModuleNames = false; Opt.DisplayGenericSpecializations = false; Opt.DisplayProtocolConformances = false; Opt.DisplayWhereClauses = false; Opt.DisplayEntityTypes = false; Opt.ShortenPartialApply = true; Opt.ShortenThunk = true; Opt.ShortenValueWitness = true; Opt.ShortenArchetype = true; Opt.ShowPrivateDiscriminators = false; Opt.ShowFunctionArgumentTypes = false; return Opt; }; }; class Node; typedef Node *NodePointer; enum class FunctionSigSpecializationParamKind : unsigned { // Option Flags use bits 0-5. This give us 6 bits implying 64 entries to // work with. ConstantPropFunction = 0, ConstantPropGlobal = 1, ConstantPropInteger = 2, ConstantPropFloat = 3, ConstantPropString = 4, ClosureProp = 5, BoxToValue = 6, BoxToStack = 7, // Option Set Flags use bits 6-31. This gives us 26 bits to use for option // flags. Dead = 1 << 6, OwnedToGuaranteed = 1 << 7, SROA = 1 << 8, }; /// The pass that caused the specialization to occur. We use this to make sure /// that two passes that generate similar changes do not yield the same /// mangling. This currently cannot happen, so this is just a safety measure /// that creates separate name spaces. enum class SpecializationPass : uint8_t { AllocBoxToStack, ClosureSpecializer, CapturePromotion, CapturePropagation, FunctionSignatureOpts, GenericSpecializer, }; static inline char encodeSpecializationPass(SpecializationPass Pass) { return char(uint8_t(Pass)) + '0'; } enum class ValueWitnessKind { #define VALUE_WITNESS(MANGLING, NAME) \ NAME, #include "swift/Demangling/ValueWitnessMangling.def" }; enum class Directness { Direct, Indirect }; class NodeFactory; class Context; class Node { public: enum class Kind : uint16_t { #define NODE(ID) ID, #include "swift/Demangling/DemangleNodes.def" }; typedef uint64_t IndexType; friend class NodeFactory; private: Kind NodeKind; enum class PayloadKind : uint8_t { None, Text, Index }; PayloadKind NodePayloadKind; union { llvm::StringRef TextPayload; IndexType IndexPayload; }; NodePointer *Children = nullptr; size_t NumChildren = 0; size_t ReservedChildren = 0; Node(Kind k) : NodeKind(k), NodePayloadKind(PayloadKind::None) { } Node(Kind k, llvm::StringRef t) : NodeKind(k), NodePayloadKind(PayloadKind::Text) { TextPayload = t; } Node(Kind k, IndexType index) : NodeKind(k), NodePayloadKind(PayloadKind::Index) { IndexPayload = index; } Node(const Node &) = delete; Node &operator=(const Node &) = delete; public: Kind getKind() const { return NodeKind; } bool hasText() const { return NodePayloadKind == PayloadKind::Text; } llvm::StringRef getText() const { assert(hasText()); return TextPayload; } bool hasIndex() const { return NodePayloadKind == PayloadKind::Index; } uint64_t getIndex() const { assert(hasIndex()); return IndexPayload; } typedef NodePointer *iterator; typedef const NodePointer *const_iterator; typedef size_t size_type; bool hasChildren() const { return NumChildren != 0; } size_t getNumChildren() const { return NumChildren; } iterator begin() { return Children; } iterator end() { return Children + NumChildren; } const_iterator begin() const { return Children; } const_iterator end() const { return Children + NumChildren; } NodePointer getFirstChild() const { assert(NumChildren >= 1); return Children[0]; } NodePointer getChild(size_t index) const { assert(NumChildren > index); return Children[index]; } // inline void addChild(NodePointer Child, Context &Ctx); // Only to be used by the demangler parsers. void addChild(NodePointer Child, NodeFactory &Factory); // Reverses the order of children. void reverseChildren(size_t StartingAt = 0); /// Prints the whole node tree in readable form to stderr. /// /// Useful to be called from the debugger. void dump(); }; /// Returns true if the mangledName starts with the swift mangling prefix. /// /// \param mangledName A null-terminated string containing a mangled name. bool isSwiftSymbol(const char *mangledName); class Demangler; /// The demangler context. /// /// It owns the allocated nodes which are created during demangling. /// It is always preferable to use the demangling via this context class as it /// ensures efficient memory management. Especially if demangling is done for /// multiple symbols. Typical usage: /// \code /// Context Ctx; /// for (...) { /// NodePointer Root = Ctx.demangleSymbolAsNode(MangledName); /// // Do something with Root /// Ctx.clear(); // deallocates Root /// } /// \endcode /// Declaring the context out of the loop minimizes the amount of needed memory /// allocations. /// class Context { Demangler *D; friend class Node; public: Context(); ~Context(); /// Demangle the given symbol and return the parse tree. /// /// \param MangledName The mangled symbol string, which start with the /// mangling prefix _T. /// /// \returns A parse tree for the demangled string - or a null pointer /// on failure. /// The lifetime of the returned node tree ends with the lifetime of the /// context or with a call of clear(). NodePointer demangleSymbolAsNode(llvm::StringRef MangledName); /// Demangle the given type and return the parse tree. /// /// \param MangledName The mangled type string, which does _not_ start with /// the mangling prefix _T. /// /// \returns A parse tree for the demangled string - or a null pointer /// on failure. /// The lifetime of the returned node tree ends with the lifetime of the /// context or with a call of clear(). NodePointer demangleTypeAsNode(llvm::StringRef MangledName); /// Demangle the given symbol and return the readable name. /// /// \param MangledName The mangled symbol string, which start with the /// mangling prefix _T. /// /// \returns The demangled string. std::string demangleSymbolAsString(llvm::StringRef MangledName, const DemangleOptions &Options = DemangleOptions()); /// Demangle the given type and return the readable name. /// /// \param MangledName The mangled type string, which does _not_ start with /// the mangling prefix _T. /// /// \returns The demangled string. std::string demangleTypeAsString(llvm::StringRef MangledName, const DemangleOptions &Options = DemangleOptions()); /// Returns true if the mangledName refers to a thunk function. /// /// Thunk functions are either (ObjC) partial apply forwarder, swift-as-ObjC /// or ObjC-as-swift thunks. bool isThunkSymbol(llvm::StringRef MangledName); /// Returns the mangled name of the target of a thunk. /// /// \returns Returns the remaining name after removing the thunk mangling /// characters from \p MangledName. If \p MangledName is not a thunk symbol /// or the thunk target cannot be derived from the mangling, an empty string /// is returned. std::string getThunkTarget(llvm::StringRef MangledName); /// Returns true if the \p mangledName refers to a function which conforms to /// the Swift calling convention. /// /// The return value is unspecified if the \p MangledName does not refer to a /// function symbol. bool hasSwiftCallingConvention(llvm::StringRef MangledName); /// Deallocates all nodes. /// /// The memory which is used for nodes is not freed but recycled for the next /// demangling operation. void clear(); }; /// Standalone utility function to demangle the given symbol as string. /// /// If performance is an issue when demangling multiple symbols, /// Context::demangleSymbolAsString should be used instead. /// \param mangledName The mangled name string pointer. /// \param mangledNameLength The length of the mangledName string. /// \returns The demangled string. std::string demangleSymbolAsString(const char *mangledName, size_t mangledNameLength, const DemangleOptions &options = DemangleOptions()); /// Standalone utility function to demangle the given symbol as string. /// /// If performance is an issue when demangling multiple symbols, /// Context::demangleSymbolAsString should be used instead. /// \param mangledName The mangled name string. /// \returns The demangled string. inline std::string demangleSymbolAsString(const std::string &mangledName, const DemangleOptions &options = DemangleOptions()) { return demangleSymbolAsString(mangledName.data(), mangledName.size(), options); } /// Standalone utility function to demangle the given symbol as string. /// /// If performance is an issue when demangling multiple symbols, /// Context::demangleSymbolAsString should be used instead. /// \param MangledName The mangled name string. /// \returns The demangled string. inline std::string demangleSymbolAsString(llvm::StringRef MangledName, const DemangleOptions &Options = DemangleOptions()) { return demangleSymbolAsString(MangledName.data(), MangledName.size(), Options); } /// Standalone utility function to demangle the given type as string. /// /// If performance is an issue when demangling multiple symbols, /// Context::demangleTypeAsString should be used instead. /// \param mangledName The mangled name string pointer. /// \param mangledNameLength The length of the mangledName string. /// \returns The demangled string. std::string demangleTypeAsString(const char *mangledName, size_t mangledNameLength, const DemangleOptions &options = DemangleOptions()); /// Standalone utility function to demangle the given type as string. /// /// If performance is an issue when demangling multiple symbols, /// Context::demangleTypeAsString should be used instead. /// \param mangledName The mangled name string. /// \returns The demangled string. inline std::string demangleTypeAsString(const std::string &mangledName, const DemangleOptions &options = DemangleOptions()) { return demangleTypeAsString(mangledName.data(), mangledName.size(), options); } /// Standalone utility function to demangle the given type as string. /// /// If performance is an issue when demangling multiple symbols, /// Context::demangleTypeAsString should be used instead. /// \param MangledName The mangled name string. /// \returns The demangled string. inline std::string demangleTypeAsString(llvm::StringRef MangledName, const DemangleOptions &Options = DemangleOptions()) { return demangleTypeAsString(MangledName.data(), MangledName.size(), Options); } enum class OperatorKind { NotOperator, Prefix, Postfix, Infix, }; /// \brief Mangle an identifier using Swift's mangling rules. void mangleIdentifier(const char *data, size_t length, OperatorKind operatorKind, std::string &out, bool usePunycode = true); /// \brief Remangle a demangled parse tree. /// /// This should always round-trip perfectly with demangleSymbolAsNode. std::string mangleNode(const NodePointer &root); /// \brief Transform the node structure to a string. /// /// Typical usage: /// \code /// std::string aDemangledName = /// swift::Demangler::nodeToString(aNode) /// \endcode /// /// \param Root A pointer to a parse tree generated by the demangler. /// \param Options An object encapsulating options to use to perform this demangling. /// /// \returns A string representing the demangled name. /// std::string nodeToString(NodePointer Root, const DemangleOptions &Options = DemangleOptions()); /// A class for printing to a std::string. class DemanglerPrinter { public: DemanglerPrinter() = default; DemanglerPrinter &operator<<(llvm::StringRef Value) & { Stream.append(Value.data(), Value.size()); return *this; } DemanglerPrinter &operator<<(char c) & { Stream.push_back(c); return *this; } DemanglerPrinter &operator<<(unsigned long long n) &; DemanglerPrinter &operator<<(long long n) &; DemanglerPrinter &operator<<(unsigned long n) & { return *this << (unsigned long long)n; } DemanglerPrinter &operator<<(long n) & { return *this << (long long)n; } DemanglerPrinter &operator<<(unsigned n) & { return *this << (unsigned long long)n; } DemanglerPrinter &operator<<(int n) & { return *this << (long long)n; } template DemanglerPrinter &&operator<<(T &&x) && { return std::move(*this << std::forward(x)); } std::string &&str() && { return std::move(Stream); } llvm::StringRef getStringRef() const { return Stream; } /// Shrinks the buffer. void resetSize(size_t toPos) { assert(toPos <= Stream.size()); Stream.resize(toPos); } private: std::string Stream; }; /// Returns a the node kind \p k as string. const char *getNodeKindString(swift::Demangle::Node::Kind k); /// Prints the whole node tree \p Root in readable form into a std::string. /// /// Useful for debugging. std::string getNodeTreeAsString(NodePointer Root); bool isSpecialized(Node *node); NodePointer getUnspecialized(Node *node, NodeFactory &Factory); std::string archetypeName(Node::IndexType index, Node::IndexType depth); } // end namespace Demangle } // end namespace swift #endif // SWIFT_DEMANGLING_DEMANGLE_H