//===--- SILConstants.h - SIL constant representation -----------*- C++ -*-===// // // This source file is part of the Swift.org open source project // // Copyright (c) 2014 - 2017 Apple Inc. and the Swift project authors // Licensed under Apache License v2.0 with Runtime Library Exception // // See https://swift.org/LICENSE.txt for license information // See https://swift.org/CONTRIBUTORS.txt for the list of Swift project authors // //===----------------------------------------------------------------------===// // // This defines an interface to represent SIL level structured constants in a // memory efficient way. // //===----------------------------------------------------------------------===// #ifndef SWIFT_SIL_CONSTANTS_H #define SWIFT_SIL_CONSTANTS_H #include "swift/SIL/SILValue.h" #include "llvm/Support/CommandLine.h" namespace swift { class SingleValueInstruction; class SILValue; class SILBuilder; class SerializedSILLoader; struct APIntSymbolicValue; struct ArraySymbolicValue; struct DerivedAddressValue; struct EnumWithPayloadSymbolicValue; struct SymbolicValueMemoryObject; struct UnknownSymbolicValue; extern llvm::cl::opt ConstExprLimit; /// When we fail to constant fold a value, this captures a reason why, /// allowing the caller to produce a specific diagnostic. The "Unknown" /// SymbolicValue representation also includes a pointer to the SILNode in /// question that was problematic. enum class UnknownReason { // TODO: Eliminate the default code, by making classifications for each // failure mode. Default, /// The constant expression was too big. This is reported on a random /// instruction within the constexpr that triggered the issue. TooManyInstructions, /// A control flow loop was found. Loop, /// Integer overflow detected. Overflow, /// Unspecified trap detected. Trap, /// An operation was applied over operands whose symbolic values were /// constants but were not valid for the operation. InvalidOperandValue, /// Encountered an instruction not supported by the interpreter. UnsupportedInstruction, /// Encountered a function call where the body of the called function is /// not available. CalleeImplementationUnknown, /// Attempted to load from/store into a SIL value that was not tracked by /// the interpreter. UntrackedSILValue, /// Attempted to find a concrete protocol conformance for a witness method /// and failed. UnknownWitnessMethodConformance, /// Attempted to determine the SIL function of a witness method (based on a /// concrete protocol conformance) and failed. UnresolvableWitnessMethod, /// The value of a top-level variable cannot be determined to be a constant. /// This is only relevant in the backward evaluation mode, which is used by /// #assert. NotTopLevelConstant, /// A top-level value has multiple writers. This is only relevant in the /// non-flow-sensitive evaluation mode, which is used by #assert. MutipleTopLevelWriters, /// Indicates the return value of an instruction that was not evaluated during /// interpretation. ReturnedByUnevaluatedInstruction, /// Indicates that the value was possibly modified by an instruction /// that was not evaluated during the interpretation. MutatedByUnevaluatedInstruction, }; /// An abstract class that exposes functions for allocating symbolic values. /// The implementors of this class have to determine where to allocate them and /// and manage the lifetime of the allocated symbolic values. class SymbolicValueAllocator { public: virtual ~SymbolicValueAllocator() {} /// Allocate raw bytes. /// \param byteSize number of bytes to allocate. /// \param alignment alignment for the allocated bytes. virtual void *allocate(unsigned long byteSize, unsigned alignment) = 0; /// Allocate storage for a given number of elements of a specific type /// provided as a template parameter. Precondition: \c T must have an /// accesible zero argument constructor. /// \param numElts number of elements of the type to allocate. template T *allocate(unsigned numElts) { T *res = (T *)allocate(sizeof(T) * numElts, alignof(T)); for (unsigned i = 0; i != numElts; ++i) new (res + i) T(); return res; } }; /// A class that allocates symbolic values in a local bump allocator. The /// lifetime of the bump allocator is same as the lifetime of \c this object. class SymbolicValueBumpAllocator : public SymbolicValueAllocator { private: llvm::BumpPtrAllocator bumpAllocator; public: SymbolicValueBumpAllocator() {} ~SymbolicValueBumpAllocator() {} void *allocate(unsigned long byteSize, unsigned alignment) { return bumpAllocator.Allocate(byteSize, alignment); } }; /// This is the symbolic value tracked for each SILValue in a scope. We /// support multiple representational forms for the constant node in order to /// avoid pointless memory bloat + copying. This is intended to be a /// light-weight POD type we can put in hash tables and pass around by-value. /// /// Internally, this value has multiple ways to represent the same sorts of /// symbolic values (e.g. to save memory). It provides a simpler public /// interface though. class SymbolicValue { private: enum RepresentationKind { /// This value is an alloc stack that has not (yet) been initialized /// by flow-sensitive analysis. RK_UninitMemory, /// This symbolic value cannot be determined, carries multiple values /// (i.e., varies dynamically at the top level), or is of some type that /// we cannot analyze and propagate (e.g. NSObject). /// RK_Unknown, /// This value is known to be a metatype reference. The type is stored /// in the "metatype" member. RK_Metatype, /// This value is known to be a function reference, e.g. through /// function_ref directly, or a devirtualized method reference. RK_Function, /// This value is represented with a bump-pointer allocated APInt. RK_Integer, /// This value is represented with an inline integer representation. RK_IntegerInline, /// This value is represented with a bump-pointer allocated char array /// representing a UTF-8 encoded string. RK_String, /// This value is a struct or tuple of constants. This is tracked by the /// "aggregate" member of the value union. RK_Aggregate, /// This value is an enum with no payload. RK_Enum, /// This value is an enum with a payload. RK_EnumWithPayload, /// This represents the address of a memory object. RK_DirectAddress, /// This represents an index *into* a memory object. RK_DerivedAddress, }; union { /// When the value is Unknown, this contains information about the /// unfoldable part of the computation. UnknownSymbolicValue *unknown; /// This is always a SILType with an object category. This is the value /// of the underlying instance type, not the MetatypeType. TypeBase *metatype; SILFunction *function; /// When this SymbolicValue is of "Integer" kind, this pointer stores /// the words of the APInt value it holds. uint64_t *integer; /// This holds the bits of an integer for an inline representation. uint64_t integerInline; /// When this SymbolicValue is of "String" kind, this pointer stores /// information about the StringRef value it holds. const char *string; /// When this SymbolicValue is of "Aggregate" kind, this pointer stores /// information about the array elements and count. const SymbolicValue *aggregate; /// When this SymbolicValue is of "Enum" kind, this pointer stores /// information about the enum case type. EnumElementDecl *enumVal; /// When this SymbolicValue is of "EnumWithPayload" kind, this pointer /// stores information about the enum case type and its payload. EnumWithPayloadSymbolicValue *enumValWithPayload; /// When the representationKind is "DirectAddress", this pointer is the /// memory object referenced. SymbolicValueMemoryObject *directAddress; /// When this SymbolicValue is of "DerivedAddress" kind, this pointer stores /// information about the memory object and access path of the access. DerivedAddressValue *derivedAddress; } value; RepresentationKind representationKind : 8; union { /// This is the reason code for RK_Unknown values. UnknownReason unknownReason : 32; /// This is the number of bits in an RK_Integer or RK_IntegerInline /// representation, which makes the number of entries in the list derivable. unsigned integerBitwidth; /// This is the number of bytes for an RK_String representation. unsigned stringNumBytes; /// This is the number of elements for an RK_Aggregate representation. unsigned aggregateNumElements; } auxInfo; public: /// This enum is used to indicate the sort of value held by a SymbolicValue /// independent of its concrete representation. This is the public /// interface to SymbolicValue. enum Kind { /// This is a value that isn't a constant. Unknown, /// This is a known metatype value. Metatype, /// This is a function, represented as a SILFunction. Function, /// This is an integer constant. Integer, /// String values may have SIL type of Builtin.RawPointer or Builtin.Word /// type. String, /// This can be an array, struct, tuple, etc. Aggregate, /// This is an enum without payload. Enum, /// This is an enum with payload (formally known as "associated value"). EnumWithPayload, /// This value represents the address of, or into, a memory object. Address, /// These values are generally only seen internally to the system, external /// clients shouldn't have to deal with them. UninitMemory }; /// For constant values, return the type classification of this value. Kind getKind() const; /// Return true if this represents a constant value. bool isConstant() const { auto kind = getKind(); return kind != Unknown && kind != UninitMemory; } static SymbolicValue getUnknown(SILNode *node, UnknownReason reason, llvm::ArrayRef callStack, SymbolicValueAllocator &allocator); /// Return true if this represents an unknown result. bool isUnknown() const { return getKind() == Unknown; } /// Return the call stack for an unknown result. ArrayRef getUnknownCallStack() const; /// Return the node that triggered an unknown result. SILNode *getUnknownNode() const; /// Return the reason an unknown result was generated. UnknownReason getUnknownReason() const; static SymbolicValue getUninitMemory() { SymbolicValue result; result.representationKind = RK_UninitMemory; return result; } static SymbolicValue getMetatype(CanType type) { SymbolicValue result; result.representationKind = RK_Metatype; result.value.metatype = type.getPointer(); return result; } CanType getMetatypeValue() const { assert(representationKind == RK_Metatype); return CanType(value.metatype); } static SymbolicValue getFunction(SILFunction *fn) { assert(fn && "Function cannot be null"); SymbolicValue result; result.representationKind = RK_Function; result.value.function = fn; return result; } SILFunction *getFunctionValue() const { assert(getKind() == Function); return value.function; } static SymbolicValue getInteger(int64_t value, unsigned bitWidth); static SymbolicValue getInteger(const APInt &value, SymbolicValueAllocator &allocator); APInt getIntegerValue() const; unsigned getIntegerValueBitWidth() const; /// Returns a SymbolicValue representing a UTF-8 encoded string. static SymbolicValue getString(StringRef string, SymbolicValueAllocator &allocator); /// Returns the UTF-8 encoded string underlying a SymbolicValue. StringRef getStringValue() const; /// This returns an aggregate value with the specified elements in it. This /// copies the elements into the specified Allocator. static SymbolicValue getAggregate(ArrayRef elements, SymbolicValueAllocator &allocator); ArrayRef getAggregateValue() const; /// This returns a constant Symbolic value for the enum case in `decl`, which /// must not have an associated value. static SymbolicValue getEnum(EnumElementDecl *decl) { assert(decl); SymbolicValue result; result.representationKind = RK_Enum; result.value.enumVal = decl; return result; } /// `payload` must be a constant. static SymbolicValue getEnumWithPayload(EnumElementDecl *decl, SymbolicValue payload, SymbolicValueAllocator &allocator); EnumElementDecl *getEnumValue() const; SymbolicValue getEnumPayloadValue() const; /// Return a symbolic value that represents the address of a memory object. static SymbolicValue getAddress(SymbolicValueMemoryObject *memoryObject) { SymbolicValue result; result.representationKind = RK_DirectAddress; result.value.directAddress = memoryObject; return result; } /// Return a symbolic value that represents the address of a memory object /// indexed by a path. static SymbolicValue getAddress(SymbolicValueMemoryObject *memoryObject, ArrayRef indices, SymbolicValueAllocator &allocator); /// Return the memory object of this reference along with any access path /// indices involved. SymbolicValueMemoryObject * getAddressValue(SmallVectorImpl &accessPath) const; /// Return just the memory object for an address value. SymbolicValueMemoryObject *getAddressValueMemoryObject() const; //===--------------------------------------------------------------------===// // Helpers /// Dig through single element aggregates, return the ultimate thing inside of /// it. This is useful when dealing with integers and floats, because they /// are often wrapped in single-element struct wrappers. SymbolicValue lookThroughSingleElementAggregates() const; /// Given that this is an 'Unknown' value, emit diagnostic notes providing /// context about what the problem is. If there is no location for some /// reason, we fall back to using the specified location. void emitUnknownDiagnosticNotes(SILLocation fallbackLoc); bool isUnknownDueToUnevaluatedInstructions(); /// Clone this SymbolicValue into the specified Allocator and return the new /// version. This only works for valid constants. SymbolicValue cloneInto(SymbolicValueAllocator &allocator) const; void print(llvm::raw_ostream &os, unsigned indent = 0) const; void dump() const; }; static_assert(sizeof(SymbolicValue) == 2 * sizeof(void *), "SymbolicValue should stay small"); static_assert(std::is_pod::value, "SymbolicValue should stay POD"); inline llvm::raw_ostream &operator<<(llvm::raw_ostream &os, SymbolicValue val) { val.print(os); return os; } /// This is a representation of a memory object referred to by an address. /// Memory objects may be mutated over their lifetime, but their overall type /// remains the same. struct SymbolicValueMemoryObject { Type getType() const { return type; } SymbolicValue getValue() const { return value; } void setValue(SymbolicValue newValue) { value = newValue; } /// Create a new memory object whose overall type is as specified. static SymbolicValueMemoryObject *create(Type type, SymbolicValue value, SymbolicValueAllocator &allocator); /// Given that this memory object contains an aggregate value like /// {{1, 2}, 3}, and given an access path like [0,1], return the indexed /// element, e.g. "2" in this case. /// /// Returns uninit memory if the access path points at or into uninit memory. /// /// Precondition: The access path must be valid for this memory object's type. SymbolicValue getIndexedElement(ArrayRef accessPath); /// Given that this memory object contains an aggregate value like /// {{1, 2}, 3}, given an access path like [0,1], and given a new element like /// "4", set the indexed element to the specified scalar, producing {{1, 4}, /// 3} in this case. /// /// Precondition: The access path must be valid for this memory object's type. void setIndexedElement(ArrayRef accessPath, SymbolicValue newElement, SymbolicValueAllocator &allocator); private: const Type type; SymbolicValue value; SymbolicValueMemoryObject(Type type, SymbolicValue value) : type(type), value(value) {} SymbolicValueMemoryObject(const SymbolicValueMemoryObject &) = delete; void operator=(const SymbolicValueMemoryObject &) = delete; }; } // end namespace swift #endif