mirror of
https://github.com/apple/swift.git
synced 2025-12-14 20:36:38 +01:00
415 lines
12 KiB
Swift
415 lines
12 KiB
Swift
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This source file is part of the Swift.org open source project
|
|
//
|
|
// Copyright (c) 2014 - 2018 Apple Inc. and the Swift project authors
|
|
// Licensed under Apache License v2.0 with Runtime Library Exception
|
|
//
|
|
// See https://swift.org/LICENSE.txt for license information
|
|
// See https://swift.org/CONTRIBUTORS.txt for the list of Swift project authors
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
import SwiftShims
|
|
|
|
//
|
|
// StringGuts is a parameterization over String's representations. It provides
|
|
// functionality and guidance for efficiently working with Strings.
|
|
//
|
|
@_fixed_layout @usableFromInline
|
|
internal struct _StringGuts {
|
|
@usableFromInline
|
|
internal var _object: _StringObject
|
|
|
|
@inlinable @inline(__always)
|
|
internal init(_ object: _StringObject) {
|
|
self._object = object
|
|
_invariantCheck()
|
|
}
|
|
|
|
// Empty string
|
|
@inlinable @inline(__always)
|
|
init() {
|
|
self.init(_StringObject(empty: ()))
|
|
}
|
|
}
|
|
|
|
// Raw
|
|
extension _StringGuts {
|
|
@usableFromInline
|
|
internal typealias RawBitPattern = _StringObject.RawBitPattern
|
|
|
|
@inlinable
|
|
internal var rawBits: RawBitPattern {
|
|
@inline(__always) get { return _object.rawBits }
|
|
}
|
|
|
|
@inlinable @inline(__always)
|
|
init(raw bits: RawBitPattern) {
|
|
self.init(_StringObject(raw: bits))
|
|
}
|
|
|
|
}
|
|
|
|
// Creation
|
|
extension _StringGuts {
|
|
@inlinable @inline(__always)
|
|
internal init(_ smol: _SmallString) {
|
|
self.init(_StringObject(smol))
|
|
}
|
|
|
|
@inlinable @inline(__always)
|
|
internal init(_ bufPtr: UnsafeBufferPointer<UInt8>, isKnownASCII: Bool) {
|
|
self.init(_StringObject(immortal: bufPtr, isASCII: isKnownASCII))
|
|
}
|
|
|
|
@inlinable @inline(__always)
|
|
internal init(_ storage: _StringStorage) {
|
|
// TODO(UTF8): We should probably store perf flags on the storage's capacity
|
|
self.init(_StringObject(storage, isASCII: false))
|
|
}
|
|
|
|
internal init(_ storage: _SharedStringStorage) {
|
|
// TODO(UTF8 perf): Is it better, or worse, to throw the object away if
|
|
// immortal? We could avoid having to ARC the object itself when owner is
|
|
// nil, at the cost of repeatedly creating a new one when this string is
|
|
// bridged back-and-forth to ObjC. For now, we're choosing to keep the
|
|
// object allocation, perform some ARC, and require a dependent load for
|
|
// literals that have bridged back in from ObjC. Long term, we will likely
|
|
// emit some kind of "immortal" object for literals with efficient bridging
|
|
// anyways, so this may be a short-term decision.
|
|
|
|
// TODO(UTF8): We should probably store perf flags in the object
|
|
self.init(_StringObject(storage, isASCII: false))
|
|
}
|
|
|
|
internal init(cocoa: AnyObject, providesFastUTF8: Bool, length: Int) {
|
|
self.init(_StringObject(
|
|
cocoa: cocoa, providesFastUTF8: providesFastUTF8, length: length))
|
|
}
|
|
}
|
|
|
|
// Queries
|
|
extension _StringGuts {
|
|
// The number of code units
|
|
@inlinable
|
|
internal var count: Int { @inline(__always) get { return _object.count } }
|
|
|
|
@inlinable
|
|
internal var isEmpty: Bool { @inline(__always) get { return count == 0 } }
|
|
|
|
@inlinable
|
|
internal var isKnownASCII: Bool {
|
|
@inline(__always) get { return _object.isASCII }
|
|
}
|
|
|
|
internal var nativeCapacity: Int? {
|
|
guard hasNativeStorage else { return nil }
|
|
return _object.nativeStorage.capacity
|
|
}
|
|
|
|
internal var nativeUnusedCapacity: Int? {
|
|
guard hasNativeStorage else { return nil }
|
|
return _object.nativeStorage.unusedCapacity
|
|
}
|
|
|
|
// If natively stored and uniquely referenced, return the storage's total
|
|
// capacity. Otherwise, nil.
|
|
internal var uniqueNativeCapacity: Int? {
|
|
@inline(__always) mutating get {
|
|
guard isUniqueNative else { return nil }
|
|
return _object.nativeStorage.capacity
|
|
}
|
|
}
|
|
|
|
// If natively stored and uniquely referenced, return the storage's spare
|
|
// capacity. Otherwise, nil.
|
|
internal var uniqueNativeUnusedCapacity: Int? {
|
|
@inline(__always) mutating get {
|
|
guard isUniqueNative else { return nil }
|
|
return _object.nativeStorage.unusedCapacity
|
|
}
|
|
}
|
|
|
|
@inlinable
|
|
internal var hasNativeStorage: Bool { return _object.hasNativeStorage }
|
|
}
|
|
|
|
//
|
|
extension _StringGuts {
|
|
// Whether we can provide fast access to contiguous UTF-8 code units
|
|
@inlinable
|
|
internal var isFastUTF8: Bool {
|
|
@inline(__always) get {
|
|
// TODO(UTF8 merge): Can we add the Builtin.expected here?
|
|
return _object.providesFastUTF8
|
|
}
|
|
}
|
|
// A String which does not provide fast access to contiguous UTF-8 code units
|
|
@inlinable
|
|
internal var isForeign: Bool {
|
|
@inline(__always) get { return _object.isForeign }
|
|
}
|
|
|
|
@inlinable @inline(__always)
|
|
internal func withFastUTF8<R>(
|
|
_ f: (UnsafeBufferPointer<UInt8>) throws -> R
|
|
) rethrows -> R {
|
|
_sanityCheck(isFastUTF8)
|
|
|
|
if _object.isSmall { return try _object.asSmallString.withUTF8(f) }
|
|
|
|
defer { _fixLifetime(self) }
|
|
return try f(_object.fastUTF8)
|
|
}
|
|
|
|
@inlinable @inline(__always)
|
|
internal func withUTF8IfAvailable<R>(
|
|
_ f: (UnsafeBufferPointer<UInt8>) throws -> R
|
|
) rethrows -> R? {
|
|
if _slowPath(isForeign) { return nil }
|
|
return try withFastUTF8(f)
|
|
}
|
|
}
|
|
|
|
// Internal invariants
|
|
extension _StringGuts {
|
|
@inlinable @inline(__always)
|
|
internal func _invariantCheck() {
|
|
#if INTERNAL_CHECKS_ENABLED
|
|
_object._invariantCheck()
|
|
#if arch(i386) || arch(arm)
|
|
_sanityCheck(MemoryLayout<String>.size == 12, """
|
|
the runtime is depending on this, update Reflection.mm and \
|
|
this if you change it
|
|
""")
|
|
#else
|
|
_sanityCheck(MemoryLayout<String>.size == 16, """
|
|
the runtime is depending on this, update Reflection.mm and \
|
|
this if you change it
|
|
""")
|
|
#endif
|
|
#endif // INTERNAL_CHECKS_ENABLED
|
|
}
|
|
|
|
internal func _dump() { _object._dump() }
|
|
}
|
|
|
|
// Append
|
|
extension _StringGuts {
|
|
@usableFromInline // @testable
|
|
internal var isUniqueNative: Bool {
|
|
@inline(__always) mutating get {
|
|
// Note: mutating so that self is `inout`.
|
|
guard hasNativeStorage else { return false }
|
|
defer { _fixLifetime(self) }
|
|
var bits: UInt = _object.largeAddressBits
|
|
return _isUnique_native(&bits)
|
|
}
|
|
}
|
|
|
|
internal mutating func reserveCapacity(_ n: Int) {
|
|
// Check if there's nothing to do
|
|
if n <= _SmallString.capacity { return }
|
|
if let currentCap = self.uniqueNativeCapacity, currentCap >= n { return }
|
|
|
|
// Grow
|
|
self.grow(n)
|
|
}
|
|
|
|
// Grow to accomodate at least `n` code units
|
|
internal mutating func grow(_ n: Int) {
|
|
defer { self._invariantCheck() }
|
|
|
|
_sanityCheck(
|
|
self.uniqueNativeCapacity == nil || self.uniqueNativeCapacity! < n)
|
|
|
|
if _fastPath(isFastUTF8) {
|
|
let storage = self.withFastUTF8 {
|
|
_StringStorage.create(initializingFrom: $0, capacity: n)
|
|
}
|
|
|
|
// TODO(UTF8): Track known ascii
|
|
self = _StringGuts(storage)
|
|
return
|
|
}
|
|
|
|
_foreignGrow(n)
|
|
}
|
|
|
|
@inline(never) // slow-path
|
|
internal mutating func _foreignGrow(_ n: Int) {
|
|
// TODO(UTF8 perf): skip the intermediary arrays
|
|
let selfUTF8 = Array(String(self).utf8)
|
|
selfUTF8.withUnsafeBufferPointer {
|
|
self = _StringGuts(_StringStorage.create(
|
|
initializingFrom: $0, capacity: n))
|
|
}
|
|
}
|
|
|
|
internal mutating func append(_ other: _StringGuts) {
|
|
defer { self._invariantCheck() }
|
|
|
|
// Try to form a small string if possible
|
|
if !hasNativeStorage {
|
|
if let smol = _SmallString(base: self, appending: other) {
|
|
self = _StringGuts(smol)
|
|
return
|
|
}
|
|
}
|
|
|
|
// See if we can accomodate without growing or copying. If we have
|
|
// sufficient capacity, we do not need to grow, and we can skip the copy if
|
|
// unique. Otherwise, growth is required.
|
|
let otherUTF8Count = other.utf8Count
|
|
let sufficientCapacity: Bool
|
|
if let unused = self.nativeUnusedCapacity, unused >= otherUTF8Count {
|
|
sufficientCapacity = true
|
|
} else {
|
|
sufficientCapacity = false
|
|
}
|
|
if !self.isUniqueNative || !sufficientCapacity {
|
|
let totalCount = self.utf8Count + otherUTF8Count
|
|
|
|
// Non-unique storage: just make a copy of the appropriate size, otherwise
|
|
// grow like an array.
|
|
let growthTarget: Int
|
|
if sufficientCapacity {
|
|
growthTarget = totalCount
|
|
} else {
|
|
growthTarget = Swift.max(
|
|
totalCount, _growArrayCapacity(nativeCapacity ?? 0))
|
|
}
|
|
self.grow(growthTarget)
|
|
}
|
|
|
|
_sanityCheck(self.uniqueNativeUnusedCapacity != nil,
|
|
"growth should produce uniqueness")
|
|
|
|
if other.isFastUTF8 {
|
|
other.withFastUTF8 { self.appendInPlace($0) }
|
|
return
|
|
}
|
|
_foreignAppendInPlace(other)
|
|
}
|
|
|
|
internal mutating func appendInPlace(_ other: UnsafeBufferPointer<UInt8>) {
|
|
self._object.nativeStorage.appendInPlace(other)
|
|
|
|
// We re-initialize from the modified storage to pick up new count, flags,
|
|
// etc.
|
|
self = _StringGuts(self._object.nativeStorage)
|
|
}
|
|
|
|
@inline(never) // slow-path
|
|
internal mutating func _foreignAppendInPlace(_ other: _StringGuts) {
|
|
_sanityCheck(!other.isFastUTF8)
|
|
_sanityCheck(self.uniqueNativeUnusedCapacity != nil)
|
|
|
|
var iter = String(other).utf8.makeIterator()
|
|
self._object.nativeStorage.appendInPlace(&iter)
|
|
|
|
// We re-initialize from the modified storage to pick up new count, flags,
|
|
// etc.
|
|
self = _StringGuts(self._object.nativeStorage)
|
|
}
|
|
}
|
|
|
|
// C String interop
|
|
extension _StringGuts {
|
|
@inlinable @inline(__always) // fast-path: already C-string compatible
|
|
internal func withCString<Result>(
|
|
_ body: (UnsafePointer<Int8>) throws -> Result
|
|
) rethrows -> Result {
|
|
if _slowPath(!_object.isFastZeroTerminated) {
|
|
return try _slowWithCString(body)
|
|
}
|
|
|
|
return try self.withFastUTF8 {
|
|
let ptr = $0._asCChar.baseAddress._unsafelyUnwrappedUnchecked
|
|
return try body(ptr)
|
|
}
|
|
}
|
|
|
|
@inline(never) // slow-path
|
|
@usableFromInline
|
|
internal func _slowWithCString<Result>(
|
|
_ body: (UnsafePointer<Int8>) throws -> Result
|
|
) rethrows -> Result {
|
|
_sanityCheck(!_object.isFastZeroTerminated)
|
|
return try String(self).utf8CString.withUnsafeBufferPointer {
|
|
let ptr = $0.baseAddress._unsafelyUnwrappedUnchecked
|
|
return try body(ptr)
|
|
}
|
|
}
|
|
}
|
|
|
|
extension _StringGuts {
|
|
// Copy UTF-8 contents. Returns number written or nil if not enough space.
|
|
// Contents of the buffer are unspecified if nil is returned.
|
|
@inlinable
|
|
internal func copyUTF8(into mbp: UnsafeMutableBufferPointer<UInt8>) -> Int? {
|
|
let ptr = mbp.baseAddress._unsafelyUnwrappedUnchecked
|
|
if _fastPath(self.isFastUTF8) {
|
|
return self.withFastUTF8 { utf8 in
|
|
guard utf8.count <= mbp.count else { return nil }
|
|
|
|
let utf8Start = utf8.baseAddress._unsafelyUnwrappedUnchecked
|
|
ptr.initialize(from: utf8Start, count: utf8.count)
|
|
return utf8.count
|
|
}
|
|
}
|
|
|
|
return _foreignCopyUTF8(into: mbp)
|
|
}
|
|
|
|
@_effects(releasenone)
|
|
@usableFromInline @inline(never) // slow-path
|
|
internal func _foreignCopyUTF8(
|
|
into mbp: UnsafeMutableBufferPointer<UInt8>
|
|
) -> Int? {
|
|
var ptr = mbp.baseAddress._unsafelyUnwrappedUnchecked
|
|
var numWritten = 0
|
|
for cu in String(self).utf8 {
|
|
guard numWritten < mbp.count else { return nil }
|
|
ptr.initialize(to: cu)
|
|
ptr += 1
|
|
numWritten += 1
|
|
}
|
|
|
|
return numWritten
|
|
}
|
|
|
|
internal var utf8Count: Int {
|
|
@inline(__always) get {
|
|
// TODO: Might be worth burning a bit for count-is-UTF-8, regardless of
|
|
// fast status.
|
|
if _fastPath(self.isFastUTF8) {
|
|
return self.count
|
|
}
|
|
return _foreignUTF8Count()
|
|
}
|
|
}
|
|
|
|
@_effects(releasenone)
|
|
@inline(never) // slow-path
|
|
internal func _foreignUTF8Count() -> Int {
|
|
return String(self).utf8.count
|
|
}
|
|
}
|
|
|
|
// Index
|
|
extension _StringGuts {
|
|
@usableFromInline
|
|
internal typealias Index = String.Index
|
|
|
|
@inlinable
|
|
internal var startIndex: String.Index {
|
|
@inline(__always) get { return Index(encodedOffset: 0) }
|
|
}
|
|
@inlinable
|
|
internal var endIndex: String.Index {
|
|
@inline(__always) get { return Index(encodedOffset: self.count) }
|
|
}
|
|
}
|