mirror of
https://github.com/apple/swift.git
synced 2025-12-21 12:14:44 +01:00
This necessary for ensuring the property that String doesn't keep
inaccessible memory alive. For example, before this change,
String(s.dropFirst().unicodeScalars)
would compile and produce a String that owned inaccessible memory.
Now it no longer compiles.
String's view's SubSequences are the same as the Substring's
view. E.g. String.UnicodeScalarView.SubSequence is
Substring.UnicodeScalarView.
New compatibility inits added, to work around the fact that many
previously failable initializers are now non-failable.
605 lines
20 KiB
Plaintext
605 lines
20 KiB
Plaintext
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This source file is part of the Swift.org open source project
|
|
//
|
|
// Copyright (c) 2014 - 2017 Apple Inc. and the Swift project authors
|
|
// Licensed under Apache License v2.0 with Runtime Library Exception
|
|
//
|
|
// See https://swift.org/LICENSE.txt for license information
|
|
// See https://swift.org/CONTRIBUTORS.txt for the list of Swift project authors
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
extension String {
|
|
// FIXME(strings): at least temporarily remove it to see where it was applied
|
|
/// Creates a new string from the given substring.
|
|
///
|
|
/// - Parameter substring: A substring to convert to a standalone `String`
|
|
/// instance.
|
|
///
|
|
/// - Complexity: O(*n*), where *n* is the length of `substring`.
|
|
public init(_ substring: Substring) {
|
|
self = String(substring._slice)
|
|
}
|
|
}
|
|
|
|
/// A slice of a string.
|
|
///
|
|
/// When you create a slice of a string, a `Substring` instance is the result.
|
|
/// Operating on substrings is fast and efficient because a substring shares
|
|
/// its storage with the original string. The `Substring` type presents the
|
|
/// same interface as `String`, so you can avoid or defer any copying of the
|
|
/// string's contents.
|
|
///
|
|
/// The following example creates a `greeting` string, and then finds the
|
|
/// substring of the first sentence:
|
|
///
|
|
/// let greeting = "Hi there! It's nice to meet you! 👋"
|
|
/// let endOfSentence = greeting.index(of: "!")!
|
|
/// let firstSentence = greeting[...endOfSentence]
|
|
/// // firstSentence == "Hi there!"
|
|
///
|
|
/// You can perform many string operations on a substring. Here, we find the
|
|
/// length of the first sentence and create an uppercase version.
|
|
///
|
|
/// print("'\(firstSentence)' is \(firstSentence.count) characters long.")
|
|
/// // Prints "'Hi there!' is 9 characters long."
|
|
///
|
|
/// let shoutingSentence = firstSentence.uppercased()
|
|
/// // shoutingSentence == "HI THERE!"
|
|
///
|
|
/// Converting a Substring to a String
|
|
/// ==================================
|
|
///
|
|
/// This example defines a `rawData` string with some unstructured data, and
|
|
/// then uses the string's `prefix(while:)` method to create a substring of
|
|
/// the numeric prefix:
|
|
///
|
|
/// let rawInput = "126 a.b 22219 zzzzzz"
|
|
/// let numericPrefix = rawInput.prefix(while: { "0"..."9" ~= $0 })
|
|
/// // numericPrefix is the substring "126"
|
|
///
|
|
/// When you need to store a substring or pass it to a function that requires a
|
|
/// `String` instance, convert it using the `String.init(_:)` initializer.
|
|
///
|
|
/// _ = Int(numericPrefix, radix: 10)
|
|
/// // error: cannot convert value...
|
|
/// let prefix = Int(String(numericPrefix), radix: 10)
|
|
/// // prefix == 126
|
|
///
|
|
/// Calling this initializer copies the contents of the substring to a new
|
|
/// string.
|
|
///
|
|
/// - Important: Don't store substrings longer than you need them to perform a
|
|
/// specific operation. A substring holds a reference to the entire storage
|
|
/// of the string it comes from, not just to the portion it presents, even
|
|
/// when there is no other reference to the original string. Storing
|
|
/// substrings may, therefore, prolong the lifetime of string data that is
|
|
/// no longer otherwise accessible, which can appear to be memory leakage.
|
|
public struct Substring : StringProtocol {
|
|
public typealias Index = String.Index
|
|
public typealias IndexDistance = String.IndexDistance
|
|
public typealias SubSequence = Substring
|
|
|
|
internal var _slice: RangeReplaceableBidirectionalSlice<String>
|
|
|
|
/// Creates an empty substring.
|
|
public init() {
|
|
_slice = RangeReplaceableBidirectionalSlice()
|
|
}
|
|
|
|
internal init(_slice: RangeReplaceableBidirectionalSlice<String>) {
|
|
self._slice = _slice
|
|
}
|
|
|
|
/// Creates a substring with the specified bounds within the given string.
|
|
///
|
|
/// - Parameters:
|
|
/// - base: The string to create a substring of.
|
|
/// - bounds: The range of `base` to use for the substring. The lower and
|
|
/// upper bounds of `bounds` must be valid indices of `base`.
|
|
public init(_base base: String, _ bounds: Range<Index>) {
|
|
_slice = RangeReplaceableBidirectionalSlice(base: base, bounds: bounds)
|
|
}
|
|
|
|
internal init<R: RangeExpression>(
|
|
_base base: String, _ bounds: R
|
|
) where R.Bound == Index {
|
|
self.init(_base: base, bounds.relative(to: base))
|
|
}
|
|
|
|
public var startIndex: Index { return _slice.startIndex }
|
|
public var endIndex: Index { return _slice.endIndex }
|
|
|
|
public func index(after i: Index) -> Index {
|
|
_precondition(i < endIndex, "Cannot increment beyond endIndex")
|
|
_precondition(i >= startIndex, "Cannot increment an invalid index")
|
|
// FIXME(strings): slice types currently lack necessary bound checks
|
|
return _slice.index(after: i)
|
|
}
|
|
|
|
public func index(before i: Index) -> Index {
|
|
_precondition(i <= endIndex, "Cannot decrement an invalid index")
|
|
_precondition(i > startIndex, "Cannot decrement beyond startIndex")
|
|
// FIXME(strings): slice types currently lack necessary bound checks
|
|
return _slice.index(before: i)
|
|
}
|
|
|
|
public func index(_ i: Index, offsetBy n: IndexDistance) -> Index {
|
|
let result = _slice.index(i, offsetBy: n)
|
|
// FIXME(strings): slice types currently lack necessary bound checks
|
|
_precondition(
|
|
(_slice._startIndex ... _slice.endIndex).contains(result),
|
|
"Operation results in an invalid index")
|
|
return result
|
|
}
|
|
|
|
public func index(
|
|
_ i: Index, offsetBy n: IndexDistance, limitedBy limit: Index
|
|
) -> Index? {
|
|
let result = _slice.index(i, offsetBy: n, limitedBy: limit)
|
|
// FIXME(strings): slice types currently lack necessary bound checks
|
|
_precondition(result.map {
|
|
(_slice._startIndex ... _slice.endIndex).contains($0)
|
|
} ?? true,
|
|
"Operation results in an invalid index")
|
|
return result
|
|
}
|
|
|
|
public func distance(from start: Index, to end: Index) -> IndexDistance {
|
|
return _slice.distance(from: start, to: end)
|
|
}
|
|
|
|
public subscript(i: Index) -> Character {
|
|
return _slice[i]
|
|
}
|
|
|
|
public mutating func replaceSubrange<C>(
|
|
_ bounds: Range<Index>,
|
|
with newElements: C
|
|
) where C : Collection, C.Iterator.Element == Iterator.Element {
|
|
// FIXME(strings): slice types currently lack necessary bound checks
|
|
_slice.replaceSubrange(bounds, with: newElements)
|
|
}
|
|
|
|
% for Range in ['Range', 'ClosedRange']:
|
|
|
|
public mutating func replaceSubrange(
|
|
_ bounds: ${Range}<Index>, with newElements: Substring
|
|
) {
|
|
replaceSubrange(bounds, with: newElements._slice)
|
|
}
|
|
|
|
% end
|
|
|
|
/// Creates a string from the given Unicode code units in the specified
|
|
/// encoding.
|
|
///
|
|
/// - Parameters:
|
|
/// - codeUnits: A collection of code units encoded in the ecoding
|
|
/// specified in `sourceEncoding`.
|
|
/// - sourceEncoding: The encoding in which `codeUnits` should be
|
|
/// interpreted.
|
|
public init<C: Collection, Encoding: _UnicodeEncoding>(
|
|
decoding codeUnits: C, as sourceEncoding: Encoding.Type
|
|
) where C.Iterator.Element == Encoding.CodeUnit {
|
|
self.init(String(decoding: codeUnits, as: sourceEncoding))
|
|
}
|
|
|
|
/// Creates a string from the null-terminated, UTF-8 encoded sequence of
|
|
/// bytes at the given pointer.
|
|
///
|
|
/// - Parameter nullTerminatedUTF8: A pointer to a sequence of contiguous,
|
|
/// UTF-8 encoded bytes ending just before the first zero byte.
|
|
public init(cString nullTerminatedUTF8: UnsafePointer<CChar>) {
|
|
self.init(String(cString: nullTerminatedUTF8))
|
|
}
|
|
|
|
/// Creates a string from the null-terminated sequence of bytes at the given
|
|
/// pointer.
|
|
///
|
|
/// - Parameters:
|
|
/// - nullTerminatedCodeUnits: A pointer to a sequence of contiguous code
|
|
/// units in the encoding specified in `sourceEncoding`, ending just
|
|
/// before the first zero code unit.
|
|
/// - sourceEncoding: The encoding in which the code units should be
|
|
/// interpreted.
|
|
public init<Encoding: _UnicodeEncoding>(
|
|
decodingCString nullTerminatedCodeUnits: UnsafePointer<Encoding.CodeUnit>,
|
|
as sourceEncoding: Encoding.Type
|
|
) {
|
|
self.init(
|
|
String(decodingCString: nullTerminatedCodeUnits, as: sourceEncoding))
|
|
}
|
|
|
|
/// Calls the given closure with a pointer to the contents of the string,
|
|
/// represented as a null-terminated sequence of UTF-8 code units.
|
|
///
|
|
/// The pointer passed as an argument to `body` is valid only during the
|
|
/// execution of `withCString(_:)`. Do not store or return the pointer for
|
|
/// later use.
|
|
///
|
|
/// - Parameter body: A closure with a pointer parameter that points to a
|
|
/// null-terminated sequence of UTF-8 code units. If `body` has a return
|
|
/// value, that value is also used as the return value for the
|
|
/// `withCString(_:)` method. The pointer argument is valid only for the
|
|
/// duration of the method's execution.
|
|
/// - Returns: The return value, if any, of the `body` closure parameter.
|
|
public func withCString<Result>(
|
|
_ body: (UnsafePointer<CChar>) throws -> Result) rethrows -> Result {
|
|
return try _wholeString._core._withCSubstringAndLength(
|
|
in: startIndex.encodedOffset..<endIndex.encodedOffset,
|
|
encoding: UTF8.self) {
|
|
p, length in try p.withMemoryRebound(to: CChar.self, capacity: length) {
|
|
try body($0)
|
|
}
|
|
}
|
|
}
|
|
|
|
/// Calls the given closure with a pointer to the contents of the string,
|
|
/// represented as a null-terminated sequence of code units.
|
|
///
|
|
/// The pointer passed as an argument to `body` is valid only during the
|
|
/// execution of `withCString(encodedAs:_:)`. Do not store or return the
|
|
/// pointer for later use.
|
|
///
|
|
/// - Parameters:
|
|
/// - body: A closure with a pointer parameter that points to a
|
|
/// null-terminated sequence of code units. If `body` has a return
|
|
/// value, that value is also used as the return value for the
|
|
/// `withCString(encodedAs:_:)` method. The pointer argument is valid
|
|
/// only for the duration of the method's execution.
|
|
/// - targetEncoding: The encoding in which the code units should be
|
|
/// interpreted.
|
|
/// - Returns: The return value, if any, of the `body` closure parameter.
|
|
public func withCString<Result, TargetEncoding: _UnicodeEncoding>(
|
|
encodedAs targetEncoding: TargetEncoding.Type,
|
|
_ body: (UnsafePointer<TargetEncoding.CodeUnit>) throws -> Result
|
|
) rethrows -> Result {
|
|
return try _wholeString._core._withCSubstring(
|
|
in: startIndex.encodedOffset..<endIndex.encodedOffset,
|
|
encoding: targetEncoding, body)
|
|
}
|
|
}
|
|
|
|
extension Substring : _SwiftStringView {
|
|
var _persistentContent: String {
|
|
let wholeCore = _wholeString._core
|
|
let native = wholeCore.nativeBuffer
|
|
if _fastPath(native != nil) {
|
|
let wholeString = String(wholeCore)
|
|
let n = native._unsafelyUnwrappedUnchecked
|
|
if _fastPath(
|
|
n.start == wholeCore._baseAddress
|
|
&& n.usedCount == wholeCore.count
|
|
&& _slice.startIndex == wholeString.startIndex
|
|
&& _slice.endIndex == wholeString.endIndex
|
|
) {
|
|
return wholeString
|
|
}
|
|
}
|
|
var r = String()
|
|
r._core.append(_ephemeralContent._core)
|
|
_sanityCheck(r._core._owner !== _ephemeralContent._core._owner)
|
|
return r
|
|
}
|
|
|
|
public // @testable
|
|
var _ephemeralContent: String {
|
|
let wholeCore = _wholeString._core
|
|
let subCore : _StringCore = wholeCore[
|
|
startIndex.encodedOffset..<endIndex.encodedOffset]
|
|
// Check that we haven't allocated a new buffer for the result, if we have
|
|
// contiguous storage.
|
|
_sanityCheck(
|
|
subCore._owner === wholeCore._owner || !wholeCore.hasContiguousStorage)
|
|
|
|
return String(subCore)
|
|
}
|
|
|
|
internal
|
|
var _wholeString: String {
|
|
return _slice._base
|
|
}
|
|
}
|
|
|
|
extension Substring : CustomReflectable {
|
|
public var customMirror: Mirror {
|
|
return String(self).customMirror
|
|
}
|
|
}
|
|
|
|
extension Substring : CustomPlaygroundQuickLookable {
|
|
public var customPlaygroundQuickLook: PlaygroundQuickLook {
|
|
return String(self).customPlaygroundQuickLook
|
|
}
|
|
}
|
|
|
|
extension Substring : CustomStringConvertible {
|
|
public var description: String {
|
|
return String(self)
|
|
}
|
|
}
|
|
|
|
extension Substring : CustomDebugStringConvertible {
|
|
public var debugDescription: String {
|
|
return String(self).debugDescription
|
|
}
|
|
}
|
|
|
|
extension Substring : LosslessStringConvertible {
|
|
public init(_ content: String) {
|
|
self.init(_base: content, content.startIndex ..< content.endIndex)
|
|
}
|
|
}
|
|
|
|
extension StringProtocol {
|
|
public static func ==<R: StringProtocol>(lhs: Self, rhs: R) -> Bool {
|
|
return lhs._ephemeralString == rhs._ephemeralString
|
|
}
|
|
|
|
public static func !=<R: StringProtocol>(lhs: Self, rhs: R) -> Bool {
|
|
return lhs._ephemeralString != rhs._ephemeralString
|
|
}
|
|
}
|
|
|
|
extension StringProtocol {
|
|
public static func < <R: StringProtocol>(lhs: Self, rhs: R) -> Bool {
|
|
return lhs._ephemeralString < rhs._ephemeralString
|
|
}
|
|
|
|
public static func > <R: StringProtocol>(lhs: Self, rhs: R) -> Bool {
|
|
return rhs < lhs
|
|
}
|
|
|
|
public static func <= <R: StringProtocol>(lhs: Self, rhs: R) -> Bool {
|
|
return !(rhs < lhs)
|
|
}
|
|
|
|
public static func >= <R: StringProtocol>(lhs: Self, rhs: R) -> Bool {
|
|
return !(lhs < rhs)
|
|
}
|
|
}
|
|
|
|
extension StringProtocol {
|
|
public var hashValue : Int {
|
|
return self._ephemeralString.hashValue
|
|
}
|
|
}
|
|
|
|
% for (property, ViewPrefix) in [
|
|
% ('utf8', 'UTF8'),
|
|
% ('utf16', 'UTF16'),
|
|
% ('unicodeScalars', 'UnicodeScalar'),
|
|
% ('characters', 'Character')
|
|
% ]:
|
|
% View = ViewPrefix + 'View'
|
|
% RangeReplaceable = 'RangeReplaceable' if property == 'unicodeScalars' else ''
|
|
extension Substring {
|
|
public struct ${View} {
|
|
var _slice: ${RangeReplaceable}BidirectionalSlice<String.${View}>
|
|
}
|
|
}
|
|
|
|
extension Substring.${View} : BidirectionalCollection {
|
|
public typealias Index = String.Index
|
|
public typealias SubSequence = Substring.${View}
|
|
|
|
/// Creates an instance that slices `base` at `_bounds`.
|
|
internal init(_ base: String.${View}, _bounds: Range<Index>) {
|
|
_slice = ${RangeReplaceable}BidirectionalSlice(
|
|
base: String(base._core).${property},
|
|
bounds: _bounds)
|
|
}
|
|
|
|
/// The entire String onto whose slice this view is a projection.
|
|
internal var _wholeString: String {
|
|
return String(_slice._base._core)
|
|
}
|
|
|
|
public var startIndex: Index { return _slice.startIndex }
|
|
public var endIndex: Index { return _slice.endIndex }
|
|
public func index(after i: Index) -> Index {
|
|
return _slice.index(after: i)
|
|
}
|
|
public func index(before i: Index) -> Index {
|
|
return _slice.index(before: i)
|
|
}
|
|
public subscript(i: Index) -> String.${View}.Element {
|
|
return _slice[i]
|
|
}
|
|
public subscript(r: Range<Index>) -> SubSequence {
|
|
return Substring.${View}(_wholeString.${property}, _bounds: r)
|
|
}
|
|
}
|
|
|
|
extension Substring {
|
|
public var ${property}: ${View} {
|
|
get {
|
|
return ${View}(_wholeString.${property}, _bounds: startIndex..<endIndex)
|
|
}
|
|
set {
|
|
self = Substring(newValue)
|
|
}
|
|
}
|
|
|
|
/// Creates a Substring having the given content.
|
|
///
|
|
/// - Complexity: O(1)
|
|
public init(_ content: ${View}) {
|
|
self = content._wholeString[content.startIndex..<content.endIndex]
|
|
}
|
|
}
|
|
|
|
extension String {
|
|
% if property in ('utf8', 'utf16'):
|
|
/// Creates a String having the given content.
|
|
///
|
|
/// If `codeUnits` is an ill-formed code unit sequence, the result is `nil`.
|
|
///
|
|
/// - Complexity: O(N), where N is the length of the resulting `String`'s
|
|
/// UTF-16.
|
|
public init?(_ codeUnits: Substring.${View}) {
|
|
let wholeString = codeUnits._wholeString
|
|
guard
|
|
codeUnits.startIndex.samePosition(in: wholeString.unicodeScalars) != nil
|
|
&& codeUnits.endIndex.samePosition(in: wholeString.unicodeScalars) != nil
|
|
else { return nil }
|
|
self = String(Substring(codeUnits))
|
|
}
|
|
% else:
|
|
/// Creates a String having the given content.
|
|
///
|
|
/// - Complexity: O(N), where N is the length of the resulting `String`'s
|
|
/// UTF-16.
|
|
public init(_ content: Substring.${View}) {
|
|
self = String(Substring(content))
|
|
}
|
|
% end
|
|
}
|
|
% end
|
|
|
|
// FIXME: The other String views should be RangeReplaceable too.
|
|
extension Substring.UnicodeScalarView : RangeReplaceableCollection {
|
|
public init() { _slice = RangeReplaceableBidirectionalSlice.init() }
|
|
|
|
public mutating func replaceSubrange<C : Collection>(
|
|
_ target: Range<Index>, with replacement: C
|
|
) where C.Element == Element {
|
|
_slice.replaceSubrange(target, with: replacement)
|
|
}
|
|
}
|
|
|
|
#if _runtime(_ObjC)
|
|
|
|
extension Substring {
|
|
public func hasPrefix(_ prefix: String) -> Bool {
|
|
return String(self).hasPrefix(prefix)
|
|
}
|
|
|
|
public func hasSuffix(_ suffix: String) -> Bool {
|
|
return String(self).hasSuffix(suffix)
|
|
}
|
|
}
|
|
|
|
#endif
|
|
|
|
extension Substring : RangeReplaceableCollection {
|
|
public init<S : Sequence>(_ elements: S)
|
|
where S.Element == Character {
|
|
let e0 = elements as? _SwiftStringView
|
|
if _fastPath(e0 != nil), let e = e0 {
|
|
self = e._ephemeralContent[...]
|
|
}
|
|
else {
|
|
self = String(elements)[...]
|
|
}
|
|
}
|
|
|
|
public mutating func append<S : Sequence>(contentsOf elements: S)
|
|
where S.Element == Character {
|
|
var c = self._ephemeralContent._core
|
|
self = Substring()
|
|
|
|
let e0 = elements as? _SwiftStringView
|
|
if _fastPath(e0 != nil), let e1 = e0 {
|
|
c.append(contentsOf: e1._ephemeralContent.utf16)
|
|
self = String(c)[...]
|
|
}
|
|
else {
|
|
var s = String(c)
|
|
s.append(contentsOf: elements)
|
|
self = s[...]
|
|
}
|
|
}
|
|
}
|
|
|
|
extension Substring {
|
|
public func lowercased() -> String {
|
|
return String(self).lowercased()
|
|
}
|
|
|
|
public func uppercased() -> String {
|
|
return String(self).uppercased()
|
|
}
|
|
|
|
public func filter(
|
|
_ isIncluded: (Element) throws -> Bool
|
|
) rethrows -> String {
|
|
return try String(self.lazy.filter(isIncluded))
|
|
}
|
|
}
|
|
|
|
extension Substring : TextOutputStream {
|
|
public mutating func write(_ other: String) {
|
|
append(contentsOf: other)
|
|
}
|
|
}
|
|
|
|
extension Substring : TextOutputStreamable {
|
|
public func write<Target : TextOutputStream>(to target: inout Target) {
|
|
target.write(String(self))
|
|
}
|
|
}
|
|
|
|
extension Substring : ExpressibleByUnicodeScalarLiteral {
|
|
public init(unicodeScalarLiteral value: String) {
|
|
self.init(_base: value, value.startIndex ..< value.endIndex)
|
|
}
|
|
}
|
|
extension Substring : ExpressibleByExtendedGraphemeClusterLiteral {
|
|
public init(extendedGraphemeClusterLiteral value: String) {
|
|
self.init(_base: value, value.startIndex ..< value.endIndex)
|
|
}
|
|
}
|
|
|
|
extension Substring : ExpressibleByStringLiteral {
|
|
public init(stringLiteral value: String) {
|
|
self.init(_base: value, value.startIndex ..< value.endIndex)
|
|
}
|
|
}
|
|
|
|
//===--- String/Substring Slicing Support ---------------------------------===//
|
|
/// In Swift 3.2, in the absence of type context,
|
|
///
|
|
/// someString[someString.startIndex..<someString.endIndex]
|
|
///
|
|
/// was deduced to be of type `String`. Therefore have a more-specific
|
|
/// Swift-3-only `subscript` overload on `String` (and `Substring`) that
|
|
/// continues to produce `String`.
|
|
extension String {
|
|
@available(swift, introduced: 4)
|
|
public subscript(r: Range<Index>) -> Substring {
|
|
return Substring(
|
|
_slice: RangeReplaceableBidirectionalSlice(base: self, bounds: r))
|
|
}
|
|
|
|
@available(swift, obsoleted: 4)
|
|
public subscript(bounds: Range<Index>) -> String {
|
|
return String(characters[bounds])
|
|
}
|
|
|
|
@available(swift, obsoleted: 4)
|
|
public subscript(bounds: ClosedRange<Index>) -> String {
|
|
return String(characters[bounds])
|
|
}
|
|
}
|
|
|
|
extension Substring {
|
|
@available(swift, introduced: 4)
|
|
public subscript(r: Range<Index>) -> Substring {
|
|
return Substring(_slice: _slice[r])
|
|
}
|
|
|
|
@available(swift, obsoleted: 4)
|
|
public subscript(bounds: Range<Index>) -> String {
|
|
return String(characters[bounds])
|
|
}
|
|
|
|
@available(swift, obsoleted: 4)
|
|
public subscript(bounds: ClosedRange<Index>) -> String {
|
|
return String(characters[bounds])
|
|
}
|
|
}
|
|
//===----------------------------------------------------------------------===//
|