mirror of
https://github.com/apple/swift.git
synced 2025-12-14 20:36:38 +01:00
226 lines
6.6 KiB
Swift
226 lines
6.6 KiB
Swift
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This source file is part of the Swift.org open source project
|
|
//
|
|
// Copyright (c) 2014 - 2015 Apple Inc. and the Swift project authors
|
|
// Licensed under Apache License v2.0 with Runtime Library Exception
|
|
//
|
|
// See http://swift.org/LICENSE.txt for license information
|
|
// See http://swift.org/CONTRIBUTORS.txt for the list of Swift project authors
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// Implementation Note: Because StaticString is used in the
|
|
// implementation of _precondition(), _fatalErrorMessage(), etc., we
|
|
// keep it extremely close to the bare metal. In particular, because
|
|
// we store only Builtin types, we are guaranteed that no assertions
|
|
// are involved in its construction. This feature is crucial for
|
|
// preventing infinite recursion even in non-asserting cases.
|
|
|
|
/// A simple string designed to represent text that is "knowable at
/// compile-time".
///
/// Logically speaking, each instance looks something like this::
///
///   enum StaticString {
///     case ASCII(start: UnsafePointer<UInt8>, length: Int)
///     case UTF8(start: UnsafePointer<UInt8>, length: Int)
///     case Scalar(UnicodeScalar)
///   }
public struct StaticString
  : _BuiltinUnicodeScalarLiteralConvertible,
    _BuiltinExtendedGraphemeClusterLiteralConvertible,
    _BuiltinStringLiteralConvertible,
    UnicodeScalarLiteralConvertible,
    ExtendedGraphemeClusterLiteralConvertible,
    StringLiteralConvertible,
    Printable,
    DebugPrintable {

  /// Either a pointer to the start of UTF-8 data, or an integer representation
  /// of a single Unicode scalar.
  var _startPtrOrData: Builtin.RawPointer

  /// If `_startPtrOrData` is a pointer, contains the length of the UTF-8 data
  /// in bytes.
  var _byteSize: Builtin.Word

  /// Extra flags:
  ///
  /// - bit 0: set to 0 if `_startPtrOrData` is a pointer, or to 1 if it is a
  ///   Unicode scalar.
  ///
  /// - bit 1: set to 1 if `_startPtrOrData` is a pointer and string data is
  ///   ASCII, or if `_startPtrOrData` is a Unicode scalar that is ASCII.
  var _flags: Builtin.Word

  /// A pointer to the beginning of UTF-8 code units
  ///
  /// Requires: `self` stores a pointer to either ASCII or UTF-8 code
  /// units.
  @transparent
  public var utf8Start: UnsafePointer<UInt8> {
    _precondition(
      hasPointerRepresentation,
      "StaticString should have pointer representation")
    return UnsafePointer(_startPtrOrData)
  }

  /// The stored Unicode scalar value
  ///
  /// Requires: `self` stores a single Unicode scalar value.
  @transparent
  public var unicodeScalar: UnicodeScalar {
    _precondition(
      !hasPointerRepresentation,
      "StaticString should have Unicode scalar representation")
    // The scalar was stored by reinterpreting its integer value as a pointer;
    // reverse that here.
    return UnicodeScalar(UInt32(unsafeBitCast(_startPtrOrData, UWord.self)))
  }

  /// The length in bytes of the ASCII or UTF-8 code units that `self`
  /// points to.
  ///
  /// Requires: `self` stores a pointer to either ASCII or UTF-8 code
  /// units.
  @transparent
  public var byteSize: Word {
    _precondition(
      hasPointerRepresentation,
      "StaticString should have pointer representation")
    return Word(_byteSize)
  }

  /// `true` iff `self` stores a pointer to ASCII or UTF-8 code units
  @transparent
  public var hasPointerRepresentation: Bool {
    return (UWord(_flags) & 0x1) == 0
  }

  /// `true` if `self` stores a pointer to ASCII code units.
  ///
  /// If `self` stores a single Unicode scalar value, the value of
  /// `isASCII` is unspecified.
  @transparent
  public var isASCII: Bool {
    return (UWord(_flags) & 0x2) != 0
  }

  /// Invoke `body` with a buffer containing the UTF-8 code units of
  /// `self`.
  ///
  /// This method works regardless of what `self` stores.  The buffer
  /// passed to `body` is only valid for the duration of the call when
  /// `self` stores a Unicode scalar, because it then refers to a local
  /// temporary.
  public func withUTF8Buffer<R>(body: (UnsafeBufferPointer<UInt8>) -> R) -> R {
    if hasPointerRepresentation {
      return body(UnsafeBufferPointer(start: utf8Start, count: Int(byteSize)))
    } else {
      // Pack the UTF-8 encoding of the scalar into an integer, with the
      // first code unit in the least significant byte.  A scalar encodes
      // to at most four UTF-8 code units, so 8 bytes is always enough.
      var buffer: UInt64 = 0
      var i = 0
      var sink = SinkOf<UInt8> {
        (byte) in
        buffer = buffer | (UInt64(byte) << (UInt64(i) * 8))
        ++i
      }
      UTF8.encode(unicodeScalar, output: &sink)
      // `body` reads the integer's bytes in memory order, so make sure the
      // least significant byte comes first on every platform.  This is a
      // no-op on little-endian targets.
      buffer = buffer.littleEndian
      return body(UnsafeBufferPointer(
        start: UnsafePointer(Builtin.addressof(&buffer)),
        count: i))
    }
  }

  /// Return a `String` representing the same sequence of Unicode
  /// scalar values as `self` does.
  @transparent
  public var stringValue: String {
    return withUTF8Buffer {
      (buffer) in
      return String._fromWellFormedCodeUnitSequence(UTF8.self, input: buffer)
    }
  }

  /// Create an empty instance.
  @transparent
  public init() {
    self = ""
  }

  /// Create an instance that points at `byteSize` bytes of UTF-8 data
  /// beginning at `start`; `isASCII` is recorded in bit 1 of `_flags`.
  @transparent
  init(
    start: Builtin.RawPointer, byteSize: Builtin.Word, isASCII: Builtin.Int1
  ) {
    self._startPtrOrData = start
    self._byteSize = byteSize
    // Bit 0 stays clear: this is the pointer representation.
    self._flags = Bool(isASCII) ? 0x2.value : 0x0.value
  }

  /// Create an instance that stores the single Unicode scalar
  /// `unicodeScalar` directly in place of a pointer.
  @transparent
  init(
    unicodeScalar: Builtin.Int32
  ) {
    self._startPtrOrData =
      unsafeBitCast(UWord(UInt32(unicodeScalar)), COpaquePointer.self)._rawValue
    self._byteSize = 0.value
    // Bit 0 marks the scalar representation; bit 1 records whether the
    // scalar is ASCII.
    self._flags = UnicodeScalar(unicodeScalar).isASCII() ? 0x3.value : 0x1.value
  }

  /// Create an instance storing the Unicode scalar `value`.
  @effects(readonly)
  @transparent
  public init(_builtinUnicodeScalarLiteral value: Builtin.Int32) {
    self = StaticString(unicodeScalar: value)
  }

  /// Create an instance initialized to `value`.
  @effects(readonly)
  @transparent
  public init(unicodeScalarLiteral value: StaticString) {
    self = value
  }

  /// Create an instance pointing at `byteSize` bytes of UTF-8 data
  /// beginning at `start`.  Forwards to `init(_builtinStringLiteral:...)`.
  @effects(readonly)
  @transparent
  public init(
    _builtinExtendedGraphemeClusterLiteral start: Builtin.RawPointer,
    byteSize: Builtin.Word,
    isASCII: Builtin.Int1
  ) {
    self = StaticString(
      _builtinStringLiteral: start,
      byteSize: byteSize,
      isASCII: isASCII
    )
  }

  /// Create an instance initialized to `value`.
  @effects(readonly)
  @transparent
  public init(extendedGraphemeClusterLiteral value: StaticString) {
    self = value
  }

  /// Create an instance pointing at `byteSize` bytes of UTF-8 data
  /// beginning at `start`.
  @effects(readonly)
  @transparent
  public init(
    _builtinStringLiteral start: Builtin.RawPointer,
    byteSize: Builtin.Word,
    isASCII: Builtin.Int1
  ) {
    self = StaticString(start: start, byteSize: byteSize, isASCII: isASCII)
  }

  /// Create an instance initialized to `value`.
  @effects(readonly)
  @transparent
  public init(stringLiteral value: StaticString) {
    self = value
  }

  /// A textual representation of `self`.
  public var description: String {
    return self.stringValue
  }

  /// A textual representation of `self`, suitable for debugging.
  public var debugDescription: String {
    return self.stringValue.debugDescription
  }
}
|