Charles Hu c01e9dadee
rdar://107955097 (FoundationPreview: Batch move string API (continued)) (#34)
* rdar://107955097 (FoundationPreview: Batch move string API (continued))

- Move localized uppercase and lowercase to FoundationLocalization
- if-def out of CharacterSet from FoundationPreview. It's not implemented at all there, and having a no-op stub is misleading

* rdar://107955097 (FoundationPreview: Batch move string API (continued))

- Move components separated by string and range of string functions

* rdar://107955097 (FoundationPreview: Batch move string API (continued))

Enable snake case options for JSON encoder and decoder. We haven't been able to enable this option because it needed `CharacterSet`, which hasn't been properly implemented for FoundationPreview. Now that we have `BuiltInUnicodeScalarSet`, which mirrors `CharacterSet`, we can switch to that and enable the options.

* rdar://107955097 (FoundationPreview: Batch move string API (continued))

- Move `StringProtocol.lineRange(for:)` and `paragraphRange(for:)` to FoundationEssentials
- Rename String+Regex.swift to RegexPatternCache.swift
- Consolidate extensions on various String family members and remove one redundant swift file

---------

Co-authored-by: I-Ting Tina Liu <iting_liu@apple.com>
2023-04-17 18:23:51 -07:00

122 lines
4.6 KiB
Swift

//===----------------------------------------------------------------------===//
//
// This source file is part of the Swift.org open source project
//
// Copyright (c) 2014 - 2017 Apple Inc. and the Swift project authors
// Licensed under Apache License v2.0 with Runtime Library Exception
//
// See https://swift.org/LICENSE.txt for license information
// See https://swift.org/CONTRIBUTORS.txt for the list of Swift project authors
//
//===----------------------------------------------------------------------===//
@available(macOS 10.10, iOS 8.0, watchOS 2.0, tvOS 9.0, *)
extension String {
func _capitalized() -> String {
var new = ""
new.reserveCapacity(utf8.count)
let uppercaseSet = BuiltInUnicodeScalarSet.uppercaseLetters
let lowercaseSet = BuiltInUnicodeScalarSet.lowercaseLetters
let cfcaseIgnorableSet = BuiltInUnicodeScalarSet.caseIgnorables
var isLastCased = false
for scalar in unicodeScalars {
let properties = scalar.properties
if uppercaseSet.contains(scalar) {
new += isLastCased ? properties.lowercaseMapping : String(scalar)
isLastCased = true
} else if lowercaseSet.contains(scalar) {
new += isLastCased ? String(scalar) : properties.titlecaseMapping
isLastCased = true
} else if !cfcaseIgnorableSet.contains(scalar) {
// We only use a subset of case-ignorable characters as defined in CF instead of the full set of characters satisfying `property.isCaseIgnorable` for compatibility reasons
new += String(scalar)
isLastCased = false
} else {
new += String(scalar)
}
}
return new
}
/// Creates a new string equivalent to the given bytes interpreted in the
/// specified encoding.
///
/// - Parameters:
/// - bytes: A sequence of bytes to interpret using `encoding`.
/// - encoding: The ecoding to use to interpret `bytes`.
public init?<S: Sequence>(bytes: __shared S, encoding: Encoding)
where S.Iterator.Element == UInt8
{
#if FOUNDATION_FRAMEWORK // TODO: Move init?(bytes:encoding) to Swift
func makeString(bytes: UnsafeBufferPointer<UInt8>) -> String? {
if encoding == .utf8 || encoding == .ascii,
let str = String._tryFromUTF8(bytes) {
if encoding == .utf8 || (encoding == .ascii && str._guts._isContiguousASCII) {
return str
}
}
if let ns = NSString(
bytes: bytes.baseAddress.unsafelyUnwrapped, length: bytes.count, encoding: encoding.rawValue) {
return String._unconditionallyBridgeFromObjectiveC(ns)
} else {
return nil
}
}
if let string = (bytes.withContiguousStorageIfAvailable(makeString) ??
Array(bytes).withUnsafeBufferPointer(makeString)) {
self = string
} else {
return nil
}
#else
guard encoding == .utf8 || encoding == .ascii else {
return nil
}
func makeString(buffer: UnsafeBufferPointer<UInt8>) -> String? {
if let string = String._tryFromUTF8(buffer),
(encoding == .utf8 || (encoding == .ascii && string._guts._isContiguousASCII)) {
return string
}
return buffer.withMemoryRebound(to: CChar.self) { ptr in
guard let address = ptr.baseAddress else {
return nil
}
return String(validatingUTF8: address)
}
}
if let string = bytes.withContiguousStorageIfAvailable(makeString) ??
Array(bytes).withUnsafeBufferPointer(makeString) {
self = string
} else {
return nil
}
#endif // FOUNDATION_FRAMEWORK
}
/// Returns a `String` initialized by converting given `data` into
/// Unicode characters using a given `encoding`.
public init?(data: __shared Data, encoding: Encoding) {
if encoding == .utf8 || encoding == .ascii,
let str = data.withUnsafeBytes({
String._tryFromUTF8($0.bindMemory(to: UInt8.self))
}) {
if encoding == .utf8 || (encoding == .ascii && str._guts._isContiguousASCII) {
self = str
return
}
}
#if FOUNDATION_FRAMEWORK
guard let s = NSString(data: data, encoding: encoding.rawValue) else { return nil }
self = String._unconditionallyBridgeFromObjectiveC(s)
#else
return nil
#endif // FOUNDATION_FRAMEWORK
}
}