mirror of
https://github.com/apple/swift-foundation.git
synced 2025-05-23 22:13:35 +08:00
* (112770879) “Washington, D.c.” capitalized incorrectly Theoretically "." is a case-ignorable character, so "D.C." is conceptually the same as "DC", whose capitalized mapping would be "Dc". This behavior doesn't seem to align with real-world use cases well though. Workaround this by splitting the string with "." and titlecasing each substring individually. * (112770879) “Washington, D.c.” capitalized incorrectly, cont. For FoundationPreview: Move String comparison utilities from FoundationEssentials fo _FoundationInternals so they can be accessed from FoundationInternalization too.
164 lines
6.7 KiB
Swift
164 lines
6.7 KiB
Swift
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This source file is part of the Swift.org open source project
|
|
//
|
|
// Copyright (c) 2014 - 2017 Apple Inc. and the Swift project authors
|
|
// Licensed under Apache License v2.0 with Runtime Library Exception
|
|
//
|
|
// See https://swift.org/LICENSE.txt for license information
|
|
// See https://swift.org/CONTRIBUTORS.txt for the list of Swift project authors
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
// MARK: - Exported Types
|
|
@available(macOS 10.0, iOS 8.0, watchOS 2.0, tvOS 9.0, *)
|
|
extension String {
|
|
#if FOUNDATION_FRAMEWORK
|
|
public typealias CompareOptions = NSString.CompareOptions
|
|
#else
|
|
/// These options apply to the various search/find and comparison methods (except where noted).
|
|
public struct CompareOptions : OptionSet, Sendable {
|
|
public let rawValue: UInt
|
|
|
|
public init(rawValue: UInt) {
|
|
self.rawValue = rawValue
|
|
}
|
|
|
|
public static let caseInsensitive = CompareOptions(rawValue: 1)
|
|
/// Exact character-by-character equivalence
|
|
public static let literal = CompareOptions(rawValue: 2)
|
|
/// Search from end of source string
|
|
public static let backwards = CompareOptions(rawValue: 4)
|
|
/// Search is limited to start (or end, if `.backwards`) of source string
|
|
public static let anchored = CompareOptions(rawValue: 8)
|
|
/// Numbers within strings are compared using numeric value, that is,
|
|
/// Foo2.txt < Foo7.txt < Foo25.txt;
|
|
/// only applies to compare methods, not find
|
|
public static let numeric = CompareOptions(rawValue: 64)
|
|
/// If specified, ignores diacritics (o-umlaut == o)
|
|
public static let diacriticInsensitive = CompareOptions(rawValue: 128)
|
|
/// If specified, ignores width differences ('a' == UFF41)
|
|
public static let widthInsensitive = CompareOptions(rawValue: 256)
|
|
/// If specified, comparisons are forced to return either `.orderedAscending`
|
|
/// or `.orderedDescending` if the strings are equivalent but not strictly equal,
|
|
/// for stability when sorting (e.g. "aaa" > "AAA" with `.caseInsensitive` specified)
|
|
public static let forcedOrdering = CompareOptions(rawValue: 512)
|
|
/// The search string is treated as an ICU-compatible regular expression;
|
|
/// if set, no other options can apply except `.caseInsensitive` and `.anchored`
|
|
public static let regularExpression = CompareOptions(rawValue: 1024)
|
|
}
|
|
#endif // FOUNDATION_FRAMEWORK
|
|
}
|
|
|
|
@available(macOS 10.10, iOS 8.0, watchOS 2.0, tvOS 9.0, *)
|
|
extension String {
|
|
func _capitalized() -> String {
|
|
var new = ""
|
|
new.reserveCapacity(utf8.count)
|
|
|
|
let uppercaseSet = BuiltInUnicodeScalarSet.uppercaseLetters
|
|
let lowercaseSet = BuiltInUnicodeScalarSet.lowercaseLetters
|
|
let cfcaseIgnorableSet = BuiltInUnicodeScalarSet.caseIgnorables
|
|
|
|
var isLastCased = false
|
|
for scalar in unicodeScalars {
|
|
let properties = scalar.properties
|
|
if uppercaseSet.contains(scalar) {
|
|
new += isLastCased ? properties.lowercaseMapping : String(scalar)
|
|
isLastCased = true
|
|
} else if lowercaseSet.contains(scalar) {
|
|
new += isLastCased ? String(scalar) : properties.titlecaseMapping
|
|
isLastCased = true
|
|
} else if !cfcaseIgnorableSet.contains(scalar) {
|
|
// We only use a subset of case-ignorable characters as defined in CF instead of the full set of characters satisfying `property.isCaseIgnorable` for compatibility reasons
|
|
new += String(scalar)
|
|
isLastCased = false
|
|
} else {
|
|
new += String(scalar)
|
|
}
|
|
}
|
|
|
|
return new
|
|
}
|
|
|
|
// MARK: - Public API
|
|
|
|
/// Creates a new string equivalent to the given bytes interpreted in the
|
|
/// specified encoding.
|
|
///
|
|
/// - Parameters:
|
|
/// - bytes: A sequence of bytes to interpret using `encoding`.
|
|
/// - encoding: The encoding to use to interpret `bytes`.
|
|
public init?<S: Sequence>(bytes: __shared S, encoding: Encoding)
|
|
where S.Iterator.Element == UInt8
|
|
{
|
|
#if FOUNDATION_FRAMEWORK // TODO: Move init?(bytes:encoding) to Swift
|
|
func makeString(bytes: UnsafeBufferPointer<UInt8>) -> String? {
|
|
if encoding == .utf8 || encoding == .ascii,
|
|
let str = String._tryFromUTF8(bytes) {
|
|
if encoding == .utf8 || (encoding == .ascii && str._guts._isContiguousASCII) {
|
|
return str
|
|
}
|
|
}
|
|
|
|
if let ns = NSString(
|
|
bytes: bytes.baseAddress.unsafelyUnwrapped, length: bytes.count, encoding: encoding.rawValue) {
|
|
return String._unconditionallyBridgeFromObjectiveC(ns)
|
|
} else {
|
|
return nil
|
|
}
|
|
}
|
|
if let string = (bytes.withContiguousStorageIfAvailable(makeString) ??
|
|
Array(bytes).withUnsafeBufferPointer(makeString)) {
|
|
self = string
|
|
} else {
|
|
return nil
|
|
}
|
|
#else
|
|
guard encoding == .utf8 || encoding == .ascii else {
|
|
return nil
|
|
}
|
|
func makeString(buffer: UnsafeBufferPointer<UInt8>) -> String? {
|
|
if let string = String._tryFromUTF8(buffer),
|
|
(encoding == .utf8 || (encoding == .ascii && string._guts._isContiguousASCII)) {
|
|
return string
|
|
}
|
|
|
|
return buffer.withMemoryRebound(to: CChar.self) { ptr in
|
|
guard let address = ptr.baseAddress else {
|
|
return nil
|
|
}
|
|
return String(validatingUTF8: address)
|
|
}
|
|
}
|
|
|
|
if let string = bytes.withContiguousStorageIfAvailable(makeString) ??
|
|
Array(bytes).withUnsafeBufferPointer(makeString) {
|
|
self = string
|
|
} else {
|
|
return nil
|
|
}
|
|
#endif // FOUNDATION_FRAMEWORK
|
|
}
|
|
|
|
/// Returns a `String` initialized by converting given `data` into
|
|
/// Unicode characters using a given `encoding`.
|
|
public init?(data: __shared Data, encoding: Encoding) {
|
|
if encoding == .utf8 || encoding == .ascii,
|
|
let str = data.withUnsafeBytes({
|
|
$0.withMemoryRebound(to: UInt8.self, String._tryFromUTF8(_:))
|
|
}) {
|
|
if encoding == .utf8 || (encoding == .ascii && str._guts._isContiguousASCII) {
|
|
self = str
|
|
return
|
|
}
|
|
}
|
|
#if FOUNDATION_FRAMEWORK
|
|
guard let s = NSString(data: data, encoding: encoding.rawValue) else { return nil }
|
|
self = String._unconditionallyBridgeFromObjectiveC(s)
|
|
#else
|
|
return nil
|
|
#endif // FOUNDATION_FRAMEWORK
|
|
}
|
|
}
|