|
| 1 | +//===--- UTF16Decode.swift -------------------------------------------------===// |
| 2 | +// |
| 3 | +// This source file is part of the Swift.org open source project |
| 4 | +// |
| 5 | +// Copyright (c) 2014 - 2017 Apple Inc. and the Swift project authors |
| 6 | +// Licensed under Apache License v2.0 with Runtime Library Exception |
| 7 | +// |
| 8 | +// See https://swift.org/LICENSE.txt for license information |
| 9 | +// See https://swift.org/CONTRIBUTORS.txt for the list of Swift project authors |
| 10 | +// |
| 11 | +//===----------------------------------------------------------------------===// |
| 12 | + |
| 13 | +import TestsUtils |
| 14 | +import Foundation |
| 15 | + |
| 16 | +public let UTF16Decode = [ |
| 17 | + BenchmarkInfo( |
| 18 | + name: "UTF16Decode", |
| 19 | + runFunction: run_UTF16Decode, |
| 20 | + tags: [.validation, .api, .String]), |
| 21 | + BenchmarkInfo( |
| 22 | + name: "UTF16Decode_InitFromCustom_contiguous", |
| 23 | + runFunction: run_UTF16Decode_InitFromCustom_contiguous, |
| 24 | + tags: [.validation, .api, .String]), |
| 25 | + BenchmarkInfo( |
| 26 | + name: "UTF16Decode_InitFromCustom_contiguous_ascii", |
| 27 | + runFunction: run_UTF16Decode_InitFromCustom_contiguous_ascii, |
| 28 | + tags: [.validation, .api, .String]), |
| 29 | + BenchmarkInfo( |
| 30 | + name: "UTF16Decode_InitFromCustom_noncontiguous", |
| 31 | + runFunction: run_UTF16Decode_InitFromCustom_noncontiguous, |
| 32 | + tags: [.validation, .api, .String]), |
| 33 | + BenchmarkInfo( |
| 34 | + name: "UTF16Decode_InitFromCustom_noncontiguous_ascii", |
| 35 | + runFunction: run_UTF16Decode_InitFromCustom_noncontiguous_ascii, |
| 36 | + tags: [.validation, .api, .String]), |
| 37 | + BenchmarkInfo( |
| 38 | + name: "UTF16Decode_InitFromData", |
| 39 | + runFunction: run_UTF16Decode_InitFromData, |
| 40 | + tags: [.validation, .api, .String]), |
| 41 | + BenchmarkInfo( |
| 42 | + name: "UTF16Decode_InitDecoding", |
| 43 | + runFunction: run_UTF16Decode_InitDecoding, |
| 44 | + tags: [.validation, .api, .String]), |
| 45 | + BenchmarkInfo( |
| 46 | + name: "UTF16Decode_InitFromData_ascii", |
| 47 | + runFunction: run_UTF16Decode_InitFromData_ascii, |
| 48 | + tags: [.validation, .api, .String]), |
| 49 | + BenchmarkInfo( |
| 50 | + name: "UTF16Decode_InitDecoding_ascii", |
| 51 | + runFunction: run_UTF16Decode_InitDecoding_ascii, |
| 52 | + tags: [.validation, .api, .String]), |
| 53 | + BenchmarkInfo( |
| 54 | + name: "UTF16Decode_InitFromData_ascii_as_ascii", |
| 55 | + runFunction: run_UTF16Decode_InitFromData_ascii_as_ascii, |
| 56 | + tags: [.validation, .api, .String]), |
| 57 | +] |
| 58 | + |
| 59 | +typealias CodeUnit = UInt16 |
| 60 | + |
| 61 | +// 1-byte sequences |
| 62 | +// This test case is the longest as it's the most performance sensitive. |
| 63 | +let ascii = "Swift is a multi-paradigm, compiled programming language created for iOS, OS X, watchOS, tvOS and Linux development by Apple Inc. Swift is designed to work with Apple's Cocoa and Cocoa Touch frameworks and the large body of existing Objective-C code written for Apple products. Swift is intended to be more resilient to erroneous code (\"safer\") than Objective-C and also more concise. It is built with the LLVM compiler framework included in Xcode 6 and later and uses the Objective-C runtime, which allows C, Objective-C, C++ and Swift code to run within a single program." |
| 64 | +let asciiCodeUnits: [CodeUnit] = Array(ascii.utf16) |
| 65 | +let asciiData: Data = asciiCodeUnits.withUnsafeBytes { Data($0) } |
| 66 | + |
| 67 | +// 2-byte sequences |
| 68 | +let russian = "Ру́сский язы́к один из восточнославянских языков, национальный язык русского народа." |
| 69 | +// 3-byte sequences |
| 70 | +let japanese = "日本語(にほんご、にっぽんご)は、主に日本国内や日本人同士の間で使われている言語である。" |
| 71 | +// 4-byte sequences |
| 72 | +// Most commonly emoji, which are usually mixed with other text. |
| 73 | +let emoji = "Panda 🐼, Dog 🐶, Cat 🐱, Mouse 🐭." |
| 74 | + |
| 75 | +let allStrings: [[CodeUnit]] = [ascii, russian, japanese, emoji].map { Array($0.utf16) } |
| 76 | +let allStringsCodeUnits: [CodeUnit] = Array(allStrings.joined()) |
| 77 | +let allStringsData: Data = allStringsCodeUnits.withUnsafeBytes { Data($0) } |
| 78 | + |
| 79 | + |
| 80 | +@inline(never) |
| 81 | +public func run_UTF16Decode(_ N: Int) { |
| 82 | + let strings = allStrings |
| 83 | + |
| 84 | + func isEmpty(_ result: UnicodeDecodingResult) -> Bool { |
| 85 | + switch result { |
| 86 | + case .emptyInput: |
| 87 | + return true |
| 88 | + default: |
| 89 | + return false |
| 90 | + } |
| 91 | + } |
| 92 | + |
| 93 | + for _ in 1...200*N { |
| 94 | + for string in strings { |
| 95 | + var it = string.makeIterator() |
| 96 | + var utf16 = UTF16() |
| 97 | + while !isEmpty(utf16.decode(&it)) { } |
| 98 | + } |
| 99 | + } |
| 100 | +} |
| 101 | + |
| 102 | +@inline(never) |
| 103 | +public func run_UTF16Decode_InitFromData(_ N: Int) { |
| 104 | + let input = allStringsData |
| 105 | + for _ in 0..<200*N { |
| 106 | + blackHole(String(data: input, encoding: .utf16)) |
| 107 | + } |
| 108 | +} |
| 109 | +@inline(never) |
| 110 | +public func run_UTF16Decode_InitDecoding(_ N: Int) { |
| 111 | + let input: [CodeUnit] = allStringsCodeUnits |
| 112 | + for _ in 0..<200*N { |
| 113 | + blackHole(String(decoding: input, as: UTF16.self)) |
| 114 | + } |
| 115 | +} |
| 116 | + |
| 117 | +@inline(never) |
| 118 | +public func run_UTF16Decode_InitFromData_ascii(_ N: Int) { |
| 119 | + let input = asciiData |
| 120 | + for _ in 0..<1_000*N { |
| 121 | + blackHole(String(data: input, encoding: .utf16)) |
| 122 | + } |
| 123 | +} |
| 124 | +@inline(never) |
| 125 | +public func run_UTF16Decode_InitDecoding_ascii(_ N: Int) { |
| 126 | + let input = asciiCodeUnits |
| 127 | + for _ in 0..<1_000*N { |
| 128 | + blackHole(String(decoding: input, as: UTF16.self)) |
| 129 | + } |
| 130 | +} |
| 131 | + |
| 132 | +@inline(never) |
| 133 | +public func run_UTF16Decode_InitFromData_ascii_as_ascii(_ N: Int) { |
| 134 | + let input = asciiData |
| 135 | + for _ in 0..<1_000*N { |
| 136 | + blackHole(String(data: input, encoding: .ascii)) |
| 137 | + } |
| 138 | +} |
| 139 | + |
| 140 | +struct CustomContiguousCollection: Collection { |
| 141 | + let storage: [CodeUnit] |
| 142 | + typealias Index = Int |
| 143 | + typealias Element = CodeUnit |
| 144 | + |
| 145 | + init(_ codeUnits: [CodeUnit]) { self.storage = codeUnits } |
| 146 | + subscript(position: Int) -> Element { self.storage[position] } |
| 147 | + var startIndex: Index { 0 } |
| 148 | + var endIndex: Index { storage.count } |
| 149 | + func index(after i: Index) -> Index { i+1 } |
| 150 | + |
| 151 | + @inline(never) |
| 152 | + func withContiguousStorageIfAvailable<R>( |
| 153 | + _ body: (UnsafeBufferPointer<CodeUnit>) throws -> R |
| 154 | + ) rethrows -> R? { |
| 155 | + try storage.withContiguousStorageIfAvailable(body) |
| 156 | + } |
| 157 | +} |
| 158 | +struct CustomNoncontiguousCollection: Collection { |
| 159 | + let storage: [CodeUnit] |
| 160 | + typealias Index = Int |
| 161 | + typealias Element = CodeUnit |
| 162 | + |
| 163 | + init(_ codeUnits: [CodeUnit]) { self.storage = codeUnits } |
| 164 | + subscript(position: Int) -> Element { self.storage[position] } |
| 165 | + var startIndex: Index { 0 } |
| 166 | + var endIndex: Index { storage.count } |
| 167 | + func index(after i: Index) -> Index { i+1 } |
| 168 | + |
| 169 | + @inline(never) |
| 170 | + func withContiguousStorageIfAvailable<R>( |
| 171 | + _ body: (UnsafeBufferPointer<UInt8>) throws -> R |
| 172 | + ) rethrows -> R? { |
| 173 | + nil |
| 174 | + } |
| 175 | +} |
| 176 | +let allStringsCustomContiguous = CustomContiguousCollection(allStringsCodeUnits) |
| 177 | +let asciiCustomContiguous = CustomContiguousCollection(Array(ascii.utf16)) |
| 178 | +let allStringsCustomNoncontiguous = CustomNoncontiguousCollection(allStringsCodeUnits) |
| 179 | +let asciiCustomNoncontiguous = CustomNoncontiguousCollection(Array(ascii.utf16)) |
| 180 | + |
| 181 | +@inline(never) |
| 182 | +public func run_UTF16Decode_InitFromCustom_contiguous(_ N: Int) { |
| 183 | + let input = allStringsCustomContiguous |
| 184 | + for _ in 0..<200*N { |
| 185 | + blackHole(String(decoding: input, as: UTF16.self)) |
| 186 | + } |
| 187 | +} |
| 188 | +@inline(never) |
| 189 | +public func run_UTF16Decode_InitFromCustom_contiguous_ascii(_ N: Int) { |
| 190 | + let input = asciiCustomContiguous |
| 191 | + for _ in 0..<1_000*N { |
| 192 | + blackHole(String(decoding: input, as: UTF16.self)) |
| 193 | + } |
| 194 | +} |
| 195 | + |
| 196 | +@inline(never) |
| 197 | +public func run_UTF16Decode_InitFromCustom_noncontiguous(_ N: Int) { |
| 198 | + let input = allStringsCustomNoncontiguous |
| 199 | + for _ in 0..<200*N { |
| 200 | + blackHole(String(decoding: input, as: UTF16.self)) |
| 201 | + } |
| 202 | +} |
| 203 | +@inline(never) |
| 204 | +public func run_UTF16Decode_InitFromCustom_noncontiguous_ascii(_ N: Int) { |
| 205 | + let input = asciiCustomNoncontiguous |
| 206 | + for _ in 0..<1_000*N { |
| 207 | + blackHole(String(decoding: input, as: UTF16.self)) |
| 208 | + } |
| 209 | +} |
| 210 | + |
0 commit comments