-
Notifications
You must be signed in to change notification settings - Fork 10.4k
/
Copy pathCharacterRecognizer.swift
97 lines (88 loc) · 4.13 KB
/
CharacterRecognizer.swift
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
//===--- StringEdits.swift ------------------------------------------------===//
//
// This source file is part of the Swift.org open source project
//
// Copyright (c) 2014 - 2023 Apple Inc. and the Swift project authors
// Licensed under Apache License v2.0 with Runtime Library Exception
//
// See https://swift.org/LICENSE.txt for license information
// See https://swift.org/CONTRIBUTORS.txt for the list of Swift project authors
//
//===----------------------------------------------------------------------===//
import TestsUtils
public var benchmarks: [BenchmarkInfo] {
guard #available(macOS 9999, iOS 9999, watchOS 9999, tvOS 9999, *) else {
return []
}
return [
BenchmarkInfo(
name: "CharacterRecognizer.mixed",
runFunction: { n in
run(string: mixedString, n: n)
},
tags: [.api, .String],
setUpFunction: { blackHole(mixedString) }),
BenchmarkInfo(
name: "CharacterRecognizer.ascii",
runFunction: { n in
run(string: asciiString, n: n)
},
tags: [.api, .String],
setUpFunction: { blackHole(asciiString) }),
]
}
let mixedString = #"""
The powerful programming language that is also easy to learn.
손쉽게 학습할 수 있는 강력한 프로그래밍 언어.
🪙 A 🥞 short 🍰 piece 🫘 of 🌰 text 👨👨👧👧 with 👨👩👦 some 🚶🏽 emoji 🇺🇸🇨🇦 characters 🧈
some🔩times 🛺 placed 🎣 in 🥌 the 🆘 mid🔀dle 🇦🇶or🏁 around 🏳️🌈 a 🍇 w🍑o🥒r🥨d
Unicode is such fun!
U̷n̷i̷c̷o̴d̴e̷ ̶i̸s̷ ̸s̵u̵c̸h̷ ̸f̵u̷n̴!̵
U̴̡̲͋̾n̵̻̳͌ì̶̠̕c̴̭̈͘ǫ̷̯͋̊d̸͖̩̈̈́ḛ̴́ ̴̟͎͐̈i̴̦̓s̴̜̱͘ ̶̲̮̚s̶̙̞͘u̵͕̯̎̽c̵̛͕̜̓h̶̘̍̽ ̸̜̞̿f̵̤̽ṷ̴͇̎͘ń̷͓̒!̷͍̾̚
U̷̢̢̧̨̼̬̰̪͓̞̠͔̗̼̙͕͕̭̻̗̮̮̥̣͉̫͉̬̲̺͍̺͊̂ͅ\#
n̶̨̢̨̯͓̹̝̲̣̖̞̼̺̬̤̝̊̌́̑̋̋͜͝ͅ\#
ḭ̸̦̺̺͉̳͎́͑\#
c̵̛̘̥̮̙̥̟̘̝͙̤̮͉͔̭̺̺̅̀̽̒̽̏̊̆͒͌̂͌̌̓̈́̐̔̿̂͑͠͝͝ͅ\#
ö̶̱̠̱̤̙͚͖̳̜̰̹̖̣̻͎͉̞̫̬̯͕̝͔̝̟̘͔̙̪̭̲́̆̂͑̌͂̉̀̓́̏̎̋͗͛͆̌̽͌̄̎̚͝͝͝͝ͅ\#
d̶̨̨̡̡͙̟͉̱̗̝͙͍̮͍̘̮͔͑\#
e̶̢͕̦̜͔̘̘̝͈̪̖̺̥̺̹͉͎͈̫̯̯̻͑͑̿̽͂̀̽͋́̎̈́̈̿͆̿̒̈́̽̔̇͐͛̀̓͆̏̾̀̌̈́̆̽̕ͅ
"""#
let _asciiString = #"""
Swift is a high-performance system programming language. It has a clean
and modern syntax, offers seamless access to existing C and Objective-C code
and frameworks, and is memory safe by default.
Although inspired by Objective-C and many other languages, Swift is not itself
a C-derived language. As a complete and independent language, Swift packages
core features like flow control, data structures, and functions, with
high-level constructs like objects, protocols, closures, and generics. Swift
embraces modules, eliminating the need for headers and the code duplication
they entail.
Swift toolchains are created using the script
[build-toolchain](https://github.com/apple/swift/blob/main/utils/build-toolchain).
This script is used by swift.org's CI to produce snapshots and can allow for
one to locally reproduce such builds for development or distribution purposes.
A typical invocation looks like the following:
```
$ ./swift/utils/build-toolchain $BUNDLE_PREFIX
```
where ``$BUNDLE_PREFIX`` is a string that will be prepended to the build date
to give the bundle identifier of the toolchain's ``Info.plist``. For instance,
if ``$BUNDLE_PREFIX`` was ``com.example``, the toolchain produced will have
the bundle identifier ``com.example.YYYYMMDD``. It will be created in the
directory you run the script with a filename of the form:
``swift-LOCAL-YYYY-MM-DD-a-osx.tar.gz``.
"""#
let asciiString = String(repeating: _asciiString, count: 10)
@available(macOS 9999, iOS 9999, watchOS 9999, tvOS 9999, *)
func run(string: String, n: Int) {
var state = Unicode._CharacterRecognizer()
var c = 0
for _ in 0 ..< n {
for scalar in string.unicodeScalars {
if state.hasBreak(before: scalar) {
c += 1
}
}
}
blackHole(c)
}