-
Notifications
You must be signed in to change notification settings - Fork 465
/
Copy pathbelt_internalSetBuckets.ml
157 lines (132 loc) · 4.44 KB
/
belt_internalSetBuckets.ml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
(* Copyright (C) 2017 Hongbo Zhang, Authors of ReScript
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU Lesser General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* In addition to the permissions granted to you by the LGPL, you may combine
* or link a "work that uses the Library" with a publicly distributed version
* of this file to produce a combined library or application, then distribute
* that combined work under the terms of your choosing, with no requirement
* to comply with the obligations normally placed on you by section 4 of the
* LGPL version 3 (or the corresponding section of a later version of the LGPL
* should you choose to use a later version).
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. *)
(* We do dynamic hashing, and resize the table and rehash the elements
when buckets become too long. *)
module C = Belt_internalBucketsType
(* TODO:
   The current implementation relies on the fact that the empty bucket
   value is `undefined` in both places; in theory, the two could differ.
*)
(* A single cell of a bucket chain: a singly linked list of keys. *)
type 'a bucket = {
(* The element stored in this cell. *)
mutable key : 'a;
(* The following cell of the same chain, or the empty [C.opt] value when
   this cell is the last one. *)
mutable next : 'a bucket C.opt
}
(* A set table: the generic [C.container] whose bucket slots hold
   ['a bucket] chains. *)
and ('hash, 'eq, 'a) t = ('hash, 'eq, 'a bucket) C.container
module A = Belt_Array
(* [copy x] builds a new container that reuses [x]'s [hash], [eq] and [size]
   and owns a freshly copied bucket array (see [copyBuckets]), so the bucket
   array and its cells are not shared with [x]. *)
let rec copy ( x : _ t) : _ t =
  let copied = copyBuckets x.buckets in
  { hash = x.hash;
    eq = x.eq;
    size = x.size;
    buckets = copied
  }
(* [copyBuckets buckets] allocates an array of the same length as [buckets]
   and fills every slot with a copy of the corresponding chain. *)
and copyBuckets ( buckets : _ bucket C.opt array) =
  let count = A.length buckets in
  let fresh = A.makeUninitializedUnsafe count in
  for slot = 0 to count - 1 do
    let chain = A.getUnsafe buckets slot in
    A.setUnsafe fresh slot (copyBucket chain)
  done;
  fresh
(* [copyBucket c] duplicates the chain starting at [c]. An empty chain is
   returned unchanged; otherwise a new head cell is allocated and the rest
   of the chain is appended to it by [copyAuxCont]. *)
and copyBucket c =
  match C.toOpt c with
  | Some first ->
    let head = { key = first.key; next = C.emptyOpt } in
    copyAuxCont first.next head;
    C.return head
  | None -> c
(* [copyAuxCont c prec] copies the remaining cells reachable from [c],
   linking each new cell after [prec] (the most recently copied cell).
   Stops when [c] is empty. *)
and copyAuxCont c prec =
  match C.toOpt c with
  | Some source ->
    let duplicate = { key = source.key; next = C.emptyOpt } in
    prec.next <- C.return duplicate;
    copyAuxCont source.next duplicate
  | None -> ()
(* [bucketLength accu buckets] returns [accu] plus the number of cells in
   the chain [buckets]. Call with [accu = 0] to get the chain length. *)
let rec bucketLength accu buckets =
  match C.toOpt buckets with
  | Some node -> bucketLength (accu + 1) node.next
  | None -> accu
(* [doBucketIter ~f buckets] applies the uncurried function [f] to the key
   of every cell of the chain, from the head to the last cell. *)
let rec doBucketIter ~f buckets =
  match C.toOpt buckets with
  | Some node ->
    (f node.key [@bs]);
    doBucketIter ~f node.next
  | None -> ()
(* [forEachU h f] visits every bucket slot of [h] in index order and applies
   the uncurried function [f] to each key stored in that slot's chain. *)
let forEachU h f =
  let table = h.C.buckets in
  let last = A.length table - 1 in
  for slot = 0 to last do
    let chain = A.getUnsafe table slot in
    doBucketIter ~f chain
  done
(* Curried variant of [forEachU]: wraps [f] as an uncurried callback. *)
let forEach h f =
  let visit = fun[@bs] key -> f key in
  forEachU h visit
(* [fillArray i arr cell] writes the keys of the chain starting at [cell]
   into [arr] at consecutive indices beginning at [i], and returns the index
   just past the last key written. *)
let rec fillArray i arr cell =
  A.setUnsafe arr i cell.key;
  let nextIndex = i + 1 in
  match C.toOpt cell.next with
  | Some rest -> fillArray nextIndex arr rest
  | None -> nextIndex
(* [toArray h] returns an array of length [h.size] holding the keys of [h],
   gathered slot by slot and, within a slot, in chain order. *)
let toArray h =
  let table = h.C.buckets in
  let result = A.makeUninitializedUnsafe h.C.size in
  (* Next free index in [result]. *)
  let filled = ref 0 in
  for slot = 0 to A.length table - 1 do
    match C.toOpt (A.getUnsafe table slot) with
    | Some head ->
      filled.contents <- fillArray filled.contents result head
    | None -> ()
  done;
  result
(* [doBucketFold ~f b accu] folds the uncurried function [f] over the keys of
   the chain [b], head first, threading the accumulator starting at [accu]. *)
let rec doBucketFold ~f b accu =
  match C.toOpt b with
  | Some node ->
    let updated = f accu node.key [@bs] in
    doBucketFold ~f node.next updated
  | None -> accu
(* [reduceU h init f] folds the uncurried function [f] over every key of [h],
   visiting bucket slots in index order, starting from [init]. *)
let reduceU h init f =
  let table = h.C.buckets in
  let acc = ref init in
  for slot = 0 to A.length table - 1 do
    let chain = A.getUnsafe table slot in
    acc.contents <- doBucketFold ~f chain acc.contents
  done;
  acc.contents
(* Curried variant of [reduceU]: wraps [f] as an uncurried callback. *)
let reduce h init f =
  let step = fun [@bs] acc key -> f acc key in
  reduceU h init step
(* [getMaxBucketLength h] returns the length of the longest chain among the
   bucket slots of [h], or 0 when there are no slots or all are empty. *)
let getMaxBucketLength h =
  A.reduceU h.C.buckets 0
    (fun[@bs] longest chain ->
       let len = bucketLength 0 chain in
       if len > longest then len else longest)
(* [getBucketHistogram h] returns an array whose entry [n] is the number of
   bucket slots of [h] whose chain has exactly [n] cells. The array has one
   entry per length from 0 up to the maximum chain length. *)
let getBucketHistogram h =
  let longest = getMaxBucketLength h in
  let counts = A.makeByU (longest + 1) (fun[@bs] _ -> 0) in
  let tally = fun[@bs] chain ->
    let len = bucketLength 0 chain in
    let seen = A.getUnsafe counts len in
    A.setUnsafe counts len (seen + 1)
  in
  A.forEachU h.C.buckets tally;
  counts
(* [logStats h] logs, via [Js.log], an object with the number of stored
   elements ([bindings]), the number of bucket slots ([buckets]) and the
   chain-length histogram ([histogram]). *)
let logStats h =
  let histogram = getBucketHistogram h in
  let bindings = h.C.size in
  let buckets = A.length h.C.buckets in
  Js.log [%obj { bindings; buckets; histogram }]