forked from rescript-lang/rescript
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathhash_set_gen.ml
164 lines (141 loc) · 4.51 KB
/
hash_set_gen.ml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
(* Copyright (C) 2015-2016 Bloomberg Finance L.P.
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU Lesser General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* In addition to the permissions granted to you by the LGPL, you may combine
* or link a "work that uses the Library" with a publicly distributed version
* of this file to produce a combined library or application, then distribute
* that combined work under the terms of your choosing, with no requirement
* to comply with the obligations normally placed on you by section 4 of the
* LGPL version 3 (or the corresponding section of a later version of the LGPL
* should you choose to use a later version).
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. *)
(* We do dynamic hashing, and resize the table and rehash the elements
when buckets become too long. *)
type 'a t =
{ mutable size: int; (* number of entries *)
mutable data: 'a list array; (* the buckets *)
initial_size: int; (* initial array size *)
}
let create initial_size =
let s = Ext_util.power_2_above 16 initial_size in
{ initial_size = s; size = 0; data = Array.make s [] }
let clear h =
h.size <- 0;
let len = Array.length h.data in
for i = 0 to len - 1 do
Array.unsafe_set h.data i []
done
let reset h =
h.size <- 0;
h.data <- Array.make h.initial_size [ ]
let copy h = { h with data = Array.copy h.data }
let length h = h.size
let iter f h =
let rec do_bucket = function
| [ ] ->
()
| k :: rest ->
f k ; do_bucket rest in
let d = h.data in
for i = 0 to Array.length d - 1 do
do_bucket (Array.unsafe_get d i)
done
let fold f h init =
let rec do_bucket b accu =
match b with
[ ] ->
accu
| k :: rest ->
do_bucket rest (f k accu) in
let d = h.data in
let accu = ref init in
for i = 0 to Array.length d - 1 do
accu := do_bucket (Array.unsafe_get d i) !accu
done;
!accu
let resize indexfun h =
let odata = h.data in
let osize = Array.length odata in
let nsize = osize * 2 in
if nsize < Sys.max_array_length then begin
let ndata = Array.make nsize [ ] in
h.data <- ndata; (* so that indexfun sees the new bucket count *)
let rec insert_bucket = function
[ ] -> ()
| key :: rest ->
let nidx = indexfun h key in
ndata.(nidx) <- key :: ndata.(nidx);
insert_bucket rest
in
for i = 0 to osize - 1 do
insert_bucket (Array.unsafe_get odata i)
done
end
let elements set =
fold (fun k acc -> k :: acc) set []
let stats h =
let mbl =
Array.fold_left (fun m b -> max m (List.length b)) 0 h.data in
let histo = Array.make (mbl + 1) 0 in
Array.iter
(fun b ->
let l = List.length b in
histo.(l) <- histo.(l) + 1)
h.data;
{Hashtbl.num_bindings = h.size;
num_buckets = Array.length h.data;
max_bucket_length = mbl;
bucket_histogram = histo }
let rec small_bucket_mem eq_key key lst =
match lst with
| [] -> false
| key1::rest ->
eq_key key key1 ||
match rest with
| [] -> false
| key2 :: rest ->
eq_key key key2 ||
match rest with
| [] -> false
| key3 :: rest ->
eq_key key key3 ||
small_bucket_mem eq_key key rest
let rec remove_bucket eq_key key (h : _ t) buckets =
match buckets with
| [ ] ->
[ ]
| k :: next ->
if eq_key k key
then begin h.size <- h.size - 1; next end
else k :: remove_bucket eq_key key h next
module type S =
sig
type key
type t
val create: int -> t
val clear : t -> unit
val reset : t -> unit
val copy: t -> t
val remove: t -> key -> unit
val add : t -> key -> unit
val of_array : key array -> t
val check_add : t -> key -> bool
val mem : t -> key -> bool
val iter: (key -> unit) -> t -> unit
val fold: (key -> 'b -> 'b) -> t -> 'b -> 'b
val length: t -> int
val stats: t -> Hashtbl.statistics
val elements : t -> key list
end