Source file hashtbl_intf.ml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
(** Hashtbl is a reimplementation of the standard {{:
https://caml.inria.fr/pub/docs/manual-ocaml/libref/MoreLabels.Hashtbl.html}[MoreLabels.Hashtbl]}. Its
worst case time complexity is O(log(N)) for lookups and additions, unlike the standard
[MoreLabels.Hashtbl], which is O(N).
A hash table is implemented as an array of AVL trees (see [Avltree]). If
[growth_allowed] (default true) is false then [size] is the final size of the array;
the table can always hold more elements than [size], but they will all go into
tree nodes. If it is true (default) then the array will double in size when the number
of elements in the table reaches twice the size of the array. When this happens, all
existing elements will be reinserted, which can take a long time. If you care about
latency, set [size] and [growth_allowed=false] if possible.
In most cases, functions passed as arguments to hash table accessors must not mutate
the hash table while it is being accessed, as this will result in an exception. For
example, [iter] and [change] take a function [f] which must not modify [t]. In a few
cases, mutation is allowed, such as in [Hashtbl.find_and_call], where all access to
[t] is finished before the [~if_found] and [~if_not_found] arguments are invoked.
We have three kinds of hash table modules:
- [Hashtbl]
- [Hashtbl.Poly]
- [Key.Table] (a class of similar modules)
There are three kinds of hash-table functions:
- creation from nothing ([create], [of_alist])
- sexp converters ([t_of_sexp], [sexp_of_t], and [bin_io] too)
- accessors and mappers ([fold], [mem], [find], [map], [filter_map], ...)
Here is a table showing what classes of functions are available in each kind
of hash-table module:
{v
creation sexp-conv accessors
Hashtbl X
Hashtbl.Poly X X
Key.Table X X X'
v}
The entry marked with [X'] is there for historical reasons, and may be eliminated at
some point. The upshot is that one should use [Hashtbl] for accessors, [Hashtbl.Poly]
for hash-table creation and sexp conversion using polymorphic compare/hash, and
[Key.Table] for hash-table creation and sexp conversion using [Key.compare] and
[Key.hash].
{2:usage Usage}
For many students of OCaml, using hashtables is complicated by the
functors. Here are a few tips:
{ol
{- For a list of hashtable functions see {!Core.Hashtbl_intf.S}.}
{- To create a hashtable with string keys use [String.Table]:
{[
let table = String.Table.create () ~size:4 in
List.iter ~f:(fun (key, data) -> Hashtbl.set table ~key ~data)
[ ("A", 1); ("B", 2); ("C", 3); ];
Hashtbl.find table "C"
]}
Here 4 need only be a guess at the hashtable's future size. There are other similar
pre-made hashtables, e.g., [Int63.Table] or [Host_and_port.Table].
}
{- To create a hashtable with a custom key type use Hashable:
{[
module Key = struct
module T = struct
type t = String.t * Int63.t [@@deriving compare, hash, sexp]
end
include T
include Hashable.Make (T)
end
let table = Key.Table.create () ~size:4 in
List.iter ~f:(fun (key, data) -> Hashtbl.set table ~key ~data)
[ (("pi", Int63.zero), 3.14159);
(("e", Int63.minus_one), 2.71828);
(("Euler", Int63.one), 0.577215);
];
Hashtbl.find table ("pi", Int63.zero)
]}
Performance {i may} improve if you define [equal] and [hash] explicitly, e.g.:
{[
let equal (x, y) (x', y') = String.(=) x x' && Int63.(=) y y'
let hash (x, y) = String.hash x + Int63.hash y * 65599
]}
}
}
*)
open! Import
module Binable = Binable0
module Hashtbl = Base.Hashtbl
module type Key_plain = Hashtbl.Key.S
module Hashable = Base.Hashable
module Merge_into_action = Base.Hashtbl.Merge_into_action
module type Hashable = Base.Hashable.Hashable
module type Key = sig
type t [@@deriving sexp]
include Key_plain with type t := t
end
module type Key_binable = sig
type t [@@deriving bin_io, sexp]
include Key with type t := t
end
module type Key_stable = sig
type t [@@deriving bin_io, sexp, stable_witness]
include Key_binable with type t := t
end
module type Creators = Hashtbl.Private.Creators_generic
module type Accessors = sig
include Hashtbl.Accessors
val validate : name:('a key -> string) -> 'b Validate.check -> ('a, 'b) t Validate.check
end
module type Multi = Hashtbl.Multi
type ('key, 'data, 'z) create_options_with_first_class_module =
('key, 'data, 'z) Hashtbl.create_options
type ('key, 'data, 'z) create_options_without_hashable =
('key, 'data, 'z) Hashtbl.Private.create_options_without_first_class_module
type ('key, 'data, 'z) create_options_with_hashable =
?growth_allowed:bool (** defaults to [true] *)
-> ?size:int (** initial size -- default 0 *)
-> hashable:'key Hashable.t
-> 'z
module type M_quickcheck = sig
type t [@@deriving compare, hash, quickcheck, sexp_of]
end
module type For_deriving = sig
include Base.Hashtbl.For_deriving
module type M_quickcheck = M_quickcheck
val quickcheck_generator_m__t
: (module M_quickcheck with type t = 'k)
-> 'v Base_quickcheck.Generator.t
-> ('k, 'v) t Quickcheck.Generator.t
val quickcheck_observer_m__t
: (module M_quickcheck with type t = 'k)
-> 'v Quickcheck.Observer.t
-> ('k, 'v) t Quickcheck.Observer.t
val quickcheck_shrinker_m__t
: (module M_quickcheck with type t = 'k)
-> 'v Quickcheck.Shrinker.t
-> ('k, 'v) t Quickcheck.Shrinker.t
end
module type S_plain = sig
type key
type ('a, 'b) hashtbl
type 'b t = (key, 'b) hashtbl [@@deriving equal, sexp_of]
type ('a, 'b) t_ = 'b t
type 'a key_ = key
val hashable : key Hashable.t
include Invariant.S1 with type 'b t := 'b t
include
Creators
with type ('a, 'b) t := ('a, 'b) t_
with type 'a key := 'a key_
with type ('key, 'data, 'z) create_options :=
('key, 'data, 'z) create_options_without_hashable
module Provide_of_sexp
(Key : sig
type t [@@deriving of_sexp]
end
with type t := key) : sig
type _ t [@@deriving of_sexp]
end
with type 'a t := 'a t
module Provide_bin_io
(Key : sig
type t [@@deriving bin_io]
end
with type t := key) : sig
type 'a t [@@deriving bin_io]
end
with type 'a t := 'a t
end
module type S = sig
include S_plain
include sig
type _ t [@@deriving of_sexp]
end
with type 'a t := 'a t
end
module type S_binable = sig
include S
include Binable.S1 with type 'v t := 'v t
end
module type S_stable = sig
include S_binable
type nonrec 'a t = 'a t [@@deriving stable_witness]
end
module type Hashtbl = sig
include Hashtbl.S_without_submodules (** @inline *)
val validate : name:('a key -> string) -> 'b Validate.check -> ('a, 'b) t Validate.check
module Using_hashable : sig
include
Creators
with type ('a, 'b) t := ('a, 'b) t
with type 'a key := 'a key
with type ('a, 'b, 'z) create_options := ('a, 'b, 'z) create_options_with_hashable
end
module Poly : sig
type nonrec ('a, 'b) t = ('a, 'b) t [@@deriving bin_io]
include Hashtbl.S_poly with type ('a, 'b) t := ('a, 'b) t
val validate
: name:('a key -> string)
-> 'b Validate.check
-> ('a, 'b) t Validate.check
end
module type Key_plain = Key_plain
module type Key = Key
module type Key_binable = Key_binable
module type Key_stable = Key_stable
module type S_plain = S_plain with type ('a, 'b) hashtbl = ('a, 'b) t
module type S = S with type ('a, 'b) hashtbl = ('a, 'b) t
module type S_binable = S_binable with type ('a, 'b) hashtbl = ('a, 'b) t
module type S_stable = S_stable with type ('a, 'b) hashtbl = ('a, 'b) t
module Make_plain (Key : Key_plain) : S_plain with type key = Key.t
module Make (Key : Key) : S with type key = Key.t
module Make_binable (Key : Key_binable) : S_binable with type key = Key.t
module Make_stable (Key : Key_stable) : S_stable with type key = Key.t
module Make_plain_with_hashable (T : sig
module Key : Key_plain
val hashable : Key.t Hashable.t
end) : S_plain with type key = T.Key.t
module Make_with_hashable (T : sig
module Key : Key
val hashable : Key.t Hashable.t
end) : S with type key = T.Key.t
module Make_binable_with_hashable (T : sig
module Key : Key_binable
val hashable : Key.t Hashable.t
end) : S_binable with type key = T.Key.t
module Make_stable_with_hashable (T : sig
module Key : Key_stable
val hashable : Key.t Hashable.t
end) : S_stable with type key = T.Key.t
module M (K : T.T) : sig
type nonrec 'v t = (K.t, 'v) t
end
module Hashable = Hashable
module Merge_into_action = Merge_into_action
val hashable : ('key, _) t -> 'key Hashable.t
module type For_deriving = For_deriving
include For_deriving with type ('a, 'b) t := ('a, 'b) t
end