forked from ocaml/ocaml
-
Notifications
You must be signed in to change notification settings - Fork 0
/
ephemeron.mli
300 lines (234 loc) · 10.8 KB
/
ephemeron.mli
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
(**************************************************************************)
(* *)
(* OCaml *)
(* *)
(* Damien Doligez, projet Para, INRIA Rocquencourt *)
(* *)
(* Copyright 1997 Institut National de Recherche en Informatique et *)
(* en Automatique. *)
(* *)
(* All rights reserved. This file is distributed under the terms of *)
(* the GNU Lesser General Public License version 2.1, with the *)
(* special exception on linking described in the file LICENSE. *)
(* *)
(**************************************************************************)
(** Ephemerons and weak hash tables.
Ephemerons and weak hash tables are useful when one wants to cache
or memoize the results of a function for as long as its arguments
and the function itself are in use, without creating memory leaks
by indefinitely keeping old results that are no longer useful
because one of the arguments or the function has been freed. An
implementation using {!Hashtbl.t} is not suitable because all
associations would keep the arguments and the result in memory.
Ephemerons can also be used for "adding" a field to an arbitrary
boxed OCaml value: you can attach some information to a value
created by an external library without memory leaks.
Ephemerons hold some keys and one or no data. They are all boxed
OCaml values. The keys of an ephemeron have the same behavior
as weak pointers according to the garbage collector. In fact
OCaml weak pointers are implemented as ephemerons without data.
The keys and data of an ephemeron are said to be full if they
point to a value, or empty if the value has never been set, has
been unset, or was erased by the GC. In the functions that access
the keys or data, these two states are represented by the [option]
type.
The data is considered alive by the garbage collector if all the
full keys are alive and the ephemeron itself is alive. When one of
the keys is no longer considered alive by the GC, the data is
emptied from the ephemeron. The data could be alive for another
reason, and in that case the GC will not free it, but the ephemeron
will not hold the data anymore.
Ephemerons complicate the notion of liveness of values, because
liveness is no longer equivalent to reachability from the root
values through usual pointers (neither weak pointers nor
ephemerons). With ephemerons, liveness is defined as the least
fixpoint of the following rules. A value is alive if:
- it is a root value,
- it is reachable from an alive value through usual pointers, or
- it is the data of an alive ephemeron all of whose full keys are alive.
Notes:
- None of the types defined in this module can be marshaled
using {!Stdlib.output_value} or the functions of the
{!Marshal} module.
Ephemerons are defined in a language-agnostic way in the following paper:
B. Hayes, Ephemerons: A New Finalization Mechanism, OOPSLA'97
@since 4.03
*)
(** {b Unsynchronized accesses} *)
(* Floating [alert] attribute: it declares the [unsynchronized_access]
alert, with the message below, for this interface. *)
[@@@alert unsynchronized_access
"Unsynchronized accesses to weak hash tables are a programming error."
]
(**
Unsynchronized accesses to a weak hash table may lead to an invalid
weak hash table state. Thus, concurrent accesses to a weak hash table
must be synchronized (for instance with a {!Mutex.t}).
*)
module type S = sig
(** Propose the same interface as a usual hash table. However, since
the bindings are weak, even if [mem h k] is true, a subsequent
[find h k] may raise [Not_found] because the garbage collector
can run between the two.
*)
type key
type !'a t
(* The operations below carry the names and types of their
{!Hashtbl.S} counterparts. NOTE(review): their behaviour is presumably
the same as in {!Hashtbl.S}, up to the weakness of the bindings
described above -- confirm against the implementation. No iteration
function ([iter], [fold], [to_seq], ...) is part of this signature. *)
val create : int -> 'a t
val clear : 'a t -> unit
val reset : 'a t -> unit
val copy : 'a t -> 'a t
val add : 'a t -> key -> 'a -> unit
val remove : 'a t -> key -> unit
val find : 'a t -> key -> 'a
val find_opt : 'a t -> key -> 'a option
val find_all : 'a t -> key -> 'a list
val replace : 'a t -> key -> 'a -> unit
val mem : 'a t -> key -> bool
val length : 'a t -> int
val stats : 'a t -> Hashtbl.statistics
val add_seq : 'a t -> (key * 'a) Seq.t -> unit
val replace_seq : 'a t -> (key * 'a) Seq.t -> unit
val of_seq : (key * 'a) Seq.t -> 'a t
val clean: 'a t -> unit
(** Remove all dead bindings. This is also done automatically when the
table is automatically resized. *)
val stats_alive: 'a t -> Hashtbl.statistics
(** Same as {!Hashtbl.SeededS.stats}, but only counts the alive bindings. *)
end
(** The output signature of the functors {!K1.Make}, {!K2.Make} and
{!Kn.Make}.
These hash tables are weak in the keys. If all the keys of a binding are
alive, the binding is kept, but if one of the keys of the binding
is dead, then the binding is removed.
*)
module type SeededS = sig
(* Seeded counterpart of {!S}: the items below are the same as in {!S},
except that [create] takes an additional optional [?random] argument.
NOTE(review): [?random] presumably has the same meaning as in
{!Hashtbl.create} -- confirm against the implementation. *)
type key
type !'a t
val create : ?random (*thwart tools/sync_stdlib_docs*) : bool -> int -> 'a t
val clear : 'a t -> unit
val reset : 'a t -> unit
val copy : 'a t -> 'a t
val add : 'a t -> key -> 'a -> unit
val remove : 'a t -> key -> unit
val find : 'a t -> key -> 'a
val find_opt : 'a t -> key -> 'a option
val find_all : 'a t -> key -> 'a list
val replace : 'a t -> key -> 'a -> unit
val mem : 'a t -> key -> bool
val length : 'a t -> int
val stats : 'a t -> Hashtbl.statistics
val add_seq : 'a t -> (key * 'a) Seq.t -> unit
val replace_seq : 'a t -> (key * 'a) Seq.t -> unit
val of_seq : (key * 'a) Seq.t -> 'a t
val clean: 'a t -> unit
(** Remove all dead bindings. This is also done automatically when the
table is automatically resized. *)
val stats_alive: 'a t -> Hashtbl.statistics
(** Same as {!Hashtbl.SeededS.stats}, but only counts the alive bindings. *)
end
(** The output signature of the functors {!K1.MakeSeeded},
{!K2.MakeSeeded} and {!Kn.MakeSeeded}.
*)
module K1 : sig
type ('k,'d) t (** an ephemeron with one key *)
val make : 'k -> 'd -> ('k,'d) t
(** [Ephemeron.K1.make k d] creates an ephemeron with key [k] and data [d]. *)
val query : ('k,'d) t -> 'k -> 'd option
(** [Ephemeron.K1.query eph key] returns [Some x] (where [x] is the
ephemeron's data) if [key] is physically equal to [eph]'s key, and
[None] if [eph] is empty or [key] is not physically equal to [eph]'s
key. *)
module Make (H:Hashtbl.HashedType) : S with type key = H.t
(** Functor building an implementation of a weak hash table whose keys
have type [H.t]. *)
module MakeSeeded (H:Hashtbl.SeededHashedType) : SeededS with type key = H.t
(** Functor building an implementation of a weak hash table whose keys
have type [H.t].
The seed is similar to the one of {!Hashtbl.MakeSeeded}. *)
module Bucket : sig
type ('k, 'd) t
(** A bucket is a mutable "list" of ephemerons. *)
val make : unit -> ('k, 'd) t
(** Create a new bucket. *)
val add : ('k, 'd) t -> 'k -> 'd -> unit
(** [add b k d] adds an ephemeron with key [k] and data [d] to the
bucket [b]. *)
val remove : ('k, 'd) t -> 'k -> unit
(** [remove b k] removes from [b] the most-recently added
ephemeron with key [k], or does nothing if there is no such
ephemeron. *)
val find : ('k, 'd) t -> 'k -> 'd option
(** [find b k] returns the data of the most-recently added ephemeron
with key [k] in [b], or [None] if there is no such ephemeron. *)
val length : ('k, 'd) t -> int
(** Returns an upper bound on the length of the bucket. *)
val clear : ('k, 'd) t -> unit
(** Remove all ephemerons from the bucket. *)
end
(** Buckets of ephemerons with one key. *)
end
(** Ephemerons with one key. *)
module K2 : sig
type ('k1,'k2,'d) t (** an ephemeron with two keys *)
val make : 'k1 -> 'k2 -> 'd -> ('k1,'k2,'d) t
(** Same as {!Ephemeron.K1.make}, but the ephemeron is created with
two keys. *)
val query : ('k1,'k2,'d) t -> 'k1 -> 'k2 -> 'd option
(** Same as {!Ephemeron.K1.query}, but the ephemeron is queried with
two keys. *)
module Make
(H1:Hashtbl.HashedType)
(H2:Hashtbl.HashedType) :
S with type key = H1.t * H2.t
(** Functor building an implementation of a weak hash table whose keys
are pairs of type [H1.t * H2.t]. *)
module MakeSeeded
(H1:Hashtbl.SeededHashedType)
(H2:Hashtbl.SeededHashedType) :
SeededS with type key = H1.t * H2.t
(** Functor building an implementation of a weak hash table whose keys
are pairs of type [H1.t * H2.t].
The seed is similar to the one of {!Hashtbl.MakeSeeded}. *)
module Bucket : sig
type ('k1, 'k2, 'd) t
(** A bucket is a mutable "list" of ephemerons. *)
val make : unit -> ('k1, 'k2, 'd) t
(** Create a new bucket. *)
val add : ('k1, 'k2, 'd) t -> 'k1 -> 'k2 -> 'd -> unit
(** [add b k1 k2 d] adds an ephemeron with keys [k1] and [k2] and
data [d] to the bucket [b]. *)
val remove : ('k1, 'k2, 'd) t -> 'k1 -> 'k2 -> unit
(** [remove b k1 k2] removes from [b] the most-recently added
ephemeron with keys [k1] and [k2], or does nothing if there
is no such ephemeron. *)
val find : ('k1, 'k2, 'd) t -> 'k1 -> 'k2 -> 'd option
(** [find b k1 k2] returns the data of the most-recently added
ephemeron with keys [k1] and [k2] in [b], or [None] if there is no
such ephemeron. *)
val length : ('k1, 'k2, 'd) t -> int
(** Returns an upper bound on the length of the bucket. *)
val clear : ('k1, 'k2, 'd) t -> unit
(** Remove all ephemerons from the bucket. *)
end
(** Buckets of ephemerons with two keys. *)
end
(** Ephemerons with two keys. *)
module Kn : sig
type ('k,'d) t (** an ephemeron with an arbitrary number of keys
of the same type *)
val make : 'k array -> 'd -> ('k,'d) t
(** Same as {!Ephemeron.K1.make}, but the keys are given as an array. *)
val query : ('k,'d) t -> 'k array -> 'd option
(** Same as {!Ephemeron.K1.query}, but the keys are given as an array. *)
module Make
(H:Hashtbl.HashedType) :
S with type key = H.t array
(** Functor building an implementation of a weak hash table whose keys
are arrays of type [H.t array]. *)
module MakeSeeded
(H:Hashtbl.SeededHashedType) :
SeededS with type key = H.t array
(** Functor building an implementation of a weak hash table whose keys
are arrays of type [H.t array].
The seed is similar to the one of {!Hashtbl.MakeSeeded}. *)
module Bucket : sig
type ('k, 'd) t
(** A bucket is a mutable "list" of ephemerons. *)
val make : unit -> ('k, 'd) t
(** Create a new bucket. *)
val add : ('k, 'd) t -> 'k array -> 'd -> unit
(** [add b k d] adds an ephemeron with keys [k] and data [d] to the
bucket [b]. *)
val remove : ('k, 'd) t -> 'k array -> unit
(** [remove b k] removes from [b] the most-recently added
ephemeron with keys [k], or does nothing if there is no such
ephemeron. *)
val find : ('k, 'd) t -> 'k array -> 'd option
(** [find b k] returns the data of the most-recently added ephemeron
with keys [k] in [b], or [None] if there is no such ephemeron. *)
val length : ('k, 'd) t -> int
(** Returns an upper bound on the length of the bucket. *)
val clear : ('k, 'd) t -> unit
(** Remove all ephemerons from the bucket. *)
end
(** Buckets of ephemerons with an arbitrary number of keys of the same
type. *)
end
(** Ephemerons with an arbitrary number of keys of the same type. *)