mirror of
https://github.com/c-cube/ocaml-containers.git
synced 2025-12-06 11:15:31 -05:00
added PersistentHashtbl, adapted from persistent arrays of J-C Filliatre
This commit is contained in:
parent
f992f279bc
commit
a82ebf7d59
5 changed files with 399 additions and 0 deletions
|
|
@ -8,6 +8,7 @@ Graph
|
|||
Hashset
|
||||
Heap
|
||||
LazyGraph
|
||||
PersistentHashtbl
|
||||
PHashtbl
|
||||
Sequence
|
||||
SkipList
|
||||
|
|
|
|||
212
persistentHashtbl.ml
Normal file
212
persistentHashtbl.ml
Normal file
|
|
@ -0,0 +1,212 @@
|
|||
(*
|
||||
Copyright (c) 2013, Simon Cruanes
|
||||
All rights reserved.
|
||||
|
||||
Redistribution and use in source and binary forms, with or without
|
||||
modification, are permitted provided that the following conditions are met:
|
||||
|
||||
Redistributions of source code must retain the above copyright notice, this
|
||||
list of conditions and the following disclaimer. Redistributions in binary
|
||||
form must reproduce the above copyright notice, this list of conditions and the
|
||||
following disclaimer in the documentation and/or other materials provided with
|
||||
the distribution.
|
||||
|
||||
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
|
||||
ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
|
||||
WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
||||
DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
|
||||
FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
||||
DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
|
||||
SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
|
||||
CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
|
||||
OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
||||
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||
*)
|
||||
|
||||
(** {1 Persistent hash-table on top of OCaml's hashtables} *)
|
||||
|
||||
module type HashedType = sig
  type t
  (** Type of the keys *)

  val equal : t -> t -> bool
  (** Equality on keys *)

  val hash : t -> int
  (** Hash function on keys. The functor below hands it, together with
      [equal], to [Hashtbl.Make], so the two must agree the way
      [Hashtbl.Make] requires. *)
end
|
||||
|
||||
(** {2 Signature of such a hashtable} *)
|
||||
|
||||
module type S = sig
  type key
  type 'a t

  val create : int -> 'a t
  (** [create n] is a fresh, empty table; [n] is the initial size given to
      the underlying imperative hashtable *)

  val is_empty : 'a t -> bool
  (** [is_empty t] is [true] iff [t] holds no binding *)

  val find : 'a t -> key -> 'a
  (** [find t k] is the value bound to [k] in [t].
      @raise Not_found if [k] is not bound in [t] *)

  val mem : 'a t -> key -> bool
  (** [mem t k] tells whether [k] is bound in [t] *)

  val length : 'a t -> int
  (** Number of bindings in the table *)

  val replace : 'a t -> key -> 'a -> 'a t
  (** [replace t k v] is a new table in which [k] is bound to [v]; the
      binding [k] had in [t], if any, is erased in the result. [t] itself
      keeps denoting the table as it was before the call. *)

  val remove : 'a t -> key -> 'a t
  (** [remove t k] is a table with no binding for [k]. When [k] is not
      bound in [t], [t] itself is returned. *)

  val copy : 'a t -> 'a t
  (** Fresh copy of the table. The copy shares no underlying structure with
      the original, so using the two tables alternately is efficient. *)

  val iter : 'a t -> (key -> 'a -> unit) -> unit
  (** [iter t f] calls [f k v] on every binding [(k, v)] of [t] *)

  val fold : ('b -> key -> 'a -> 'b) -> 'b -> 'a t -> 'b
  (** [fold f acc t] folds [f] over the bindings of [t], starting from
      [acc] *)

  val of_gen : ?init:'a t -> (key * 'a) Gen.t -> 'a t
  (** [of_gen ?init g] is a table made of the bindings of [init] (no
      binding when [init] is omitted) to which every binding produced by
      [g] is added, replacing any binding already present for the same
      key. The result is built on a copy, so it shares nothing with
      [init]. *)

  val to_gen : 'a t -> (key * 'a) Gen.t
  (** Generator over the bindings of the table *)
end
|
||||
|
||||
(** {2 Implementation} *)
|
||||
|
||||
module Make(H : HashedType) : S with type key = H.t = struct
  module Table = Hashtbl.Make(H)
  (** Imperative hashtable that actually stores the bindings *)

  type key = H.t

  (* A persistent table is a mutable cell: either it owns the concrete
     hashtable, or it describes itself as a one-binding difference from
     another persistent table. *)
  type 'a t = 'a zipper ref
  and 'a zipper =
    | Table of 'a Table.t         (** Concrete table *)
    | Add of key * 'a * 'a t      (** The given table, plus a binding for key *)
    | Replace of key * 'a * 'a t  (** The given table, with key rebound to value *)
    | Remove of key * 'a t        (** The given table, without key *)

  let create size = ref (Table (Table.create size))

  (** [reroot t] makes [t] the owner of the concrete hashtable, inverting
      every difference node met on the way, and returns that hashtable *)
  let reroot t =
    (* [walk node k] goes down to the cell owning the hashtable, then runs
       the pending updates, the one closest to the owner first. Stacking
       the pending work in the continuation [k] keeps [walk] tail-recursive. *)
    let rec walk node k =
      match !node with
      | Table tbl -> k tbl
      | Add (key, v, next) ->
        walk next (fun tbl ->
          (* [next] becomes "[node] without [key]" *)
          next := Remove (key, node);
          Table.add tbl key v;
          node := Table tbl;
          k tbl)
      | Replace (key, v, next) ->
        walk next (fun tbl ->
          (* remember the value [next] had, so the change can be undone *)
          let old = Table.find tbl key in
          next := Replace (key, old, node);
          node := Table tbl;
          Table.replace tbl key v;
          k tbl)
      | Remove (key, next) ->
        walk next (fun tbl ->
          (* [next] becomes "[node] plus the binding being removed" *)
          let old = Table.find tbl key in
          next := Add (key, old, node);
          node := Table tbl;
          Table.remove tbl key;
          k tbl)
    in
    walk t (fun tbl -> tbl)

  (** Concrete hashtable of [t]; reroots only when [t] does not already
      own it *)
  let table_of t =
    match !t with
    | Table tbl -> tbl
    | Add _ | Replace _ | Remove _ -> reroot t

  let is_empty t = Table.length (table_of t) = 0

  let find t k = Table.find (table_of t) k

  let mem t k = Table.mem (table_of t) k

  let length t = Table.length (table_of t)

  let replace t k v =
    let tbl = table_of t in
    (* the result takes over the hashtable... *)
    let t' = ref (Table tbl) in
    (* ...and [t] turns into a difference pointing to the result *)
    let previous = try Some (Table.find tbl k) with Not_found -> None in
    (match previous with
     | Some v' -> t := Replace (k, v', t')
     | None -> t := Remove (k, t'));
    (* only now is the shared hashtable modified *)
    Table.replace tbl k v;
    t'

  let remove t k =
    let tbl = table_of t in
    match (try Some (Table.find tbl k) with Not_found -> None) with
    | None ->
      (* [k] is not bound: nothing to do *)
      t
    | Some v' ->
      (* [k] is bound: the result owns the hashtable, minus [k] *)
      let t' = ref (Table tbl) in
      t := Add (k, v', t');
      Table.remove tbl k;
      t'

  let copy t =
    (* nothing points to the new cell, and its hashtable is private *)
    ref (Table (Table.copy (table_of t)))

  let iter t f = Table.iter f (table_of t)

  let fold f acc t =
    Table.fold (fun k v acc -> f acc k v) (table_of t) acc

  let of_gen ?init gen =
    let tbl =
      match init with
      | Some t -> Table.copy (reroot t)
      | None -> Table.create 5
    in
    Gen.iter (fun (k,v) -> Table.replace tbl k v) gen;
    ref (Table tbl)

  let to_gen t =
    (* not efficient at the moment: goes through an intermediate list *)
    let bindings = Table.fold (fun k v acc -> (k,v)::acc) (reroot t) [] in
    Gen.of_list bindings
end
|
||||
|
||||
82
persistentHashtbl.mli
Normal file
82
persistentHashtbl.mli
Normal file
|
|
@ -0,0 +1,82 @@
|
|||
(*
|
||||
Copyright (c) 2013, Simon Cruanes
|
||||
All rights reserved.
|
||||
|
||||
Redistribution and use in source and binary forms, with or without
|
||||
modification, are permitted provided that the following conditions are met:
|
||||
|
||||
Redistributions of source code must retain the above copyright notice, this
|
||||
list of conditions and the following disclaimer. Redistributions in binary
|
||||
form must reproduce the above copyright notice, this list of conditions and the
|
||||
following disclaimer in the documentation and/or other materials provided with
|
||||
the distribution.
|
||||
|
||||
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
|
||||
ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
|
||||
WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
||||
DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
|
||||
FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
||||
DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
|
||||
SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
|
||||
CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
|
||||
OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
||||
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||
*)
|
||||
|
||||
(** {1 Persistent hash-table on top of OCaml's hashtables} *)
|
||||
|
||||
module type HashedType = sig
  type t
  (** Type of the keys *)

  val equal : t -> t -> bool
  (** Equality on keys *)

  val hash : t -> int
  (** Hash function on keys *)
end
|
||||
|
||||
(** {2 Signature of such a hashtable} *)
|
||||
|
||||
module type S = sig
  type key
  type 'a t

  val create : int -> 'a t
  (** [create n] is a fresh, empty table; [n] is the initial size given to
      the underlying imperative hashtable *)

  val is_empty : 'a t -> bool
  (** [is_empty t] is [true] iff [t] holds no binding *)

  val find : 'a t -> key -> 'a
  (** [find t k] is the value bound to [k] in [t].
      @raise Not_found if [k] is not bound in [t] *)

  val mem : 'a t -> key -> bool
  (** [mem t k] tells whether [k] is bound in [t] *)

  val length : 'a t -> int
  (** Number of bindings in the table *)

  val replace : 'a t -> key -> 'a -> 'a t
  (** [replace t k v] is a new table in which [k] is bound to [v]; the
      binding [k] had in [t], if any, is erased in the result. [t] itself
      keeps denoting the table as it was before the call. *)

  val remove : 'a t -> key -> 'a t
  (** [remove t k] is a table with no binding for [k]. When [k] is not
      bound in [t], [t] itself is returned. *)

  val copy : 'a t -> 'a t
  (** Fresh copy of the table. The copy shares no underlying structure with
      the original, so using the two tables alternately is efficient. *)

  val iter : 'a t -> (key -> 'a -> unit) -> unit
  (** [iter t f] calls [f k v] on every binding [(k, v)] of [t] *)

  val fold : ('b -> key -> 'a -> 'b) -> 'b -> 'a t -> 'b
  (** [fold f acc t] folds [f] over the bindings of [t], starting from
      [acc] *)

  val of_gen : ?init:'a t -> (key * 'a) Gen.t -> 'a t
  (** [of_gen ?init g] is a table made of the bindings of [init] (no
      binding when [init] is omitted) to which every binding produced by
      [g] is added, replacing any binding already present for the same
      key. The result is built on a copy, so it shares nothing with
      [init]. *)

  val to_gen : 'a t -> (key * 'a) Gen.t
  (** Generator over the bindings of the table *)
end
|
||||
|
||||
(** {2 Implementation} *)
|
||||
|
||||
module Make : functor (H : HashedType) -> S with type key = H.t
(** [Make(H)] is an implementation of {!S} whose keys have type [H.t] *)
|
||||
|
||||
|
|
@ -5,6 +5,7 @@ open OUnit
|
|||
let suite =
|
||||
"all_tests" >:::
|
||||
[ Test_pHashtbl.suite;
|
||||
Test_PersistentHashtbl.suite;
|
||||
Test_vector.suite;
|
||||
Test_gen.suite;
|
||||
Test_deque.suite;
|
||||
|
|
|
|||
103
tests/test_PersistentHashtbl.ml
Normal file
103
tests/test_PersistentHashtbl.ml
Normal file
|
|
@ -0,0 +1,103 @@
|
|||
|
||||
open OUnit
|
||||
|
||||
(* Persistent table with integer keys, used by every test below *)
module H = PersistentHashtbl.Make(struct
  type t = int
  let equal (i : int) (j : int) = i = j
  let hash i = i
end)
|
||||
open Gen.Infix
|
||||
|
||||
(* A binding added with [H.replace] can be read back with [H.find]. *)
let test_add () =
  let h = H.create 32 in
  let h = H.replace h 42 "foo" in
  (* [assert_equal] takes the expected value first, then the actual one,
     as the other tests of this file already do *)
  OUnit.assert_equal "foo" (H.find h 42)
|
||||
|
||||
(* Reference bindings shared by the tests, sorted by increasing key *)
let my_list =
  [ (1, "a"); (2, "b"); (3, "c"); (4, "d") ]
|
||||
|
||||
(* Generator over [my_list].
   NOTE(review): several tests consume this same value, which presumably
   relies on [Gen.t] being restartable -- confirm against the Gen module. *)
let my_gen : (int * string) Gen.t = Gen.of_list my_list
|
||||
|
||||
(* A table built with [H.of_gen] holds the generated bindings and nothing
   else. *)
let test_of_gen () =
  let h = H.of_gen my_gen in
  List.iter
    (fun (key, expected) -> OUnit.assert_equal expected (H.find h key))
    [ (2, "b"); (1, "a") ];
  OUnit.assert_raises Not_found (fun () -> H.find h 42)
|
||||
|
||||
(* [H.to_gen] gives back exactly the bindings fed to [H.of_gen]; they are
   sorted before the comparison because the test does not rely on the
   enumeration order. *)
let test_to_gen () =
  let bindings = Gen.to_list (H.to_gen (H.of_gen my_gen)) in
  OUnit.assert_equal my_list (List.sort compare bindings)
|
||||
|
||||
(* All 201 bindings for the keys 0..200 are kept, although [H.of_gen]
   starts from a much smaller table. *)
let test_resize () =
  let bindings =
    Gen.map (fun i -> (i, string_of_int i)) (Gen.int_range 0 200) in
  let h = H.of_gen bindings in
  OUnit.assert_equal 201 (H.length h)
|
||||
|
||||
(* [H.replace] returns a new table and leaves the old one observably
   unchanged. *)
let test_persistent () =
  let h = H.of_gen my_gen in
  (* what [h] must look like, both before and after deriving [h'] *)
  let check_old_table () =
    OUnit.assert_equal "a" (H.find h 1);
    OUnit.assert_raises Not_found (fun () -> H.find h 5)
  in
  check_old_table ();
  let h' = H.replace h 5 "e" in
  OUnit.assert_equal "a" (H.find h' 1);
  OUnit.assert_equal "e" (H.find h' 5);
  check_old_table ()
|
||||
|
||||
(* Every binding of a table with 10001 entries can be found again, and the
   first key past the range is not bound. *)
let test_big () =
  let n = 10000 in
  let gen = Gen.map (fun i -> i, string_of_int i) (0--n) in
  let h = H.of_gen gen in
  (*
  Format.printf "@[<v2>table:%a@]@." (Gen.pp_gen
    (fun formatter (k,v) -> Format.fprintf formatter "%d -> \"%s\"" k v))
    (H.to_gen h);
  *)
  let show s = s in
  let check_binding (k, v) =
    (*
    Format.printf "lookup %d@." k;
    *)
    OUnit.assert_equal ~printer:show v (H.find h k)
  in
  Gen.iter check_binding gen;
  OUnit.assert_raises Not_found (fun () -> H.find h (n+1))
|
||||
|
||||
(* Removing a key drops exactly that binding: in the returned table the
   other bindings are still there and the length decreases by one. *)
let test_remove () =
  let h = H.of_gen my_gen in
  (* [assert_equal] takes the expected value first, then the actual one,
     as the other tests of this file already do *)
  OUnit.assert_equal "b" (H.find h 2);
  OUnit.assert_equal "c" (H.find h 3);
  OUnit.assert_equal "d" (H.find h 4);
  OUnit.assert_equal 4 (H.length h);
  let h = H.remove h 2 in
  OUnit.assert_equal "c" (H.find h 3);
  OUnit.assert_equal 3 (H.length h);
  (* test that 2 has been removed *)
  OUnit.assert_raises Not_found (fun () -> H.find h 2)
|
||||
|
||||
(* [H.length] follows insertions and removals, and a freshly created table
   is empty. *)
let test_size () =
  let open Gen.Infix in
  let n = 10000 in
  let bindings = Gen.map (fun i -> (i, string_of_int i)) (0 -- n) in
  let full = H.of_gen bindings in
  OUnit.assert_equal (n+1) (H.length full);
  (* drop the 501 keys 0..500 *)
  let trimmed = Gen.fold (fun tbl i -> H.remove tbl i) full (0 -- 500) in
  OUnit.assert_equal (n-500) (H.length trimmed);
  OUnit.assert_bool "is_empty" (H.is_empty (H.create 16))
|
||||
|
||||
(* Test suite of this file, one labelled case per test function *)
let suite =
  let cases =
    [ ("test_add", test_add);
      ("test_of_gen", test_of_gen);
      ("test_to_gen", test_to_gen);
      ("test_resize", test_resize);
      ("test_persistent", test_persistent);
      ("test_big", test_big);
      ("test_remove", test_remove);
      ("test_size", test_size);
    ]
  in
  "test_H" >::: List.map (fun (label, run) -> label >:: run) cases
|
||||
Loading…
Add table
Reference in a new issue