Source file helper.ml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
open Plebeia
open Lwt.Syntax
include Debug
include Utils
module RS = Random.State
let temp_file body ext =
let fn = Filename.temp_file body ext in
Unix.unlink fn;
fn
let with_tempdir f =
let d = temp_file "plebeia_test" ".dir" in
Format.eprintf "Using tempdir %s@." d;
Unix.mkdir d 0o700;
f d
let context_confs =
let open Context in
[ { hash_func= `Blake2B; bytes_per_hash= 28; bytes_per_cell= 32 }
; { hash_func= `Blake2B; bytes_per_hash= 28; bytes_per_cell= 36 }
; { hash_func= `Blake2B; bytes_per_hash= 32; bytes_per_cell= 36 }
; { hash_func= `Blake2B; bytes_per_hash= 32; bytes_per_cell= 40 }
; { hash_func= `Blake3; bytes_per_hash= 28; bytes_per_cell= 32 }
]
let with_context_conf f =
List.map (fun conf -> conf, f conf) context_confs
let with_context_conf_lwt f =
Lwt_list.map_s (fun conf -> let* r = f conf in Lwt.return (conf, r)) context_confs
let resize_step_bytes = 100_000
let with_context f =
Lwt_list.map_s (fun ({Context.hash_func; bytes_per_hash; bytes_per_cell} as conf) ->
let* () = Lwt_fmt.eprintf "Testing with %a@." Context.pp_config conf in
let tempfile = temp_file "plebeia" ".context" in
let* context = Context.create ~hash_func ~bytes_per_hash ~bytes_per_cell tempfile ~resize_step_bytes in
let res = f context in
let+ () = Context.close context in
(conf, res)) context_confs
let with_context_lwt f =
Lwt_list.map_s (fun ({Context.hash_func; bytes_per_hash; bytes_per_cell} as conf) ->
let* () = Lwt_fmt.eprintf "Testing with %a@." Context.pp_config conf in
let tempfile = temp_file "plebeia" ".context" in
let* context = Context.create ~hash_func ~bytes_per_hash ~bytes_per_cell tempfile ~resize_step_bytes in
let* res = f context in
let+ () = Context.close context in
(conf, res)) context_confs
let with_memory_only_context f =
Lwt_list.map_s (fun ({Context.hash_func; bytes_per_hash; bytes_per_cell} as conf) ->
let* () = Lwt_fmt.eprintf "Testing with %a@." Context.pp_config conf in
let context = Context.memory_only ~hash_func ~bytes_per_hash ~bytes_per_cell () in
let res = f context in
let+ () = Context.close context in
(conf, res)) context_confs
let with_vc ?prefix f =
Lwt_list.map_s (fun ({Context.hash_func; bytes_per_hash; bytes_per_cell} as conf) ->
let* () = Lwt_fmt.eprintf "Testing with %a@." Context.pp_config conf in
let prefix =
match prefix with
| None -> Filename.temp_file "plebeia" "vc"
| Some p -> Printf.sprintf "%s-%s" p (Context.config_name conf)
in
let* () = Lwt_fmt.eprintf "Using VC %s@." prefix in
let* vc = from_Ok_lwt @@ Vc.create ~bytes_per_cell ~hash_func ~bytes_per_hash ~resize_step_bytes prefix in
let* res = f vc in
let+ () = from_Ok_lwt @@ Vc.close vc in
(conf, res)) context_confs
let with_cursor f =
with_context (fun context ->
let cursor = Cursor.empty context in
f cursor)
let with_memory_only_cursor f =
with_memory_only_context (fun context ->
let cursor = Cursor.empty context in
f cursor)
let regression_by_hash name expected actual =
let h = Hashtbl.hash actual in
match h with
| 129913994 ->
failwithf "%s: Regression error: returning ()?" name;
| 609990030 ->
failwithf "%s: Regression error: returning () with [with_context]?" name;
| _ ->
if expected <> h then
failwithf "%s: Regression error: obtained %d" name h
let path_of_string s = from_Some @@ Segment.of_string s
let ok_or_fail = function
| Ok x -> x
| Error s -> Error.raise s
let must_fail = function
| Ok _ -> failwith "must fail"
| Error _ -> ()
let path = path_of_string
let value = Value.of_string
open Node
let rec normalize ~clear_hash n = match n with
| Hash _ -> n
| Disk _ -> n
| View v -> View (normalize_view ~clear_hash v)
and normalize_view ~clear_hash v = match v with
| Internal (n1, n2, i, h) ->
let h = if clear_hash then Not_Hashed else h in
_Internal (normalize ~clear_hash n1, normalize ~clear_hash n2, i, h)
| Bud (None, i, h) ->
let h = if clear_hash then Not_Hashed else h in
_Bud (None, i, h)
| Bud (Some n, i, h) ->
let h = if clear_hash then Not_Hashed else h in
_Bud (Some (normalize ~clear_hash n), i, h)
| Leaf (a, b, h) ->
let h = if clear_hash then Not_Hashed else h in
_Leaf (a, b, h)
| Extender (seg, n, i, h) ->
let h = if clear_hash then Not_Hashed else h in
_Extender (Segment.normalize seg, normalize ~clear_hash n, i, h)
let equal_nodes ~ignore_hash n1 n2 =
let clear_hash = ignore_hash in
normalize ~clear_hash n1 = normalize ~clear_hash n2
let all_children context node =
let rec aux store = function
| [] -> store
| (segs_rev, node) :: tail ->
match Node_storage.view context node with
| Leaf _ ->
let segment = List.rev segs_rev |> Segment.concat in
aux ((segment, `File) :: store) tail
| Bud (Some child, _, _) ->
let segment = List.rev segs_rev |> Segment.concat in
aux ((segment, `Directory child) :: store) tail
| Bud (None, _, _) -> aux store tail
| Extender (seg, node', _, _) ->
aux store ((seg::segs_rev, node') :: tail)
| Internal (l, r, _, _) ->
aux store (
(Segment.of_sides [Segment.Left] :: segs_rev, l)
:: (Segment.of_sides [Segment.Right] :: segs_rev, r)
:: tail)
in
aux [] [([], node)]
let xassert b =
let open Printexc in
if not b then begin
prerr_endline ("*****************************************************\n" ^ raw_backtrace_to_string (get_callstack 10));
assert false
end
let reraise_after f x e =
try
f x
with
exn -> e exn; raise exn
let reraise_after_lwt (f : 'a -> 'b Lwt.t) (x : 'a) e =
Lwt.catch (fun () -> f x) (fun exn -> e exn; Lwt.fail exn)
let with_random f =
let seed =
let default () =
let st_seed = RS.make_self_init() in
RS.int st_seed @@ (1 lsl 30) - 1
in
match Sys.getenv "PLEBEIA_TEST_SEED" with
| exception Not_found -> default ()
| s ->
try
let i = int_of_string s in
Format.eprintf "PLEBEIA_TEST_SEED=%d@." i;
i
with _ -> default ()
in
let st = RS.make [| seed |] in
reraise_after f st @@ fun _exn ->
Format.eprintf "Failed with seed: PLEBEIA_TEST_SEED=%d@." seed
let with_random_lwt f =
let seed =
let default () =
let st_seed = RS.make_self_init() in
RS.int st_seed @@ (1 lsl 30) - 1
in
match Sys.getenv "PLEBEIA_TEST_SEED" with
| exception Not_found -> default ()
| s ->
try
let i = int_of_string s in
Format.eprintf "PLEBEIA_TEST_SEED=%d@." i;
i
with _ -> default ()
in
let st = RS.make [| seed |] in
reraise_after_lwt f st @@ fun _exn ->
Format.eprintf "Failed with seed: Random.State.make [| %d |]@." seed
let forget_random_nodes rs prob n =
let rec f n = match n with
| Hash _ -> n
| Disk _ -> n
| View v ->
if RS.float rs 1.0 < prob then
match Node.may_forget n with
| None -> n
| Some n -> n
else
match v with
| Leaf _ -> n
| Bud (None, _, _) -> n
| Bud (Some n', i, h) ->
let n' = f n' in
begin match _Bud (Some n', i, h) with
| exception _ -> n
| v -> View v
end
| Extender (seg, n', i, h) ->
let n' = f n' in
begin match _Extender (seg, n', i, h) with
| exception _ -> n
| v -> View v
end
| Internal (nl, nr, i, h) ->
let nl' = f nl in
let nr' = f nr in
begin match _Internal (nl', nr', i, h) with
| exception _ -> n
| v -> View v
end
in
f n
let leaves context node : Segment.t list list =
let rec aux store = function
| [] -> store
| (pathes_rev, node) :: tail ->
all_children context node
|> List.map (function
| (seg, `File) -> List.rev (seg :: pathes_rev) :: store
| (seg, `Directory child) when Segment.is_empty seg ->
aux store ((pathes_rev, child) :: tail)
| (seg, `Directory child) ->
aux store ((seg :: pathes_rev, child) :: tail))
|> List.concat
in
aux [] [([], node)]
let choose_random_node stop_prob st ctxt n0 =
let open Segment in
let rec f segs n =
let v = Node_storage.view ctxt n in
if RS.float st 1.0 < stop_prob then segs
else
match v with
| Leaf _ | Bud (None, _, _) -> f Segs.empty' n0
| Bud (Some n, _, _) -> f (Segs.push_bud segs) n
| Internal (n1, n2, _, _) ->
if RS.bool st then f (Segs.add_side segs Left) n1
else f (Segs.add_side segs Right) n2
| Extender (seg, n, _, _) ->
f (Segs.append_seg segs seg) n
in
f Segs.empty' n0
let make_resemble st ctxt n =
let c =
match Node_tools.count_nodes ~upto:1000 n with
| `EQ i | `GE i -> i
in
let open Segment in
let rec rm i n =
if i = 0 then n
else
let (`EQ c | `GE c) = Node_tools.count_nodes ~upto:1000 n in
let segs = choose_random_node 0.05 st ctxt n in
let segs = Segs.to_segments segs in
if segs = [] then rm (i-1) n
else
let cur = Cursor.(_Cursor (_Top, n, ctxt, Info.empty)) in
match Deep.delete' cur segs with
| Ok Cursor (_, n', _, _) ->
let (`EQ c' | `GE c') = Node_tools.count_nodes ~upto:1000 n' in
if c' * 2 < c then rm (i-1) n
else rm (i-1) n'
| Error _ -> rm (i-1) n
in
let n = rm (if c <= 1000 then 2 else 4) n in
let (`EQ c | `GE c) = Node_tools.count_nodes ~upto:1000 n in
let rec add i n =
if i = 0 then n
else
let segs = choose_random_node 0.05 st ctxt n in
let segs = Segs.append_seg segs @@ Gen.(segment (int 5)) st in
let m =
let open Gen in
one_of
[gen_leaf; gen_bud 8; gen_internal 8; gen_extender 8]
st
in
let segs = Segs.to_segments segs in
match
Deep.alter Cursor.(_Cursor (_Top, n, ctxt, Info.empty)) segs @@ function
| Some _ -> Ok m
| None ->
Ok m
with
| exception _ ->
add (i-1) n
| Ok (Cursor (_, n', _, _)) ->
let (`EQ c' | `GE c') = Node_tools.count_nodes ~upto:1000 n' in
if c' < c then add (i-1) n
else add (i-1) n'
| Error _ -> add (i-1) n
in
let n = add 32 n in
n
let copy_file fn fn' =
let* fd = Lwt_unix.openfile fn [O_RDONLY] 0o644 in
let* fd' = Lwt_unix.openfile fn' [O_CREAT; O_TRUNC; O_WRONLY] 0o644 in
let buf = Bytes.create 4096 in
let rec loop () =
let* nreads = Lwt_unix.read fd buf 0 4096 in
if nreads = 0 then Lwt.return_unit
else begin
let* nwrites = Lwt_unix.write fd' buf 0 nreads in
assert (nreads = nwrites);
loop ()
end
in
let* () = loop () in
let* () = Lwt_unix.close fd in
Lwt_unix.close fd'
let count_nodes ctxt n =
let cntr = ref 0 in
Traverse.Iter.iter (fun t ->
incr cntr;
`Continue (Node_storage.view ctxt t)) n;
!cntr
let gen_node ctxt rng ?min_nodes depth =
match min_nodes with
| None ->
Node_type.gen_bud depth rng
| Some min_nodes ->
let rec aux (max_ns, m) = function
| 0 ->
Format.eprintf "Warning: could not build a node with size >= %d@." min_nodes;
m
| i ->
let n = Node_type.gen_bud depth rng in
let ns = count_nodes ctxt n in
if min_nodes <= ns then begin
Format.eprintf "Build a node with size %d@." ns;
n
end else
let max_ns, m =
if max_ns < ns then ns, n
else max_ns, m
in
aux (max_ns, m) (i-1)
in
aux (1, Node_type.gen_leaf rng) 100
let validate_node ctxt n =
Result.default (Debug.validate_node ctxt n) (fun e ->
to_file ~file:"invalid.dot" @@ Debug.dot_of_node n;
prerr_endline "Saved the current node to invalid.dot";
failwith e)
let check_cursor_is_top c =
match c with
| Cursor.Cursor (Top, _, _, _) -> ()
| _ -> xassert false
let random_segs_to_bud_or_leaf rng c =
let open Cursor in
let Cursor (_, n, context, _) = c in
match Node_storage.view context n with
| Internal _ | Extender _ | Leaf _ -> assert false
| Bud (None, _, _) -> None
| Bud (Some n, _, _) ->
let rec choose_random_segs rev_segs rev_seg n =
let v = Node_storage.view context n in
match v with
| Leaf _ -> List.rev (List.rev rev_seg :: rev_segs)
| Bud (None, _, _) -> List.rev (List.rev rev_seg :: rev_segs)
| Bud (Some n, _, _) ->
let rev_segs = List.rev rev_seg :: rev_segs in
if RS.int rng 2 = 0 then List.rev rev_segs
else choose_random_segs rev_segs [] n
| Internal (n1, n2, _, _) ->
if RS.int rng 2 = 0 then
let rev_seg = Segment.Left :: rev_seg in
choose_random_segs rev_segs rev_seg n1
else
let rev_seg = Segment.Right :: rev_seg in
choose_random_segs rev_segs rev_seg n2
| Extender (seg, n, _, _) ->
let rev_seg = List.rev_append (Segment.to_sides seg) rev_seg in
choose_random_segs rev_segs rev_seg n
in
Some (List.map Segment.of_sides @@ choose_random_segs [] [] n)
let dump_cursor c =
let Cursor.Cursor (_, n, context, _) = c in
to_file ~file:"plebeia.dot" @@ Debug.dot_of_cursor c;
to_file ~file:"plebeia_dumb.dot" @@ Dumb.dot_of_node @@ Dumb.of_plebeia_node context n
let compare_trees dumb (Cursor.Cursor (_, n, context, _) as c) =
if Dumb.get_node dumb <> Dumb.of_plebeia_node context n then begin
to_file ~file:"dumb.dot" @@ Dumb.dot_of_cursor dumb;
dump_cursor c;
let (Cursor (_, n, context, _)) = Cursor.go_top c in
to_file ~file:"plebeia_dumb_root.dot" @@ Dumb.dot_of_node @@ Dumb.of_plebeia_node context n;
assert false
end
let gen_segments (a,b) c = Gen.(list (int_range (a,b)) (segment @@ return c))
let prepare_tree rs c ~path_bits ~nfiles ~vbytes =
let rec loop c segs = function
| 0 -> c, segs
| nfiles ->
let seg = Gen.(segment (return path_bits)) rs in
let v = Value.of_string @@ Gen.(string (return vbytes) char) rs in
match Cursor.insert c seg v with
| Error _ -> loop c segs nfiles
| Ok c -> loop c (seg::segs) (nfiles - 1)
in
loop c [] nfiles
let random_terminal ctxt n rng =
begin match Node_storage.view ctxt n with
| Bud _ -> ()
| _ -> invalid_arg "node must be a Bud"
end;
let rec f segs n =
match Node_storage.view ctxt n with
| Leaf _ | Bud (None, _, _) ->
Segment.Segs.to_segments segs, n
| Bud (Some n, _, _) ->
f (Segment.Segs.push_bud segs) n
| Internal (l, r, _, _) ->
begin match Gen.bool rng with
| true -> f (Segment.Segs.add_side segs Left) l
| false -> f (Segment.Segs.add_side segs Right) r
end
| Extender (seg, n, _, _) ->
f (Segment.Segs.append_seg segs seg) n
in
f Segment.Segs.empty' n
let ignore_lwt v =
Lwt.catch (fun () -> Lwt.bind v (fun _ -> Lwt.return_unit))
(function
| Error.Error e -> Format.eprintf "Error: %a@." Error.pp e; assert false
| exn -> raise exn)
let run_lwt = Lwt_main.run
let run_ignore_lwt v =
run_lwt (ignore_lwt v)
let exec_lwt f () = Lwt_main.run @@ f ()
let for_lwt start stop f =
let rec loop i =
if i >= stop then Lwt.return_unit
else
let* () = f i in
loop (i+1)
in
loop start
module SegmentSet = Set.Make( struct type t = Segment.t let compare = Segment.compare end )
module SegmentListSet = Set.Make(struct
type t = Segment.t list
let compare segs1 segs2 =
let n1 = List.length segs1 in
let n2 = List.length segs2 in
match compare n1 n2 with
| (1 | -1 as x) -> x
| 0 ->
let rec loop = function
| [] -> 0
| (seg1,seg2)::segss ->
match Segment.compare seg1 seg2 with
| (1 | -1 as x) -> x
| 0 -> loop segss
| _ -> assert false
in
loop @@ List.combine segs1 segs2
| _ -> assert false
end)
let get_leaves c =
Cursor.fold ~init:SegmentListSet.empty c (fun acc c ->
let _, v = Cursor.view c in
match v with
| Leaf (_, _, _) ->
`Continue, SegmentListSet.add (Path.to_segments @@ Cursor.path_of_cursor c) acc
| _ -> `Continue, acc)
let get_empty_buds c =
Cursor.fold ~init:[] c (fun acc c ->
let c, v = Cursor.view c in
match c, v with
| Cursor (Top, _, _, _), _ -> `Continue, acc
| _, Bud (None, _, _) -> `Continue, Cursor.path_of_cursor c :: acc
| _ -> `Continue, acc)
module NameStringSegment = struct
type t = string * Segment.t
let equal (s1,seg1) (s2,seg2) = s1 = s2 && Segment.equal seg1 seg2
let to_string (s1,_) = Fs.Name8bits.to_string s1
let pp ppf (s1,seg1) = Format.fprintf ppf "%a|%a" Fs.Name8bits.pp s1 Segment.pp seg1
let to_segment (_,seg) = seg
let of_segment seg = Option.map (fun n -> (n,seg)) @@ Fs.Name8bits.of_segment seg
let test _ = assert false
let ( !/ ) s =
match String.split_by_char (function '/' -> true | _ -> false) s with
| "" :: ss ->
List.map (fun s ->
let seg =
Segment.unsafe_of_encoding (String.length s * 8 + 8)
(s ^ "\000")
in
s, seg) (List.filter (function "" -> false | _ -> true) ss)
| _ -> assert false
let ( ?/ ) segs = List.map fst segs
end