package decompress
Pure OCaml implementation of Zlib
Install
Dune Dependency
Authors
Maintainers
Sources
decompress-0.8.tbz
sha256=ea6987f72816044ccf3edb586e3b64668d53c5ef1b0a735119e5c9d740504240
md5=547eaf0803af3ed01ff7801facfe27e6
doc/src/decompress.impl/decompress_lz77.ml.html
Source file decompress_lz77.ml
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431
module Safe = Decompress_safe
module Seq = Decompress_seq
module Hunk = Decompress_hunk

(** [repeat atm] builds the 64-bit word whose eight bytes are all equal to the
    character code of [atm]. [deffast] compares it against 8-byte reads to
    extend a run of a single repeated byte. *)
let repeat atm =
  let atm = Char.code atm |> Int64.of_int in
  let ( lor ) = Int64.logor in
  let ( lsl ) = Int64.shift_left in
  atm
  lor (atm lsl 8)
  lor (atm lsl 16)
  lor (atm lsl 24)
  lor (atm lsl 32)
  lor (atm lsl 40)
  lor (atm lsl 48)
  lor (atm lsl 56)

(** Configuration errors detected by [default]. *)
type error =
  | Invalid_level of int
  | Invalid_wbits of int

(** Pretty-printer for [error]. *)
let pp_error fmt = function
  | Invalid_level level -> Format.fprintf fmt "(Invalid_level %d)" level
  | Invalid_wbits wbits -> Format.fprintf fmt "(Invalid_wbits %d)" wbits

(* Control-flow exceptions, local to [deffast]:
   - [Match (len, dist)]: a match was found; both values are already biased
     the same way as the payload of [Hunk.Match] (length - 3, distance - 1);
   - [Literal chr]: no match at the anchor, emit [chr];
   - [Break]: leave the match-extension loops. *)
exception Match of int * int
exception Literal of char
exception Break

(* State of the compressor.
   - [i_off], [i_len]: the input occupies [i_off .. i_off + i_len - 1] of the
     source buffer;
   - [i_pos]: compression starts at [i_off + i_pos]; [eval] sets it to [i_len]
     once the input has been processed;
   - [level]: used as an index into [_hlog] by [deffast];
   - [on]: callback invoked on every hunk as soon as it is produced;
   - [state]: which algorithm runs next, see [eval]. *)
type 'i t =
  { i_off : int
  ; i_pos : int
  ; i_len : int
  ; level : int
  ; on : Hunk.t -> unit
  ; state : 'i state }
and 'i state =
  | Deflate of int
  | Deffast of int
  | Choose of int
  | Exception of error
and 'i res =
  | Cont of 'i t
  | Wait of 'i t * Hunk.t Seq.t
  | Error of 'i t * error
  (** XXX: there is no [Ok] result because this algorithm does not decide
      whether the compression must stop or not - that decision belongs to the
      user. It would be illogical to force an [`End] state from this
      algorithm. *)

(** Pretty-printer for [state]. *)
let pp_state fmt = function
  | Deflate wbits -> Format.fprintf fmt "(Deflate wbits:%d)" wbits
  | Deffast wbits -> Format.fprintf fmt "(Deffast wbits:%d)" wbits
  | Choose wbits -> Format.fprintf fmt "(Choose wbits:%d)" wbits
  | Exception exn -> Format.fprintf fmt "(Exception %a)" pp_error exn

(** Pretty-printer for [t]; the [on] callback is printed as [#fun]. *)
let pp fmt { i_off; i_pos; i_len; level; state; _ } =
  Format.fprintf fmt "{@[<hov>i_off = %d;@ \
                      i_pos = %d;@ \
                      i_len = %d;@ \
                      level = %d;@ \
                      on = #fun;@ \
                      state = %a@]}"
    i_off i_pos i_len level pp_state state

(* [await t lst] wraps a state and the hunks produced so far in [Wait]. *)
let await t lst = Wait (t, lst)

(* [error t exn] records [exn] in the state and wraps both in [Error]. *)
let error t exn = Error ({ t with state = Exception exn }, exn)

(* Tuning constants. [_max_length] bounds the length of a match in both
   [longuest_substring] and [deffast]; [_max_distance] is the distance from
   which [deffast] (at level >= 5) requires two extra matching bytes;
   [_size_of_int64] and [_idx_boundary] are the margins kept before the end
   of the input by the 8-byte and byte-wise extension loops of [deffast]. *)
let _max_distance = 8191
let _max_length = 256
let _size_of_int64 = 8
let _idx_boundary = 2

type key = Int32.t option

(** [key src idx len] is [Some] of the 32-bit value read at [idx] when
    [idx < len - 3], [None] otherwise (too close to the end [len]). *)
let key src idx len : key =
  if idx < len - 3 then Some (Safe.get_u32 src idx) else None

(* Multi-map on top of [Hashtbl]: every key is bound to the list of values
   added for it, most recently added first. *)
module T = struct
  (* [find table x] is the list bound to [x], or [[]] when [x] is unbound. *)
  let find table x = try Hashtbl.find table x with Not_found -> []

  (* [add key value table] pushes [value] in front of the list bound to
     [key]. *)
  let add key value table =
    let rest = find table key in
    Hashtbl.replace table key (value :: rest)
end

(** [longuest_substring src x y len] counts how many consecutive bytes are
    equal when reading [src] from [x] and from [y]. The count stops at
    [_max_length], when the span starting at [x] would reach [y] (no
    overlap), or when the span starting at [y] would reach [len]. Returns
    [None] when not even the first byte matches. *)
let longuest_substring src x y len =
  let rec aux acc l =
    if l < _max_length
       && x + l < y
       && y + l < len
       && Safe.get src (x + l) = Safe.get src (y + l)
    then aux (Some (l + 1)) (l + 1)
    else acc
  in
  aux None 0

(* XXX: from ocaml-lz77, not optimized but this algorithm has no constraint.
   bisoux @samoht. *)

(** [deflate ?max_fardistance src t] compresses the bytes
    [t.i_off + t.i_pos .. t.i_off + t.i_len - 1] of [src] and returns the
    resulting hunks. Every hunk is also passed to [t.on] when it is produced.

    Positions are indexed in a hash table by [key]. A match is emitted when
    an earlier position with the same key, closer than [max_fardistance],
    shares at least 3 bytes with the current position; it is emitted as
    [Hunk.Match (length - 3, distance - 1)]. Any other byte is emitted as a
    [Hunk.Literal]. *)
let deflate ?(max_fardistance = (1 lsl 15) - 1) src t =
  let results = Queue.create () in
  let src_idx = ref (t.i_off + t.i_pos) in
  let table = Hashtbl.create 1024 in
  (* number of bytes just before [!src_idx] not emitted yet *)
  let last = ref 0 in
  let flush_last () =
    if !last <> 0
    then begin
      for i = 0 to !last - 1 do
        t.on (Hunk.Literal (Safe.get src (!src_idx - !last + i)));
        Queue.push (Hunk.Literal (Safe.get src (!src_idx - !last + i))) results
      done;
      last := 0
    end
  in
  let find_match idx =
    (* keep the longer candidate; on a tie the first argument wins *)
    let max a b =
      match a, b with
      | Some (_, x), Some (_, y) -> if x >= y then a else b
      | Some _, None -> a
      | None, Some _ -> b
      | None, None -> None
    in
    let key = key src idx (t.i_off + t.i_len) in
    let candidates = T.find table key in
    let rec aux acc = function
      | [] -> acc
      | x :: r ->
        (* candidates are most recent first: the scan stops at the first one
           which is not strictly before [idx] or which is too far *)
        if x >= idx || idx - x >= max_fardistance
        then acc
        else
          match longuest_substring src x idx (t.i_off + t.i_len) with
          | Some len when len >= 3 -> aux (max acc (Some (x, len))) r
          | _ -> aux acc r
    in
    match aux None candidates with
    | None -> None
    | Some (i, len) -> Some (idx - i, len)
  in
  while !src_idx < t.i_off + t.i_len do
    match find_match !src_idx with
    | None ->
      T.add (key src !src_idx (t.i_off + t.i_len)) !src_idx table;
      incr last;
      incr src_idx
    | Some (start, len) ->
      (* index every position covered by the match *)
      for i = !src_idx to !src_idx + len - 1 do
        T.add (key src i (t.i_off + t.i_len)) i table
      done;
      flush_last ();
      t.on (Hunk.Match (len - 3, start - 1));
      Queue.push (Hunk.Match (len - 3, start - 1)) results;
      src_idx := !src_idx + len
  done;
  flush_last ();
  Seq.of_queue results

(* Size (log2) of the hash table used by [deffast], indexed by [t.level]. *)
let _hlog = [| 0; 11; 11; 11; 12; 13; 13; 13; 13; 13 |]

(* Same as blosclz, fast and imperative implementation *)

(** [deffast ?accel ?max_fardistance src t] compresses the bytes
    [t.i_off + t.i_pos .. t.i_off + t.i_len - 1] of [src] and returns the
    resulting hunks. Every hunk is also passed to [t.on] when it is produced.

    The first two bytes are always emitted as literals and read without any
    bound check; [eval] only calls this function when [t.i_len >= 12].

    - [accel]: the hash table is updated only when
      [distance land (accel - 1) = 0] (always, with the default value);
    - [max_fardistance]: candidates at this distance or further are
      rejected. *)
let deffast : type a.
     ?accel:int
  -> ?max_fardistance:int
  -> (Safe.read, a) Safe.t
  -> a t
  -> Hunk.t Seq.t =
 fun ?(accel = 1) ?(max_fardistance = (1 lsl 15) - 1) src t ->
  let src_idx = ref (t.i_off + t.i_pos) in
  let hash_log = Array.get _hlog t.level in
  let hash_len = 1 lsl hash_log in
  let hash_tab = Array.make hash_len 0 in
  let results = Queue.create () in
  let accel = if accel < 1 then 0 else accel - 1 in
  t.on (Hunk.Literal (Safe.get src !src_idx));
  Queue.push (Hunk.Literal (Safe.get src !src_idx)) results;
  incr src_idx;
  t.on (Hunk.Literal (Safe.get src !src_idx));
  Queue.push (Hunk.Literal (Safe.get src !src_idx)) results;
  incr src_idx;
  (* [c ref idx] compares the bytes at [!ref] and [!idx]; when they are equal
     both cursors advance and the result is [true]. Any exception raised by
     the reads is treated as a mismatch. *)
  let c ref idx =
    try
      if Safe.get src !ref = Safe.get src !idx
      then begin
        incr ref;
        incr idx;
        true
      end
      else false
    with _ -> false
  in
  while !src_idx < t.i_off + t.i_len - 12 do
    let anchor = !src_idx in
    let src_ref = ref !src_idx in
    try
      (* run of a single byte: the previous byte and the next ones are equal *)
      if Safe.get src !src_idx = Safe.get src (!src_idx - 1)
         && Safe.get_u16 src (!src_idx - 1) = Safe.get_u16 src (!src_idx + 1)
      then raise (Match (0, 0)) (* (+3, +1) *);
      let hval =
        let v = Safe.get_u16 src !src_idx in
        let v =
          (Safe.get_u16 src (!src_idx + 1) lxor (v lsr (16 - hash_log)))
          lxor v
        in
        v land ((1 lsl hash_log) - 1)
      in
      (* [hash_tab] holds offsets relative to [t.i_off] (see the [Array.set]
         below): rebase the candidate to an absolute index before measuring
         the distance or reading [src] through it. *)
      src_ref := t.i_off + Array.get hash_tab hval;
      let distance = anchor - !src_ref in
      if distance land accel = 0
      then Array.set hash_tab hval (anchor - t.i_off);
      (* a match needs at least 3 equal bytes *)
      if distance = 0
         || distance >= max_fardistance
         || c src_ref src_idx = false
         || c src_ref src_idx = false
         || c src_ref src_idx = false
      then raise (Literal (Safe.get src anchor));
      (* far matches must be at least 5 bytes long *)
      if t.level >= 5 && distance >= _max_distance
      then
        if c src_ref src_idx = false || c src_ref src_idx = false
        then raise (Literal (Safe.get src anchor))
        else raise (Match (2, distance - 1)) (* (+3, +1) *);
      raise (Match (!src_idx - anchor - 3, distance - 1))
    with
    | Match (len, 0) -> begin
        let pattern = Safe.get src (anchor + len - 1) in
        let v1 = repeat pattern in
        (*  _ _ _ _
         * |_|_|_|_|
         * | | | | src_idx
         * | | | src_ref
         * | | anchor
         * | -1
         *)
        src_idx := anchor + (len + 3);
        (* XXX: in blosclz, [src_ref = anchor - 1 + 3], but in this case, we
           accept 1 wrong byte. *)
        src_ref := anchor + (len + 3);
        try
          (* extend the run 8 bytes at a time, then byte by byte *)
          while !src_idx
                < (t.i_off + t.i_len) - _size_of_int64 - (2 * _idx_boundary)
                && !src_idx - 3 - anchor < _max_length - _size_of_int64
          do
            let v2 = Safe.get_u64 src !src_ref in
            if v1 <> v2
            then begin
              while !src_idx < (t.i_off + t.i_len) - _idx_boundary
                    && !src_idx - 3 - anchor < _max_length
              do
                if Safe.get src !src_ref <> pattern
                then raise Break
                else begin
                  incr src_ref;
                  incr src_idx
                end
              done;
              raise Break
            end
            else begin
              src_idx := !src_idx + 8;
              src_ref := !src_ref + 8
            end
          done;
          raise Break
        with Break -> begin
            if !src_idx > t.i_off + t.i_len - _idx_boundary
            then begin
              (* step back by the overshoot past the boundary; parenthesised
                 so that [_idx_boundary] is added back, not subtracted a
                 second time *)
              let l = !src_idx - (t.i_off + t.i_len - _idx_boundary) in
              src_idx := !src_idx - l;
              src_ref := !src_ref - l
            end;
            t.on (Hunk.Match (!src_idx - 3 - anchor, 0));
            Queue.push (Hunk.Match (!src_idx - 3 - anchor, 0)) results
          end
      end
    | Match (len, dist) -> begin
        src_idx := anchor + (len + 3);
        src_ref := anchor - (dist + 1) + (len + 3);
        try
          (* extend the match 8 bytes at a time, then byte by byte *)
          while !src_idx
                < (t.i_off + t.i_len) - _size_of_int64 - (2 * _idx_boundary)
                && !src_idx - 3 - anchor < _max_length - _size_of_int64
          do
            if Safe.get_u64 src !src_idx <> Safe.get_u64 src !src_ref
            then begin
              while !src_idx < (t.i_off + t.i_len) - _idx_boundary
                    && !src_idx - 3 - anchor < _max_length
              do
                if c src_ref src_idx = false then raise Break
              done;
              raise Break
            end
            else begin
              src_idx := !src_idx + 8;
              src_ref := !src_ref + 8
            end
          done;
          raise Break
        with Break -> begin
            if !src_idx > t.i_off + t.i_len - _idx_boundary
            then begin
              (* step back by the overshoot past the boundary; parenthesised
                 so that [_idx_boundary] is added back, not subtracted a
                 second time *)
              let l = !src_idx - (t.i_off + t.i_len - _idx_boundary) in
              src_idx := !src_idx - l;
              src_ref := !src_ref - l
            end;
            t.on (Hunk.Match (!src_idx - 3 - anchor, dist));
            Queue.push (Hunk.Match (!src_idx - 3 - anchor, dist)) results
          end
      end
    | Literal chr -> begin
        (* the comparisons may have moved [src_idx]: restart after the anchor *)
        src_idx := anchor + 1;
        t.on (Hunk.Literal chr);
        Queue.push (Hunk.Literal chr) results
      end
  done;
  (* the tail of the input is emitted as literals *)
  while !src_idx < t.i_off + t.i_len do
    t.on (Hunk.Literal (Safe.get src !src_idx));
    Queue.push (Hunk.Literal (Safe.get src !src_idx)) results;
    incr src_idx
  done;
  Seq.of_queue results

(** [eval src t] runs the compressor on the current input and returns
    [`Await (t, hunks)] or [`Error (t, exn)].

    [deffast] is used when [t.i_len >= 12], [deflate] otherwise, whichever of
    the [Deflate] / [Deffast] states is current. After a run the state becomes
    [Choose] and [i_pos] is set to [i_len]; evaluating a [Choose] state
    returns no hunks until [refill] is called. *)
let eval src t =
  let eval0 t =
    match t.state with
    | Deflate wbits ->
      if t.i_len >= 12
      then Cont { t with state = Deffast wbits }
      else
        let hunks = deflate ~max_fardistance:((1 lsl wbits) - 1) src t in
        await { t with state = Choose wbits; i_pos = t.i_len } hunks
    | Deffast wbits ->
      if t.i_len >= 12
      then
        let hunks = deffast ~max_fardistance:((1 lsl wbits) - 1) src t in
        await { t with state = Choose wbits; i_pos = t.i_len } hunks
      else Cont { t with state = Deflate wbits }
    | Choose _ -> await t Seq.empty
    | Exception exn -> error t exn
  in
  let rec loop t =
    match eval0 t with
    | Cont t -> loop t
    | Wait (t, hunks) -> `Await (t, hunks)
    | Error (t, exn) -> `Error (t, exn)
  in
  loop t

(** [refill off len t] gives a new input window [off, len] to the compressor
    and resets [i_pos] to 0. A [Choose] state goes back to [Deflate]; any
    other state is kept.

    @raise Invalid_argument if the previous input was not entirely consumed
    ([t.i_len - t.i_pos <> 0]). *)
let refill off len t =
  if t.i_len - t.i_pos = 0
  then
    match t.state with
    | Choose window_bits ->
      { t with i_off = off
             ; i_len = len
             ; i_pos = 0
             ; state = Deflate window_bits }
    | _ -> { t with i_off = off; i_len = len; i_pos = 0 }
  else
    invalid_arg
      (Format.sprintf "L.refill: you lost something (pos: %d, \
                       len: %d)" t.i_pos t.i_len)

(** [used_in t] is the current value of [t.i_pos]. *)
let used_in t = t.i_pos

(** [default ?level ?on wbits] makes an initial state with an empty input.

    [level] must be in [0..9] and [wbits] in [8..15]. Otherwise the state is
    [Exception (Invalid_wbits wbits)] when [wbits] is out of range, else
    [Exception (Invalid_level level)], and [eval] will report that error. *)
let default ?(level = 0) ?(on = fun _ -> ()) wbits =
  if level >= 0 && level <= 9 && wbits >= 8 && wbits <= 15
  then
    { i_off = 0
    ; i_pos = 0
    ; i_len = 0
    ; level
    ; on
    ; state = Deflate wbits }
  else if wbits >= 8 && wbits <= 15
  then
    { i_off = 0
    ; i_pos = 0
    ; i_len = 0
    ; level = 0
    ; on
    ; state = Exception (Invalid_level level) }
  else
    { i_off = 0
    ; i_pos = 0
    ; i_len = 0
    ; level = 0
    ; on
    ; state = Exception (Invalid_wbits wbits) }
sectionYPositions = computeSectionYPositions($el), 10)"
x-init="setTimeout(() => sectionYPositions = computeSectionYPositions($el), 10)"
>