package decompress
Implementation of Zlib in OCaml
Install
Dune Dependency
Authors
Maintainers
Sources
decompress-v0.9.0.tbz
sha256=70dd782b258a51a37c3971b9bd96c656b161876d781e168a626e9bb437833e3b
sha512=34033405c8dca30f67c39cad8f50875e255644d0e0b88019091d59932aaf90d87445070228291b1d3d1c07a98ce97aeca11554daf1a8f3b04d043b4f6c1ab83c
doc/src/decompress.impl/decompress_lz77.ml.html
Source file decompress_lz77.ml
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362
module Safe = Decompress_safe
module Seq = Decompress_seq
module Hunk = Decompress_hunk
module Buffer = Decompress_buffer

(** Shorthand for [Format.fprintf], used by the pretty-printers below. *)
let pf = Format.fprintf

(** [repeat atm] is the 64-bit word whose eight bytes all equal the code of
    [atm]. [deffast] compares it against 8-byte reads of the input in order to
    extend a run of one repeated byte eight bytes at a time. *)
let repeat atm =
  let atm = Char.code atm |> Int64.of_int in
  let ( lor ) = Int64.logor in
  let ( lsl ) = Int64.shift_left in
  atm
  lor (atm lsl 8)
  lor (atm lsl 16)
  lor (atm lsl 24)
  lor (atm lsl 32)
  lor (atm lsl 40)
  lor (atm lsl 48)
  lor (atm lsl 56)

(** Configuration errors detected by {!default}: the level is outside [0..9]
    or the window bits are outside [8..15]. *)
type error = Invalid_level of int | Invalid_wbits of int

(** Pretty-printer for {!error}. *)
let pp_error fmt = function
  | Invalid_level level -> pf fmt "(Invalid_level %d)" level
  | Invalid_wbits wbits -> pf fmt "(Invalid_wbits %d)" wbits

(* The three exceptions below are only used as local control flow inside
   [deffast]; they are raised and caught within one iteration of its main
   loop. *)

(** [Match (len, dist)]: a match was found; [deffast] resumes the comparison at
    [anchor + len + 3] against the reference located [dist + 1] bytes back. *)
exception Match of int * int

(** [Literal chr]: no usable match at the anchor, emit [chr] as a literal. *)
exception Literal of char

(** Leaves the match-extension loops of [deffast]. *)
exception Break

(** State of the LZ77 pass.

    - [i_off], [i_pos], [i_len]: the input occupies the indices
      [i_off .. i_off + i_len - 1] of the source buffer and the scan starts at
      [i_off + i_pos];
    - [level]: index into [_hlog], validated by {!default} to be in [0..9];
    - [on]: callback invoked on every hunk, in emission order;
    - [state]: which step {!eval} performs next;
    - [witness]: passed to every [Safe] accessor. *)
type 'i t =
  { i_off: int
  ; i_pos: int
  ; i_len: int
  ; level: int
  ; on: Hunk.t -> unit
  ; state: 'i state
  ; witness: 'i Buffer.t }

(** [Deflate], [Deffast] and [Choose] carry the window bits; [Exception]
    records a configuration error that {!eval} reports. *)
and 'i state =
  | Deflate of int
  | Deffast of int
  | Choose of int
  | Exception of error

(** Result of one evaluation step: continue with a new state, hand hunks back
    to the caller, or fail. *)
and 'i res =
  | Cont of 'i t
  | Wait of 'i t * Hunk.t Seq.t
  | Error of 'i t * error

(* XXX: we do not have an [Ok] result because this algorithm does not decide
   whether the compression has to stop or not - this is decided by the user.
   It is illogical to force an [`End] state with this algorithm. *)

(** Pretty-printer for {!state}. *)
let pp_state ppf = function
  | Deflate wbits -> pf ppf "(Deflate wbits:%d)" wbits
  | Deffast wbits -> pf ppf "(Deffast wbits:%d)" wbits
  | Choose wbits -> pf ppf "(Choose wbits:%d)" wbits
  | Exception exn -> pf ppf "(Exception @[%a@])" pp_error exn

(** Pretty-printer for {!t}; the [on] callback is printed as a placeholder and
    the witness is not printed. *)
let pp ppf {i_off; i_pos; i_len; level; state; _} =
  pf ppf
    "{@[<hov>i_off = %d;@ i_pos = %d;@ i_len = %d;@ level = %d;@ on = #fun;@ \
     state = @[%a@]@]}"
    i_off i_pos i_len level pp_state state

(** [await t lst] hands the hunks [lst] back to the caller. *)
let await t lst : 'i res = Wait (t, lst)

(** [error t exn] fails with [exn] and records it in the state, so that any
    later evaluation reports the same error. *)
let error t exn : 'i res = Error ({t with state= Exception exn}, exn)

(* Tuning constants of [deffast]. NOTE(review): presumably ported from blosclz
   (MAX_DISTANCE, IP_BOUNDARY) - confirm against the reference sources. *)

(** At levels >= 5, [deffast] requires two extra matching bytes for any match
    at least this far away. *)
let _max_distance = 8191

(** Upper bound used by the match-extension loops. *)
let _max_length = 256

(** Number of bytes consumed by one [Safe.get_64] comparison. *)
let _size_of_int64 = 8

(** Number of bytes at the end of the input that match extension in [deffast]
    never crosses. *)
let _idx_boundary = 2

(** Hash key of a position: the 32-bit word read at that position, or [None]
    when fewer than four bytes remain before the end of the input. *)
type key = int32 option

(** [key witness src idx len] is the key of position [idx], where [len] is the
    exclusive end index of the input in [src]. *)
let key witness src idx len : key =
  if idx < len - 3 then Some (Safe.get_32 witness src idx) else None

(** Hash table used as a multi-map: every key is bound to the list of the
    positions added for it, most recently added first. *)
module T = struct
  (** [find table x] is the list bound to [x], or [[]] when [x] is unbound. *)
  let find table x = try Hashtbl.find table x with Not_found -> []

  (** [add key value table] pushes [value] in front of the list bound to
      [key]. *)
  let add key value table =
    let rest = find table key in
    Hashtbl.replace table key (value :: rest)
end

(** [longuest_substring witness src x y len] is [Some n], where [n >= 1] is the
    length of the longest common run of bytes starting at [x] and at [y], or
    [None] when not even one byte matches. The run is capped at [_max_length],
    never lets the run starting at [x] reach [y], and stops before index
    [len]. *)
let longuest_substring witness src x y len =
  let rec aux acc l =
    if
      l < _max_length
      && x + l < y
      && y + l < len
      && Safe.get witness src (x + l) = Safe.get witness src (y + l)
    then aux (Some (l + 1)) (l + 1)
    else acc
  in
  aux None 0

(* XXX: from ocaml-lz77, not optimized, but this algorithm has no constraint
   on the size of the input. bisous @samoht. *)

(** [deflate ?max_fardistance src t] scans the input described by [t] and
    returns the sequence of literals and matches that describes it. Every hunk
    is also passed to [t.on] as soon as it is produced.

    A match of [len] bytes located [dist] bytes back is emitted as
    [Hunk.Match (len - 3, dist - 1)]; only matches of at least 3 bytes closer
    than [max_fardistance] are considered. *)
let deflate ?(max_fardistance = (1 lsl 15) - 1) src t =
  let results = Queue.create () in
  let src_idx = ref (t.i_off + t.i_pos) in
  let table = Hashtbl.create 1024 in
  (* Number of pending literals, i.e. the bytes located just before [!src_idx]
     which have been scanned but not emitted yet. *)
  let last = ref 0 in
  let flush_last () =
    if !last <> 0 then (
      for i = 0 to !last - 1 do
        let hunk =
          Hunk.Literal (Safe.get t.witness src (!src_idx - !last + i))
        in
        t.on hunk ; Queue.push hunk results
      done ;
      last := 0 )
  in
  (* [find_match idx] is [Some (distance, length)] for the longest match found
     among the earlier positions sharing the key of [idx]. *)
  let find_match idx =
    (* Keeps the longest candidate; on a tie the first argument wins. *)
    let max a b =
      match (a, b) with
      | Some (_, x), Some (_, y) -> if x >= y then a else b
      | Some _, None -> a
      | None, Some _ -> b
      | None, None -> None
    in
    let key = key t.witness src idx (t.i_off + t.i_len) in
    let candidates = T.find table key in
    let rec aux acc = function
      | [] -> acc
      | x :: r -> (
          (* Candidates are stored most recent first, so the search stops at
             the first one which is out of reach. *)
          if x >= idx || idx - x >= max_fardistance then acc
          else
            match
              longuest_substring t.witness src x idx (t.i_off + t.i_len)
            with
            | Some len when len >= 3 -> aux (max acc (Some (x, len))) r
            | _ -> aux acc r )
    in
    match aux None candidates with
    | None -> None
    | Some (i, len) -> Some (idx - i, len)
  in
  while !src_idx < t.i_off + t.i_len do
    match find_match !src_idx with
    | None ->
        T.add (key t.witness src !src_idx (t.i_off + t.i_len)) !src_idx table ;
        incr last ;
        incr src_idx
    | Some (start, len) ->
        (* Register every position covered by the match. *)
        for i = !src_idx to !src_idx + len - 1 do
          T.add (key t.witness src i (t.i_off + t.i_len)) i table
        done ;
        flush_last () ;
        t.on (Hunk.Match (len - 3, start - 1)) ;
        Queue.push (Hunk.Match (len - 3, start - 1)) results ;
        src_idx := !src_idx + len
  done ;
  flush_last () ;
  Seq.of_queue results

(** [_hlog.(level)] is the base-2 logarithm of the size of the hash table used
    by [deffast] at that level. *)
let _hlog = [|0; 11; 11; 11; 12; 13; 13; 13; 13; 13|]

(* Same as blosclz, fast and imperative implementation *)

(** [deffast ?accel ?max_fardistance src t] is the fast counterpart of
    {!deflate}: it returns the sequence of hunks describing the input and
    passes each of them to [t.on] when it is produced.

    The first two bytes are always emitted as literals and read without any
    check, so the input must hold at least two bytes; {!eval} only calls this
    function when [t.i_len >= 12].

    - [accel]: values above [1] make the hash table refresh less often (an
      entry is replaced only when [distance land (accel - 1) = 0]);
    - [max_fardistance]: matches at this distance or further are rejected. *)
let deffast : type a.
       ?accel:int
    -> ?max_fardistance:int
    -> (Safe.ro, a) Safe.t
    -> a t
    -> Hunk.t Seq.t =
 fun ?(accel = 1) ?(max_fardistance = (1 lsl 15) - 1) src t ->
  let src_idx = ref (t.i_off + t.i_pos) in
  let hash_log = _hlog.(t.level) in
  let hash_len = 1 lsl hash_log in
  (* Maps a hash value to a position relative to [t.i_off]. *)
  let hash_tab = Array.make hash_len 0 in
  let results = Queue.create () in
  let accel = if accel < 1 then 0 else accel - 1 in
  t.on (Hunk.Literal (Safe.get t.witness src !src_idx)) ;
  Queue.push (Hunk.Literal (Safe.get t.witness src !src_idx)) results ;
  incr src_idx ;
  t.on (Hunk.Literal (Safe.get t.witness src !src_idx)) ;
  Queue.push (Hunk.Literal (Safe.get t.witness src !src_idx)) results ;
  incr src_idx ;
  (* [c ref idx] compares the bytes at [!ref] and [!idx]; when they are equal
     both cursors advance and the result is [true]. Any exception raised by
     the accessors is deliberately treated as a mismatch. *)
  let c ref idx =
    try
      if Safe.get t.witness src !ref = Safe.get t.witness src !idx then (
        incr ref ; incr idx ; true )
      else false
    with _ -> false
  in
  while !src_idx < t.i_off + t.i_len - 12 do
    let anchor = !src_idx in
    let src_ref = ref !src_idx in
    try
      (* Run detection: the byte at the anchor repeats the previous one and
         the next two bytes repeat that pair. *)
      if
        Safe.get t.witness src !src_idx = Safe.get t.witness src (!src_idx - 1)
        && Safe.get_16 t.witness src (!src_idx - 1)
           = Safe.get_16 t.witness src (!src_idx + 1)
      then raise (Match (0, 0)) (* (+3, +1) *) ;
      let hval =
        let v = Safe.get_16 t.witness src !src_idx in
        let v =
          Safe.get_16 t.witness src (!src_idx + 1)
          lxor (v lsr (16 - hash_log))
          lxor v
        in
        v land ((1 lsl hash_log) - 1)
      in
      (* [hash_tab] holds positions relative to [t.i_off] (see the store
         below), so the entry is rebased before it is used as an index into
         [src]; otherwise the candidate and the distance are wrong as soon as
         [t.i_off <> 0]. *)
      src_ref := t.i_off + hash_tab.(hval) ;
      let distance = anchor - !src_ref in
      if distance land accel = 0 then hash_tab.(hval) <- anchor - t.i_off ;
      (* A match needs at least three equal bytes. *)
      if
        distance = 0
        || distance >= max_fardistance
        || c src_ref src_idx = false
        || c src_ref src_idx = false
        || c src_ref src_idx = false
      then raise (Literal (Safe.get t.witness src anchor)) ;
      (* Far matches need two more equal bytes at the highest levels. *)
      if t.level >= 5 && distance >= _max_distance then
        if c src_ref src_idx = false || c src_ref src_idx = false then
          raise (Literal (Safe.get t.witness src anchor))
        else raise (Match (2, distance - 1)) (* (+3, +1) *) ;
      raise (Match (!src_idx - anchor - 3, distance - 1))
    with
    | Match (len, 0) -> (
        (* Distance of one byte: the match is a run of [pattern]. *)
        let pattern = Safe.get t.witness src (anchor + len - 1) in
        let v1 = repeat pattern in
        (*  _ _ _ _
         * |_|_|_|_|
         * | | | | src_idx
         * | | | src_ref
         * | | anchor
         * | -1
         *)
        src_idx := anchor + (len + 3) ;
        (* XXX: in blosclz, [src_ref = anchor - 1 + 3], but in this case, we
           accept 1 wrong byte. *)
        src_ref := anchor + (len + 3) ;
        try
          (* Extend the run eight bytes at a time, then byte by byte inside
             the first word which differs. *)
          while
            !src_idx < t.i_off + t.i_len - _size_of_int64 - (2 * _idx_boundary)
            && !src_idx - 3 - anchor < _max_length - _size_of_int64
          do
            let v2 = Safe.get_64 t.witness src !src_ref in
            if v1 <> v2 then (
              while
                !src_idx < t.i_off + t.i_len - _idx_boundary
                && !src_idx - 3 - anchor < _max_length
              do
                if Safe.get t.witness src !src_ref <> pattern then raise Break
                else ( incr src_ref ; incr src_idx )
              done ;
              raise Break )
            else (
              src_idx := !src_idx + 8 ;
              src_ref := !src_ref + 8 )
          done ;
          raise Break
        with Break ->
          (* Clamp both cursors back to the boundary when the extension ran
             past it; [l] is the overshoot, as [ip - ip_bound] in blosclz. *)
          if !src_idx > t.i_off + t.i_len - _idx_boundary then (
            let l = !src_idx - (t.i_off + t.i_len - _idx_boundary) in
            src_idx := !src_idx - l ;
            src_ref := !src_ref - l ) ;
          t.on (Hunk.Match (!src_idx - 3 - anchor, 0)) ;
          Queue.push (Hunk.Match (!src_idx - 3 - anchor, 0)) results )
    | Match (len, dist) -> (
        src_idx := anchor + (len + 3) ;
        src_ref := anchor - (dist + 1) + (len + 3) ;
        try
          (* Same extension scheme as above, comparing the input with the
             reference instead of a repeated byte. *)
          while
            !src_idx < t.i_off + t.i_len - _size_of_int64 - (2 * _idx_boundary)
            && !src_idx - 3 - anchor < _max_length - _size_of_int64
          do
            if
              Safe.get_64 t.witness src !src_idx
              <> Safe.get_64 t.witness src !src_ref
            then (
              while
                !src_idx < t.i_off + t.i_len - _idx_boundary
                && !src_idx - 3 - anchor < _max_length
              do
                if c src_ref src_idx = false then raise Break
              done ;
              raise Break )
            else (
              src_idx := !src_idx + 8 ;
              src_ref := !src_ref + 8 )
          done ;
          raise Break
        with Break ->
          (* Clamp both cursors back to the boundary when the extension ran
             past it; [l] is the overshoot, as [ip - ip_bound] in blosclz. *)
          if !src_idx > t.i_off + t.i_len - _idx_boundary then (
            let l = !src_idx - (t.i_off + t.i_len - _idx_boundary) in
            src_idx := !src_idx - l ;
            src_ref := !src_ref - l ) ;
          t.on (Hunk.Match (!src_idx - 3 - anchor, dist)) ;
          Queue.push (Hunk.Match (!src_idx - 3 - anchor, dist)) results )
    | Literal chr ->
        (* The probes may have moved the cursor: restart right after the
           anchor. *)
        src_idx := anchor + 1 ;
        t.on (Hunk.Literal chr) ;
        Queue.push (Hunk.Literal chr) results
  done ;
  (* The bytes left at the end of the input are emitted as literals. *)
  while !src_idx < t.i_off + t.i_len do
    (let hunk = Hunk.Literal (Safe.get t.witness src !src_idx) in
     t.on hunk ; Queue.push hunk results) ;
    incr src_idx
  done ;
  Seq.of_queue results

(** [eval src t] runs the state machine until it has something to report:

    - [`Await (t, hunks)]: the whole input has been consumed and described by
      [hunks] (empty when the input had already been consumed); call
      {!refill} before the next evaluation;
    - [`Error (t, exn)]: [t] was built from an invalid configuration.

    Inputs of at least 12 bytes go through {!deffast}, shorter ones through
    {!deflate}. *)
let eval src t =
  let eval0 t =
    match t.state with
    | Deflate wbits ->
        if t.i_len >= 12 then Cont {t with state= Deffast wbits}
        else
          let hunks = deflate ~max_fardistance:((1 lsl wbits) - 1) src t in
          await {t with state= Choose wbits; i_pos= t.i_len} hunks
    | Deffast wbits ->
        if t.i_len >= 12 then
          let hunks = deffast ~max_fardistance:((1 lsl wbits) - 1) src t in
          await {t with state= Choose wbits; i_pos= t.i_len} hunks
        else Cont {t with state= Deflate wbits}
    | Choose _ -> await t Seq.empty
    | Exception exn -> error t exn
  in
  let rec loop t =
    match eval0 t with
    | Cont t -> loop t
    | Wait (t, hunks) -> `Await (t, hunks)
    | Error (t, exn) -> `Error (t, exn)
  in
  loop t

(** [refill off len t] gives a new input of [len] bytes starting at [off] to
    [t] and rewinds the position to [0].

    @raise Invalid_argument if the previous input has not been fully
    consumed. *)
let refill off len t =
  if t.i_len - t.i_pos = 0 then
    match t.state with
    | Choose window_bits ->
        {t with i_off= off; i_len= len; i_pos= 0; state= Deflate window_bits}
    | Deflate _ | Deffast _ | Exception _ ->
        {t with i_off= off; i_len= len; i_pos= 0}
  else
    invalid_arg
      (Format.sprintf "L.refill: you lost something (pos: %d, len: %d)" t.i_pos
         t.i_len)

(** [used_in t] is the number of input bytes consumed so far. *)
let used_in t = t.i_pos

(** [default ~witness ?level ?on wbits] is a fresh state with an empty input.
    [level] must be in [0..9] and [wbits] in [8..15]; otherwise the state is
    created in the [Exception] state and {!eval} returns the corresponding
    error. When both are invalid, the invalid [wbits] is the one reported. *)
let default ~witness ?(level = 0) ?(on = fun _ -> ()) wbits =
  if level >= 0 && level <= 9 && wbits >= 8 && wbits <= 15 then
    {i_off= 0; i_pos= 0; i_len= 0; level; on; state= Deflate wbits; witness}
  else if wbits >= 8 && wbits <= 15 then
    { i_off= 0
    ; i_pos= 0
    ; i_len= 0
    ; level= 0
    ; on
    ; state= Exception (Invalid_level level)
    ; witness }
  else
    { i_off= 0
    ; i_pos= 0
    ; i_len= 0
    ; level= 0
    ; on
    ; state= Exception (Invalid_wbits wbits)
    ; witness }
sectionYPositions = computeSectionYPositions($el), 10)"
x-init="setTimeout(() => sectionYPositions = computeSectionYPositions($el), 10)"
>