package dose3

  1. Overview
  2. Docs
Legend:
Page
Library
Module
Module type
Parameter
Class
Class type
Source

Source file input.ml

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
(**************************************************************************************)
(*  Copyright (C) 2009 Pietro Abate <pietro.abate@pps.jussieu.fr>                     *)
(*  Copyright (C) 2009 Mancoosi Project                                               *)
(*                                                                                    *)
(*  This library is free software: you can redistribute it and/or modify              *)
(*  it under the terms of the GNU Lesser General Public License as                    *)
(*  published by the Free Software Foundation, either version 3 of the                *)
(*  License, or (at your option) any later version.  A special linking                *)
(*  exception to the GNU Lesser General Public License applies to this                *)
(*  library, see the COPYING file for more information.                               *)
(**************************************************************************************)

open ExtLib

include Util.Logging (struct
  let label = "dose_common.input"
end)

let gzip_open_file file =
  let ch = Gzip.open_in file in
  let input_char ch =
    try Gzip.input_char ch with End_of_file -> raise IO.No_more_input
  in
  let read ch =
    try Gzip.input ch with End_of_file -> raise IO.No_more_input
  in
  IO.create_in
    ~read:(fun () -> input_char ch)
    ~input:(read ch)
    ~close:(fun () -> Gzip.close_in ch)

let xz_open_file file =
  let ch = Unix.open_process_in ("xzcat " ^ file) in
  let read ch = try input ch with End_of_file -> raise IO.No_more_input in
  IO.create_in
    ~read:(fun () -> input_char ch)
    ~input:(read ch)
    ~close:(fun () -> close_in ch)

let bzip_open_file file =
  (* workaround to avoid segfault :
   * http://bugs.debian.org/cgi-bin/bugreport.cgi?bug=602170 *)
  let _ = Bz2.version in
  let s = Bytes.create 1 in
  let ch = Bz2.open_in (open_in file) in
  let input_char ch =
    try
      ignore (Bz2.read ch s 0 1) ;
      Bytes.get s 0
    with End_of_file -> raise IO.No_more_input
  in
  let read ch s pos len =
    try Bz2.read ch s pos len with End_of_file -> raise IO.No_more_input
  in
  IO.create_in
    ~read:(fun () -> input_char ch)
    ~input:(fun x -> read ch x)
    ~close:(fun () -> Bz2.close_in ch)

let std_open_file file = IO.input_channel (open_in file)

let open_ch ch = IO.input_channel ch

let close_ch ch = IO.close_in ch

exception File_empty

let open_file file =
  if not (Sys.file_exists file) then fatal "Input file %s does not exist." file
  else if (Unix.stat file).Unix.st_size = 0 then (
    warning "Input file %s is empty" file ;
    raise File_empty)
  else
    let openfun =
      try
        let ch = open_in file in
        let openfun =
          match input_byte ch with
          (* gzip magic is 0x1f 0x8b *)
          | 0x1f -> (
              match input_byte ch with
              | 0x8b -> gzip_open_file
              | _ -> std_open_file)
          (* bz2 magic is "BZh" *)
          | 0x42 -> (
              match input_byte ch with
              | 0x5a -> (
                  match input_byte ch with
                  | 0x68 -> bzip_open_file
                  | _ -> std_open_file)
              | _ -> std_open_file)
          (* xz magic is 0xfd "7zXZ" *)
          | 0xfd -> (
              match input_byte ch with
              | 0x37 -> (
                  match input_byte ch with
                  | 0x7a -> (
                      match input_byte ch with
                      | 0x58 -> (
                          match input_byte ch with
                          | 0x5a -> xz_open_file
                          | _ -> std_open_file)
                      | _ -> std_open_file)
                  | _ -> std_open_file)
              | _ -> std_open_file)
          | _ -> std_open_file
        in
        close_in ch ;
        openfun
      with End_of_file -> std_open_file
    in
    openfun file

let parse_uri s =
  let url = Url.of_string s in
  let path = url.Url.path in
  (url.Url.scheme, (None, None, None, None, path), None)

let guess_format urilist =
  match List.flatten urilist with
  | uri :: _ ->
      let (p, _, _) = parse_uri uri in
      p
  | _ -> fatal "Impossible to guess input format"
OCaml

Innovation. Community. Security.