Source file ocsigen_multipart.ml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
open Lwt.Infix
module S = Ocsigen_lib.Netstring_pcre
module Pcre = Re.Pcre
let section = Lwt_log.Section.make "ocsigen:server:multipart"
exception Multipart_error of string
exception Ocsigen_upload_forbidden
let match_end result = snd (Pcre.get_substring_ofs result 0)
let cr_or_lf_re = S.regexp "[\013\n]"
let =
S.regexp
"([^ \t\r\n:]+):[ \t]*((.*[^ \t\r\n])?([ \t\r]*\n[ \t](.*[^ \t\r\n])?)*)[ \t\r]*\n"
let = S.regexp "([^ \t\r\n:]+):([ \t]*.*\n([ \t].*\n)*)"
let empty_line_re = S.regexp "\013?\n"
let = S.regexp "\n\013?\n"
let ?(downcase = true) ?(unfold = true) ?(strip = false) parstr
~start_pos ~end_pos
=
let =
if unfold || strip then header_stripped_re else header_unstripped_re
in
let rec i l =
match S.string_match header_re parstr i with
| Some r ->
let i' = match_end r in
if i' > end_pos then raise (Multipart_error "Mimestring.scan_header");
let name =
if downcase
then String.lowercase_ascii (S.matched_group r 1 parstr)
else S.matched_group r 1 parstr
in
let value_with_crlf = S.matched_group r 2 parstr in
let value =
if unfold
then S.global_replace cr_or_lf_re "" value_with_crlf
else value_with_crlf
in
parse_header i' ((name, value) :: l)
| None -> (
match S.string_match empty_line_re parstr i with
| Some r' -> List.rev l, match_end r'
| None -> raise (Multipart_error "Mimestring.scan_header"))
in
parse_header start_pos []
let ?downcase ?unfold ?strip s =
let rec s =
Lwt.catch
(fun () ->
let b = Ocsigen_stream.current_buffer s in
match S.string_match empty_line_re b 0 with
| Some r -> Lwt.return (s, match_end r)
| None ->
Lwt.return
(s, match_end (snd (S.search_forward end_of_header_re b 0))))
(function
| Not_found -> (
Ocsigen_stream.enlarge_stream s >>= function
| Ocsigen_stream.Finished _ ->
Lwt.fail Ocsigen_stream.Stream_too_small
| Ocsigen_stream.Cont _ as s -> find_end_of_header s)
| e -> Lwt.fail e)
in
find_end_of_header s >>= fun (s, end_pos) ->
let b = Ocsigen_stream.current_buffer s in
let h, _ = scan_header ?downcase ?unfold ?strip b ~start_pos:0 ~end_pos in
Ocsigen_stream.skip s (Int64.of_int end_pos) >>= fun s -> Lwt.return (s, h)
let lf_re = S.regexp "[\n]"
let rec search_window s re start =
try
Lwt.return
(s, snd (S.search_forward re (Ocsigen_stream.current_buffer s) start))
with Not_found -> (
Ocsigen_stream.enlarge_stream s >>= function
| Ocsigen_stream.Finished _ -> Lwt.fail Ocsigen_stream.Stream_too_small
| Ocsigen_stream.Cont _ as s -> search_window s re start)
let search_end_of_line s k =
Lwt.catch
(fun () ->
search_window s lf_re k >>= fun (s, x) -> Lwt.return (s, match_end x))
(function
| Not_found ->
Lwt.fail
(Multipart_error
"read_multipart_body: MIME boundary without line end")
| e -> Lwt.fail e)
let search_first_boundary ~boundary s =
let re = S.regexp ("\n--" ^ Pcre.quote boundary) in
search_window s re 0 >>= fun (s, x) -> Lwt.return (s, match_end x)
let check_beginning_is_boundary ~boundary s =
let del = "--" ^ boundary in
let ldel = String.length del in
Ocsigen_stream.stream_want s (ldel + 2) >>= function
| Ocsigen_stream.Finished _ as str2 -> Lwt.return (str2, false, false)
| Ocsigen_stream.Cont (ss, _f) as str2 ->
let long = String.length ss in
let isdelim = long >= ldel && String.sub ss 0 ldel = del in
let islast = isdelim && String.sub ss ldel 2 = "--" in
Lwt.return (str2, isdelim, islast)
let rec parse_parts ~boundary ~decode_part s uses_crlf =
let delimiter = (if uses_crlf then "\r" else "") ^ "\n--" ^ boundary in
Ocsigen_stream.substream delimiter s >>= fun a ->
decode_part a >>= fun (y, s) ->
let l_delimiter = String.length delimiter in
Ocsigen_stream.next s >>= fun s ->
Ocsigen_stream.stream_want s (l_delimiter + 2) >>= fun s ->
let last_part =
match s with
| Ocsigen_stream.Finished _ -> false
| Ocsigen_stream.Cont (ss, _f) ->
let long = String.length ss in
long >= l_delimiter + 2
&& ss.[l_delimiter] = '-'
&& ss.[l_delimiter + 1] = '-'
in
if last_part
then Lwt.return [y]
else
search_end_of_line s 2 >>= fun (s, k) ->
Ocsigen_stream.skip s (Int64.of_int k) >>= fun s ->
parse_parts ~boundary ~decode_part s uses_crlf >>= fun l ->
Lwt.return (y :: l)
let read_multipart_body ~boundary ~decode_part s =
check_beginning_is_boundary ~boundary s >>= fun (s, b, islast) ->
if islast
then Lwt.return []
else if b
then
search_end_of_line s 0 >>= fun (s, k_eol) ->
let uses_crlf = (Ocsigen_stream.current_buffer s).[k_eol - 2] = '\r' in
Ocsigen_stream.skip s (Int64.of_int k_eol) >>= fun s ->
parse_parts ~boundary ~decode_part s uses_crlf
else
Lwt.catch
(fun () ->
search_first_boundary ~boundary s >>= fun (s, k_eob) ->
search_end_of_line s k_eob >>= fun (s, k_eol) ->
let uses_crlf = (Ocsigen_stream.current_buffer s).[k_eol - 2] = '\r' in
Ocsigen_stream.skip s (Int64.of_int k_eol) >>= fun s ->
parse_parts ~boundary ~decode_part s uses_crlf)
(function
| Not_found ->
Lwt.return []
| e -> Lwt.fail e)
let empty_stream =
Ocsigen_stream.get (Ocsigen_stream.make (fun () -> Ocsigen_stream.empty None))
let decode_part ~max_size ~create ~add ~stop stream =
read_header stream >>= fun (s, ) ->
let p = create header in
let rec while_stream size = function
| Ocsigen_stream.Finished None -> Lwt.return (size, empty_stream)
| Ocsigen_stream.Finished (Some ss) -> Lwt.return (size, ss)
| Ocsigen_stream.Cont (stri, f) ->
let long = String.length stri in
let size2 = Int64.add size (Int64.of_int long) in
if match max_size with
| None -> false
| Some m -> Int64.compare size2 m > 0
then Lwt.fail Ocsigen_lib.Ocsigen_Request_too_long
else if stri = ""
then Ocsigen_stream.next f >>= while_stream size
else
add p stri >>= fun () -> Ocsigen_stream.next f >>= while_stream size2
in
Lwt.catch
(fun () ->
while_stream Int64.zero s >>= fun (size, s) ->
stop size p >>= fun r -> Lwt.return (r, s))
(fun error -> stop Int64.zero p >>= fun _ -> Lwt.fail error)
let scan_multipart_body_from_stream ?max_size ~boundary ~create ~add ~stop s =
let decode_part = decode_part ~max_size ~create ~add ~stop in
Lwt.catch
(fun () ->
Ocsigen_stream.next s >>= fun s ->
read_multipart_body ~boundary ~decode_part s >>= fun _ -> Lwt.return ())
(function
| Ocsigen_stream.Stream_too_small ->
Lwt.fail Ocsigen_lib.Ocsigen_Bad_Request
| e -> Lwt.fail e)
let get_boundary ctparams = List.assoc "boundary" ctparams
let counter =
let c = ref (Random.int 1000000) in
fun () ->
c := !c + 1;
!c
let field field content_disp =
let _, res =
S.search_forward (S.regexp (field ^ "=.([^\"]*).;?")) content_disp 0
in
S.matched_group res 1 content_disp
let parse_content_type s =
match Ocsigen_lib.String.split ';' s with
| [] -> None
| a :: l -> (
try
let typ, subtype = Ocsigen_lib.String.sep '/' a in
let params =
try List.map (Ocsigen_lib.String.sep '=') l with Not_found -> []
in
Some ((typ, subtype), params)
with Not_found -> None)
type content_type = (string * string) * (string * string) list
type file_info =
{ tmp_filename : string
; filesize : int64
; raw_original_filename : string
; file_content_type : ((string * string) * (string * string) list) option }
type post_data = (string * string) list * (string * file_info) list
let post_params_form_urlencoded body_gen _ _ =
Lwt.catch
(fun () ->
let body = Ocsigen_stream.get body_gen in
Ocsigen_stream.string_of_stream
(Ocsigen_config.get_maxrequestbodysizeinmemory ())
body
>>= fun r ->
let r = Ocsigen_lib.Url.fixup_url_string r in
let l =
Uri.query_of_encoded r
|> List.map (fun (s, l) -> List.map (fun v -> s, v) l)
|> List.concat
in
Lwt.return (l, []))
(function
| Ocsigen_stream.String_too_large ->
Lwt.fail Ocsigen_lib.Input_is_too_large
| e -> Lwt.fail e)
let post_params_multipart_form_data ctparams body_gen upload_dir max_size =
let body = Ocsigen_stream.get body_gen
and boundary = get_boundary ctparams
and params = ref []
and files = ref []
and filenames = ref [] in
let rec add p s =
match p with
| _, `No_file to_buf -> Buffer.add_string to_buf s; Lwt.return ()
| _, `Some_file (_, _, wh, _) ->
let len = String.length s in
let r = Unix.write_substring wh s 0 len in
if r < len
then
add p (String.sub s r (len - r))
else Lwt.pause ()
in
let create hs =
let content_type =
try
let ct = List.assoc "content-type" hs in
parse_content_type ct
with _ -> None
in
let cd = List.assoc "content-disposition" hs in
let p_name = field "name" cd in
try
let store = field "filename" cd in
match upload_dir with
| Some dname ->
let fname =
Printf.sprintf "%s/%f-%d" dname (Unix.gettimeofday ()) (counter ())
in
let fd =
Unix.openfile fname
[Unix.O_CREAT; Unix.O_TRUNC; Unix.O_WRONLY; Unix.O_NONBLOCK]
0o666
in
Lwt_log.ign_info ~section ("Upload file opened: " ^ fname);
filenames := fname :: !filenames;
p_name, `Some_file (fname, store, fd, content_type)
| None -> raise Ocsigen_upload_forbidden
with Not_found -> p_name, `No_file (Buffer.create 1024)
and stop filesize = function
| p_name, `No_file to_buf ->
params := !params @ [p_name, Buffer.contents to_buf];
Lwt.return ()
| ( p_name
, `Some_file (tmp_filename, raw_original_filename, wh, file_content_type)
) ->
let file_info =
{tmp_filename; filesize; raw_original_filename; file_content_type}
in
files := !files @ [p_name, file_info];
Unix.close wh;
Lwt.return ()
in
scan_multipart_body_from_stream ?max_size ~boundary ~create ~add ~stop body
>>= fun () ->
Ocsigen_stream.consume body_gen >>= fun () -> Lwt.return (!params, !files)
let post_params ~content_type body_gen =
let (ct, cst), ctparams = content_type in
match String.lowercase_ascii ct, String.lowercase_ascii cst with
| "application", "x-www-form-urlencoded" ->
Some
(body_gen |> Cohttp_lwt.Body.to_stream |> Ocsigen_stream.of_lwt_stream
|> post_params_form_urlencoded)
| "multipart", "form-data" ->
Some
(body_gen |> Cohttp_lwt.Body.to_stream |> Ocsigen_stream.of_lwt_stream
|> post_params_multipart_form_data ctparams)
| _ -> None