Source file pipeline.ml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
open Core
open Configuration
open Command_configuration
open Command_input
open Rewriter
open Statistics
open Matchers
open Match
open Language
(** Path of the log file that [log_to_file] and [with_timeout] append to. *)
let verbose_out_file = "/tmp/comby.out"
(** [true] when the [DEBUG_COMBY] environment variable is set, whatever its
    value. Read once, when this module is initialised. *)
let debug = Option.is_some (Sys.getenv "DEBUG_COMBY")
(** [infer_equality_constraints environment] builds implicit equality
    constraints from the variables bound in [environment].

    Every variable named [<id>_<target>_equal] yields
    [Equal (Variable var, Variable target)]. [<id>] is the text before the
    first underscore and [<target>] is everything between that underscore and
    the [_equal] suffix, so a target that itself contains underscores
    (e.g. [1_my_var_equal] gives [my_var]) is kept intact instead of being cut
    at its first underscore. Variables without the suffix, or without an
    [<id>_] prefix in front of the target, contribute nothing.

    Constraints are accumulated by prepending, so they come out in the reverse
    of the order in which [Environment.vars] lists the variables. *)
let infer_equality_constraints environment =
  let equal_suffix = "_equal" in
  Environment.vars environment
  |> List.fold ~init:[] ~f:(fun acc var ->
      let target =
        (* Strip the suffix first, then split on the FIRST underscore only:
           splitting on every underscore would truncate targets such as
           [my_var] to [my]. *)
        Option.bind (String.chop_suffix var ~suffix:equal_suffix) ~f:(fun prefix ->
            String.lsplit2 prefix ~on:'_')
        |> Option.map ~f:snd
      in
      match target with
      | Some target -> Language.Ast.Equal (Variable var, Variable target) :: acc
      | None -> acc)
(** [apply_rule ?substitute_in_place matcher omega rule matches] filters
    [matches] through [rule].

    For each match, [rule] is extended with the constraints produced by
    [infer_equality_constraints] for that match's environment, then applied
    with [Rule.Omega.apply] when [omega] is set and [Rule.Alpha.apply]
    otherwise. A match is kept only when the rule is satisfied and an
    environment is returned; that environment replaces the match's own.

    [substitute_in_place] defaults to [true]. *)
let apply_rule ?(substitute_in_place = true) matcher omega rule matches =
  let keep_if_satisfied ({ environment; _ } as matched) =
    let extended_rule = rule @ infer_equality_constraints environment in
    let apply = if omega then Rule.Omega.apply else Rule.Alpha.apply in
    match apply ~substitute_in_place ~matcher extended_rule environment with
    | true, Some environment -> Some { matched with environment }
    | true, None | false, _ -> None
  in
  List.filter_map matches ~f:keep_if_satisfied
(** [timed_run (module Matcher) ... ~configuration ~source ~specification ()]
    finds every match of the specification's match template in [source],
    filters the matches through the specification's rule and converts their
    offsets.

    - When the specification has a rewrite template it is registered with
      [Matcher.set_rewrite_template] before matching.
    - A missing rule defaults to [[Ast.True]].
    - [omega] (default [false]) selects [Rule.Omega] over [Rule.Alpha] for both
      rule options and rule application.
    - [fast_offset_conversion] (default [false]) is forwarded to
      [Match.convert_offset] as [~fast]. *)
let timed_run
    (module Matcher : Matcher.S)
    ?(fast_offset_conversion = false)
    ?(omega = false)
    ?substitute_in_place
    ~configuration
    ~source
    ~specification:(Specification.{ match_template = template; rule; rewrite_template })
    () =
  Option.iter rewrite_template ~f:(fun rewrite ->
      Matcher.set_rewrite_template rewrite);
  let rule = Option.value rule ~default:[Ast.True] in
  let options = if omega then Rule.Omega.options rule else Rule.Alpha.options rule in
  Matcher.all ~nested:options.nested ~configuration ~template ~source ()
  |> apply_rule ?substitute_in_place (module Matcher) omega rule
  |> List.map ~f:(Match.convert_offset ~fast:fast_offset_conversion ~source)
(** Outcome of running one specification over one source, as produced by
    [process_single_source]. *)
type output =
  | Matches of (Match.t list * int)
  (** Match-only run: the matches and how many there are. *)
  | Replacement of (Replacement.t list * string * int)
  (** Rewrite run: the in-place substitutions, the resulting source text and
      the number of matches that were rewritten (0 when nothing matched, in
      which case the text is the unchanged input). *)
  | Nothing
  (** No result: rewriting returned nothing, or an exception was caught. *)
(** [with_timeout timeout source ~f] runs [f ()] under
    [Statistics.Time.time_out ~after:timeout] and returns its result.

    If [Statistics.Time.Time_out] is raised, the timeout is reported on stderr
    and appended to [verbose_out_file], and the empty list is returned instead.
    [source] is only used to label those messages. *)
let with_timeout timeout source ~f =
  match Statistics.Time.time_out ~after:timeout f () with
  | result -> result
  | exception Statistics.Time.Time_out ->
    Format.eprintf "Timeout for input: %s!@." (show_input_kind source);
    Out_channel.with_file verbose_out_file ~append:true ~f:(fun channel ->
        let report = Format.sprintf "TIMEOUT: %s@." (show_input_kind source) in
        Out_channel.output_lines channel [ report ]);
    []
(** [log_to_file path] appends a "Processing <path>" line to
    [verbose_out_file]. *)
let log_to_file path =
  let line = Format.sprintf "Processing %s%!" path in
  Out_channel.with_file verbose_out_file ~append:true ~f:(fun channel ->
      Out_channel.output_lines channel [ line ])
(** [process_single_source matcher ... configuration source specification]
    runs one specification over one source and reports the outcome.

    - [source] is either literal text ([String]) or a [Path] whose contents are
      read here; with [verbose] set, each path is logged via [log_to_file]
      before it is read.
    - Matching runs under [with_timeout timeout] ([timeout] defaults to [3]);
      a timeout yields an empty match list.
    - Without a rewrite template the result is [Matches]. With one, the result
      is [Replacement]: the unchanged input and a count of 0 when nothing
      matched, otherwise whatever [Rewrite.all] produces ([Nothing] if it
      returns [None]).
    - Any exception raised along the way is caught and turned into [Nothing];
      it is printed to stderr only when [debug] is set.

    [sequential], [omega], [fast_offset_conversion], [substitute_in_place] and
    [verbose] all default to [false]. *)
let process_single_source
    matcher
    ?(sequential = false)
    ?(omega = false)
    ?(fast_offset_conversion = false)
    ?(substitute_in_place = false)
    ?(verbose = false)
    ?(timeout = 3)
    ?metasyntax
    configuration
    source
    (Specification.{ rewrite_template; _ } as specification)
  =
  let run () =
    let input_text =
      match source with
      | String text -> text
      | Path path ->
        if verbose then log_to_file path;
        In_channel.read_all path
    in
    let find_matches () =
      timed_run
        matcher
        ~substitute_in_place
        ~omega
        ~fast_offset_conversion
        ~configuration
        ~specification
        ~source:input_text
        ()
    in
    let matches = with_timeout timeout source ~f:find_matches in
    match rewrite_template, matches with
    | None, _ -> Matches (matches, List.length matches)
    | Some _, [] ->
      (* Nothing matched: hand back the input untouched. *)
      Replacement ([], input_text, 0)
    | Some rewrite_template, _ :: _ ->
      (match Rewrite.all ~source:input_text ?metasyntax ~sequential ~rewrite_template matches with
       | None -> Nothing
       | Some { rewritten_source; in_place_substitutions } ->
         Replacement (in_place_substitutions, rewritten_source, List.length matches))
  in
  try run () with
  | exn ->
    if debug then Format.eprintf "Big error: %s@." (Exn.to_string exn);
    Nothing
(** [output_result output_printer source_path source_content result] hands
    [result] to [output_printer].

    - [Nothing] prints nothing.
    - [Matches] is printed as [Printer.Matches].
    - [Replacement] is printed as [Printer.Replacements], together with the
      original text: [source_content] itself when it is a [String], or the
      contents of the file when it is a [Path] (the file is read here). *)
let output_result output_printer source_path source_content = function
  | Nothing -> ()
  | Matches (matches, _) ->
    output_printer (Printer.Matches { source_path; matches })
  | Replacement (replacements, result, _) ->
    let original_text =
      match source_content with
      | String content -> content
      | Path path -> In_channel.read_all path
    in
    output_printer
      (Printer.Replacements
         { source_path; replacements; result; source_content = original_text })
(** [run_on_specifications specifications output_printer process input output_file]
    applies [process] to [input] once per specification, in order, prints the
    final result and returns the total number of matches.

    Specifications are chained: when the previous step produced a
    [Replacement], its rewritten text becomes the input of the next step;
    otherwise the original [input] is used again. Only the result of the last
    specification is passed to [output_result], while the returned count sums
    the matches of every step. *)
let run_on_specifications specifications output_printer process (input : single_source) output_file =
  let step (previous, total) specification =
    let current_input =
      match previous with
      | Nothing | Matches _ -> input
      | Replacement (_, rewritten, _) -> String rewritten
    in
    match process current_input specification with
    | Nothing -> Nothing, total
    | (Matches (_, found) | Replacement (_, _, found)) as outcome ->
      outcome, total + found
  in
  let result, count = List.fold specifications ~init:(Nothing, 0) ~f:step in
  output_result output_printer output_file input result;
  count
(** [run_on_specifications_for_interactive specifications process input]
    chains the specifications over [input] like [run_on_specifications], but
    prints nothing and returns [(rewritten_text option, count)].

    A [Replacement] with zero matches is treated as [Nothing]. The text is
    [Some _] only when the last specification ended in a [Replacement]; in
    every other case the result is [(None, 0)], whatever was counted before. *)
let run_on_specifications_for_interactive specifications process (input : single_source) =
  let step (previous, total) specification =
    let current_input =
      match previous with
      | Nothing | Matches _ -> input
      | Replacement (_, rewritten, _) -> String rewritten
    in
    match process current_input specification with
    | Nothing | Replacement (_, _, 0) -> Nothing, total
    | (Matches (_, found) | Replacement (_, _, found)) as outcome ->
      outcome, total + found
  in
  match List.fold specifications ~init:(Nothing, 0) ~f:step with
  | Replacement (_, content, _), count -> Some content, count
  | (Nothing | Matches _), _ -> None, 0
(** [write_statistics number_of_matches sources start_time] stops the timer
    started at [start_time] and prints run statistics to stderr as
    pretty-printed JSON: number of files, lines of code, number of matches and
    total time.

    Lines of code are counted with [String.split_lines] for a [`String] source
    and with [Fold.loc_paths] / [Fold.loc_zip] for [`Paths] / [`Zip].

    @raise Failure for any other kind of source. *)
let write_statistics number_of_matches sources start_time =
  let total_time = Statistics.Time.stop start_time in
  let lines_of_code, number_of_files =
    match sources with
    | `String source -> List.length (String.split_lines source), 1
    | `Paths paths -> Fold.loc_paths paths, List.length paths
    | `Zip (zip_file, paths) -> Fold.loc_zip zip_file paths, List.length paths
    | _ -> failwith "No single path handled here"
  in
  { number_of_files; lines_of_code; number_of_matches; total_time }
  |> Statistics.to_yojson
  |> Yojson.Safe.pretty_to_string
  |> Format.eprintf "%s@."
(** [run_batch ~f sources compute_mode bound_count] dispatches [sources] to the
    processing backend chosen by [compute_mode] and returns that backend's
    result.

    [f] is passed to the backend unchanged. The two parallel modes also
    forward their worker count. *)
let run_batch ~f sources compute_mode bound_count =
  match compute_mode with
  | `Sequential -> Sequential.process ~f bound_count sources
  | `Parany workers -> Parallel_parany.process ~f workers bound_count sources
  | `Hack_parallel workers -> Parallel_hack.process ~f workers bound_count sources
(** [run_interactive ...] computes the rewrites for every path in [sources]
    and hands them to [Interactive.run] for review, returning the count
    reported by the processing backend.

    Each path is processed with [run_on_specifications_for_interactive] on the
    backend selected by [compute_mode]. The editor and the default-accept flag
    come from [interactive_review].

    @raise Failure when [sources] is not [`Paths]. *)
let run_interactive
    specifications
    sequential
    matcher
    omega
    fast_offset_conversion
    substitute_in_place
    match_configuration
    verbose
    timeout
    sources
    compute_mode
    interactive_review =
  let paths =
    match sources with
    | `Paths paths -> paths
    | _ -> failwith "Cannot run interactive mode with this input source, must be file paths."
  in
  (* Runs a single specification over a single input. *)
  let rewrite_source (input : single_source) specification =
    process_single_source
      matcher
      ~sequential
      ~omega
      ~fast_offset_conversion
      ~substitute_in_place
      ~verbose
      ~timeout
      match_configuration
      input
      specification
  in
  let with_rewrites ~input ~path:_ =
    run_on_specifications_for_interactive specifications rewrite_source input
  in
  let rewrites, count =
    match compute_mode with
    | `Sequential ->
      Sequential.process_interactive ~f:with_rewrites paths
    | `Parany workers ->
      Parallel_parany.process_interactive ~f:with_rewrites paths workers
    | `Hack_parallel workers ->
      Parallel_hack.process_interactive ~f:with_rewrites paths workers
  in
  let { editor; default_is_accept } = interactive_review in
  Interactive.run editor default_is_accept count rewrites;
  count
(** [run configuration] is the top-level driver: it runs every specification
    over the configured sources and, when [dump_statistics] is set, prints
    statistics afterwards.

    - With an interactive review configured, work is delegated to
      [run_interactive].
    - Otherwise a [`String] source is processed directly (with no output
      path) and any batch input goes through [run_batch].

    Rewriting is sequential exactly when [compute_mode] is [`Sequential].
    Matching always uses a [Fuzzy] configuration built from the run options. *)
let run
    { matcher
    ; sources
    ; specifications
    ; run_options =
        { verbose
        ; match_timeout = timeout
        ; dump_statistics
        ; substitute_in_place
        ; disable_substring_matching
        ; omega
        ; fast_offset_conversion
        ; match_newline_toplevel
        ; bound_count
        ; compute_mode
        }
    ; output_printer
    ; interactive_review
    ; extension = _
    }
  =
  let sequential =
    match compute_mode with
    | `Sequential -> true
    | _ -> false
  in
  let match_configuration =
    Configuration.create ~disable_substring_matching ~match_kind:Fuzzy ~match_newline_toplevel ()
  in
  let start_time = Statistics.Time.start () in
  (* Runs a single specification over a single input. *)
  let process input specification =
    process_single_source
      matcher
      ~sequential
      ~omega
      ~fast_offset_conversion
      ~substitute_in_place
      ~verbose
      ~timeout
      match_configuration
      input
      specification
  in
  let per_unit ~(input : single_source) ~output_path =
    run_on_specifications specifications output_printer process input output_path
  in
  let count =
    match interactive_review, sources with
    | Some interactive_review, _ ->
      run_interactive
        specifications
        sequential
        matcher
        omega
        fast_offset_conversion
        substitute_in_place
        match_configuration
        verbose
        timeout
        sources
        compute_mode
        interactive_review
    | None, `String source ->
      per_unit ~input:(String source) ~output_path:None
    | None, (#batch_input as sources) ->
      run_batch ~f:per_unit sources compute_mode bound_count
  in
  if dump_statistics then write_statistics count sources start_time
(** [execute matcher ?substitute_in_place ?timeout ?metasyntax ?configuration source specification]
    runs a single specification over a single source through
    [process_single_source].

    It always runs with sequential rewriting and with [omega], fast offset
    conversion and verbose logging switched off. [configuration] defaults to
    [Matchers.Configuration.create ()]; the other optional arguments are
    forwarded as given. *)
let execute
    matcher
    ?substitute_in_place
    ?timeout
    ?metasyntax
    ?(configuration = Matchers.Configuration.create ())
    source
    specification =
  process_single_source matcher
    (* Settings fixed by this entry point. *)
    ~sequential:true ~omega:false ~fast_offset_conversion:false ~verbose:false
    (* Settings chosen by the caller. *)
    ?substitute_in_place ?timeout ?metasyntax
    configuration source specification