aboutsummaryrefslogtreecommitdiffstats
path: root/backend/Duplicateaux.ml
blob: 54929251e2555c9a6ce35c35a253230777fd6445 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
open RTL
open Maps
open Camlcoq

(* TTL : IR emphasizing the preferred next node *)
module TTL = struct
  type instruction =
  | Tleaf of RTL.instruction
  | Tnext of node * RTL.instruction

  type code = instruction PTree.t
end;;

open TTL

(** RTL to TTL *)

let get_some = function
| None -> failwith "Did not get some"
| Some thing -> thing

let bfs code entrypoint =
  let visited = ref (PTree.map (fun n i -> false) code)
  and bfs_list = ref []
  and to_visit = Queue.create ()
  and node = ref entrypoint
  in begin
    Queue.add entrypoint to_visit;
    while not (Queue.is_empty to_visit) do
      node := Queue.pop to_visit;
      if not (get_some @@ PTree.get !node !visited) then begin
        visited := PTree.set !node true !visited;
        match PTree.get !node code with
        | None -> failwith "No such node"
        | Some i ->
            bfs_list := !bfs_list @ [!node];
            match i with
            | Icall(_, _, _, _, n) -> Queue.add n to_visit
            | Ibuiltin(_, _, _, n) -> Queue.add n to_visit
            | Ijumptable(_, ln) -> List.iter (fun n -> Queue.add n to_visit) ln
            | Itailcall _ | Ireturn _ -> ()
            | Icond (_, _, n1, n2) -> Queue.add n1 to_visit; Queue.add n2 to_visit
            | Inop n | Iop (_, _, _, n) | Iload (_, _, _, _, _, n) | Istore (_, _, _, _, n) -> Queue.add n to_visit
      end
    done;
    !bfs_list
  end

let get_predecessors_rtl code =
  let preds = ref (PTree.map (fun n i -> []) code) in
  let process_inst (node, i) =
    let succ = match i with
      | Inop n | Iop (_,_,_,n) | Iload (_, _,_,_,_,n) | Istore (_,_,_,_,n)
      | Icall (_,_,_,_,n) | Ibuiltin (_, _, _, n) -> [n]
      | Icond (_,_,n1,n2) -> [n1;n2]
      | Ijumptable (_,ln) -> ln
      | Itailcall _ | Ireturn _ -> []
    in List.iter (fun s -> preds := PTree.set s (node::(get_some @@ PTree.get s !preds)) !preds) succ
  in begin
    List.iter process_inst (PTree.elements code);
    !preds
  end

module PInt = struct
  type t = P.t
  let compare x y = compare (P.to_int x) (P.to_int y)
end

module PSet = Set.Make(PInt)

let print_intlist l =
  let rec f = function
  | [] -> ()
  | n::ln -> (Printf.printf "%d " (P.to_int n); f ln)
  in begin
    Printf.printf "[";
    f l;
    Printf.printf "]"
  end

let print_intset s =
  let seq = PSet.to_seq s
  in begin
    Printf.printf "{";
    Seq.iter (fun n ->
      Printf.printf "%d " (P.to_int n)
    ) seq;
    Printf.printf "}"
  end

(* FIXME - dominators not working well because the order of dataflow update isn't right *)
  (*
let get_dominators code entrypoint =
  let bfs_order = bfs code entrypoint
  and predecessors = get_predecessors_rtl code
  in let doms = ref (PTree.map (fun n i -> PSet.of_list bfs_order) code)
  in begin
    Printf.printf "BFS: ";
    print_intlist bfs_order;
    Printf.printf "\n";
    List.iter (fun n ->
      let preds = get_some @@ PTree.get n predecessors
      and single = PSet.singleton n
      in match preds with
      | [] -> doms := PTree.set n single !doms
      | p::lp ->
          let set_p = get_some @@ PTree.get p !doms
          and set_lp = List.map (fun p -> get_some @@ PTree.get p !doms) lp
          in let inter = List.fold_left PSet.inter set_p set_lp
          in let union = PSet.union inter single
          in begin
            Printf.printf "----------------------------------------\n";
            Printf.printf "n = %d\n" (P.to_int n);
            Printf.printf "set_p = "; print_intset set_p; Printf.printf "\n";
            Printf.printf "set_lp = ["; List.iter (fun s -> print_intset s; Printf.printf ", ") set_lp; Printf.printf "]\n";
            Printf.printf "=> inter = "; print_intset inter; Printf.printf "\n";
            Printf.printf "=> union = "; print_intset union; Printf.printf "\n";
            doms := PTree.set n union !doms
          end
    ) bfs_order;
    !doms
  end
*)

let print_dominators dominators =
  let domlist = PTree.elements dominators
  in begin
    Printf.printf "{\n";
    List.iter (fun (n, doms) ->
      Printf.printf "\t";
      Printf.printf "%d:" (P.to_int n);
      print_intset doms;
      Printf.printf "\n"
    ) domlist
  end

type vstate = Unvisited | Processed | Visited

(** Getting loop branches with a DFS visit :
  * Each node is either Unvisited, Visited, or Processed
  * pre-order: node becomes Processed
  * post-order: node becomes Visited
  *
  * If we come accross an edge to a Processed node, it's a loop!
  *)
let get_loop_headers code entrypoint =
  let visited = ref (PTree.map (fun n i -> Unvisited) code)
  and is_loop_header = ref (PTree.map (fun n i -> false) code)
  in let rec dfs_visit code = function
  | [] -> ()
  | node :: ln ->
      match (get_some @@ PTree.get node !visited) with
      | Visited -> ()
      | Processed -> begin
          is_loop_header := PTree.set node true !is_loop_header;
          visited := PTree.set node Visited !visited
        end
      | Unvisited -> begin
          visited := PTree.set node Processed !visited;
          match PTree.get node code with
          | None -> failwith "No such node"
          | Some i -> let next_visits = (match i with
            | Icall (_, _, _, _, n) | Ibuiltin (_, _, _, n) | Inop n | Iop (_, _, _, n)
            | Iload (_, _, _, _, _, n) | Istore (_, _, _, _, n) -> [n]
            | Icond (_, _, n1, n2) -> [n1; n2]
            | Itailcall _ | Ireturn _ -> []
            | Ijumptable (_, ln) -> ln
            ) in dfs_visit code next_visits;
          visited := PTree.set node Visited !visited;
          dfs_visit code ln
        end
  in begin
    dfs_visit code [entrypoint];
    !is_loop_header
  end

let ptree_printbool pt =
  let elements = PTree.elements pt
  in begin
    Printf.printf "[";
    List.iter (fun (n, b) ->
      if b then Printf.printf "%d, " (P.to_int n) else ()
    ) elements;
    Printf.printf "]"
  end

(* Looks ahead (until a branch) to see if a node further down verifies
 * the given predicate *)
let rec look_ahead code node is_loop_header predicate =
  if (predicate node) then true
  else match (get_some @@ PTree.get node code) with
    | Ireturn _ | Itailcall _ | Icond _ | Ijumptable _ -> false
    | Inop n | Iop (_, _, _, n) | Iload (_, _, _, _, _, n)
    | Istore (_, _, _, _, n) | Icall (_, _, _, _, n)
    | Ibuiltin (_, _, _, n) ->
      if (predicate n) then true
      else (
        if (get_some @@ PTree.get n is_loop_header) then false
        else look_ahead code n is_loop_header predicate
      )

exception HeuristicSucceeded

let do_call_heuristic code ifso ifnot is_loop_header preferred =
  let predicate n = (function
  | Icall _ -> true
  | _ -> false) @@ get_some @@ PTree.get n code
  in if (look_ahead code ifso is_loop_header predicate) then
    (preferred := false; raise HeuristicSucceeded)
  else if (look_ahead code ifnot is_loop_header predicate) then
    (preferred := true; raise HeuristicSucceeded)
  else ()

let do_opcode_heuristic code cond ifso ifnot preferred = DuplicateOpcodeHeuristic.opcode_heuristic code cond ifso ifnot preferred

let do_return_heuristic code ifso ifnot is_loop_header preferred =
  let predicate n = (function
  | Ireturn _ -> true
  | _ -> false) @@ get_some @@ PTree.get n code
  in if (look_ahead code ifso is_loop_header predicate) then
    (preferred := false; raise HeuristicSucceeded)
  else if (look_ahead code ifnot is_loop_header predicate) then
    (preferred := true; raise HeuristicSucceeded)
  else ()

let do_store_heuristic code ifso ifnot is_loop_header preferred =
  let predicate n = (function
  | Istore _ -> true
  | _ -> false) @@ get_some @@ PTree.get n code
  in if (look_ahead code ifso is_loop_header predicate) then
    (preferred := false; raise HeuristicSucceeded)
  else if (look_ahead code ifnot is_loop_header predicate) then
    (preferred := true; raise HeuristicSucceeded)
  else ()

let do_loop_heuristic code ifso ifnot is_loop_header preferred =
  let predicate n = get_some @@ PTree.get n is_loop_header
  in if (look_ahead code ifso is_loop_header predicate) then
    (preferred := true; raise HeuristicSucceeded)
  else if (look_ahead code ifnot is_loop_header predicate) then
    (preferred := false; raise HeuristicSucceeded)
  else ()

let get_directions code entrypoint =
  let bfs_order = bfs code entrypoint
  and is_loop_header = get_loop_headers code entrypoint
  and directions = ref (PTree.map (fun n i -> false) code) (* false <=> fallthru *)
  in begin
    Printf.printf "Loop headers: ";
    ptree_printbool is_loop_header;
    Printf.printf "\n";
    List.iter (fun n ->
      match (get_some @@ PTree.get n code) with
      | Icond (cond, lr, ifso, ifnot) ->
          Printf.printf "Analyzing %d.." (P.to_int n);
          let preferred = ref false
          in (try
            Printf.printf " call..";
            do_call_heuristic code ifso ifnot is_loop_header preferred;
            Printf.printf " opcode..";
            do_opcode_heuristic code cond ifso ifnot preferred;
            Printf.printf " return..";
            do_return_heuristic code ifso ifnot is_loop_header preferred;
            Printf.printf " store..";
            do_store_heuristic code ifso ifnot is_loop_header preferred;
            Printf.printf " loop..";
            do_loop_heuristic code ifso ifnot is_loop_header preferred;
            Printf.printf "Random choice for %d\n" (P.to_int n);
            preferred := Random.bool ()
            with HeuristicSucceeded | DuplicateOpcodeHeuristic.HeuristicSucceeded
              -> Printf.printf " %s\n" (match !preferred with true -> "BRANCH"
                                        | false -> "FALLTHROUGH")
          ); directions := PTree.set n !preferred !directions
      | _ -> ()
    ) bfs_order;
    !directions
  end

let to_ttl_inst direction = function
| Ireturn o -> Tleaf (Ireturn o)
| Inop n -> Tnext (n, Inop n)
| Iop (op, lr, r, n) -> Tnext (n, Iop(op, lr, r, n))
| Iload (tm, m, a, lr, r, n) -> Tnext (n, Iload(tm, m, a, lr, r, n))
| Istore (m, a, lr, r, n) -> Tnext (n, Istore(m, a, lr, r, n))
| Icall (s, ri, lr, r, n) -> Tleaf (Icall(s, ri, lr, r, n))
| Itailcall (s, ri, lr) -> Tleaf (Itailcall(s, ri, lr))
| Ibuiltin (ef, lbr, br, n) -> Tleaf (Ibuiltin(ef, lbr, br, n))
| Icond (cond, lr, n, n') -> (match direction with
    | false -> Tnext (n', Icond(cond, lr, n, n'))
    | true -> Tnext (n, Icond(cond, lr, n, n')))
| Ijumptable (r, ln) -> Tleaf (Ijumptable(r, ln))

let rec to_ttl_code_rec directions = function
| [] -> PTree.empty
| m::lm -> let (n, i) = m
    in let direction = get_some @@ PTree.get n directions
    in PTree.set n (to_ttl_inst direction i) (to_ttl_code_rec directions lm)

let to_ttl_code code entrypoint =
  let directions = get_directions code entrypoint
  in begin
    Printf.printf "Ifso directions: ";
    ptree_printbool directions;
    Printf.printf "\n";
    Random.init(0); (* using same seed to make it deterministic *)
    to_ttl_code_rec directions (PTree.elements code)
  end

(** Trace selection on TTL *)

let rec exists_false_rec = function
  | [] -> false
  | m::lm -> let (_, b) = m in if b then exists_false_rec lm else true

let exists_false boolmap = exists_false_rec (PTree.elements boolmap)

(* DFS on TTL to guide the exploration *)
let dfs code entrypoint =
  let visited = ref (PTree.map (fun n i -> false) code) in
  let rec dfs_list code = function
  | [] -> []
  | node :: ln ->
      let node_dfs =
        if not (get_some @@ PTree.get node !visited) then begin
          visited := PTree.set node true !visited;
          match PTree.get node code with
          | None -> failwith "No such node"
          | Some ti -> [node] @ match ti with
              | Tleaf i -> (match i with
                  | Icall(_, _, _, _, n) -> dfs_list code [n]
                  | Ibuiltin(_, _, _, n) -> dfs_list code [n]
                  | Ijumptable(_, ln) -> dfs_list code ln
                  | Itailcall _ | Ireturn _ -> [] 
                  | _ -> failwith "Tleaf case not handled in dfs" )
              | Tnext (n,i) -> (dfs_list code [n]) @ match i with
                  | Icond (_, _, n1, n2) -> dfs_list code [n1; n2]
                  | Inop _ | Iop _ | Iload _ | Istore _ -> []
                  | _ -> failwith "Tnext case not handled in dfs"
          end
        else []
      in node_dfs @ (dfs_list code ln)
  in dfs_list code [entrypoint]

let ptree_get_some n ptree = get_some @@ PTree.get n ptree

let get_predecessors_ttl code =
  let preds = ref (PTree.map (fun n i -> []) code) in
  let process_inst (node, ti) = match ti with
  | Tleaf _ -> ()
  | Tnext (_, i) -> let succ = match i with
      | Inop n | Iop (_,_,_,n) | Iload (_, _,_,_,_,n) | Istore (_,_,_,_,n)
      | Icall (_,_,_,_,n) | Ibuiltin (_, _, _, n) -> [n]
      | Icond (_,_,n1,n2) -> [n1;n2]
      | Ijumptable (_,ln) -> ln
      | _ -> []
      in List.iter (fun s -> preds := PTree.set s (node::(get_some @@ PTree.get s !preds)) !preds) succ
  in begin
    List.iter process_inst (PTree.elements code);
    !preds
  end

let rtl_proj code = PTree.map (fun n ti -> match ti with Tleaf i | Tnext(_, i) -> i) code

let rec select_unvisited_node is_visited = function
| [] -> failwith "Empty list"
| n :: ln -> if not (ptree_get_some n is_visited) then n else select_unvisited_node is_visited ln

let best_successor_of node code is_visited =
  match (PTree.get node code) with
  | None -> failwith "No such node in the code"
  | Some ti -> match ti with
      | Tleaf _ -> None
      | Tnext (n,_) -> if not (ptree_get_some n is_visited) then Some n
                       else None

let best_predecessor_of node predecessors order is_visited =
  match (PTree.get node predecessors) with
  | None -> failwith "No predecessor list found"
  | Some lp -> try Some (List.find (fun n -> (List.mem n lp) && (not (ptree_get_some n is_visited))) order)
               with Not_found -> None

(* Algorithm mostly inspired from Chang and Hwu 1988
 * "Trace Selection for Compiling Large C Application Programs to Microcode" *)
let select_traces code entrypoint =
  let order = dfs code entrypoint in
  let predecessors = get_predecessors_ttl code in
  let traces = ref [] in
  let is_visited = ref (PTree.map (fun n i -> false) code) in begin (* mark all nodes visited *)
    while exists_false !is_visited do (* while (there are unvisited nodes) *)
      let seed = select_unvisited_node !is_visited order in
      let trace = ref [seed] in
      let current = ref seed in begin
        is_visited := PTree.set seed true !is_visited; (* mark seed visited *)
        let quit_loop = ref false in begin
          while not !quit_loop do
            let s = best_successor_of !current code !is_visited in
            match s with
            | None -> quit_loop := true (* if (s==0) exit loop *)
            | Some succ -> begin
                trace := !trace @ [succ];
                is_visited := PTree.set succ true !is_visited; (* mark s visited *)
                current := succ
                end
          done;
          current := seed;
          quit_loop := false;
          while not !quit_loop do
            let s = best_predecessor_of !current predecessors order !is_visited in
            match s with
            | None -> quit_loop := true (* if (s==0) exit loop *)
            | Some pred -> begin
                trace := pred :: !trace;
                is_visited := PTree.set pred true !is_visited; (* mark s visited *)
                current := pred
                end
          done;
          traces := !trace :: !traces;
        end
      end
    done;
    Printf.printf "DFS: \t"; print_intlist order; Printf.printf "\n";
    !traces
  end

let print_trace t = print_intlist t

let print_traces traces =
  let rec f = function
  | [] -> ()
  | t::lt -> Printf.printf "\n\t"; print_trace t; Printf.printf ",\n"; f lt
  in begin
    Printf.printf "Traces: {";
    f traces;
    Printf.printf "}\n";
  end

let rec make_identity_ptree_rec = function
| [] -> PTree.empty
| m::lm -> let (n, _) = m in PTree.set n n (make_identity_ptree_rec lm)

let make_identity_ptree f = make_identity_ptree_rec (PTree.elements f.fn_code)

(* FIXME - For now, identity *)
let tail_duplicate code ptree trace = (code, ptree)

let rec superblockify_traces code ptree = function
  | [] -> (code, ptree)
  | trace :: traces ->
      let new_code, new_ptree = tail_duplicate code ptree trace
      in superblockify_traces new_code new_ptree traces

(* For now, identity function *)
let duplicate_aux f =
  let entrypoint = fn_entrypoint f in
  let traces = select_traces (to_ttl_code (fn_code f) entrypoint) entrypoint in
  let pTreeId = make_identity_ptree f in
  let (new_code, pTreeId) = superblockify_traces (fn_code f) pTreeId traces in
  begin
    print_traces traces;
    ((new_code, (fn_entrypoint f)), pTreeId)
  end