Skip to content
Snippets Groups Projects
Commit 160c4ae2 authored by Cyril SIX's avatar Cyril SIX
Browse files

Fixing get_loop_headers + alternative get_inner_loops (commented, not active)

parent 9b6758f4
No related branches found
No related tags found
No related merge requests found
Pipeline #52035 passed
...@@ -30,7 +30,9 @@ let get_some = LICMaux.get_some ...@@ -30,7 +30,9 @@ let get_some = LICMaux.get_some
let rtl_successors = LICMaux.rtl_successors let rtl_successors = LICMaux.rtl_successors
(* Get list of nodes following a BFS of the code *) (* Get list of nodes following a BFS of the code *)
let bfs code entrypoint = begin (* Stops when predicate is reached
* Excludes any node given in excluded function *)
let bfs_until code entrypoint (predicate: node->bool) (excluded: node->bool) = begin
debug "bfs\n"; debug "bfs\n";
let visited = ref (PTree.map (fun n i -> false) code) let visited = ref (PTree.map (fun n i -> false) code)
and bfs_list = ref [] and bfs_list = ref []
...@@ -40,20 +42,24 @@ let bfs code entrypoint = begin ...@@ -40,20 +42,24 @@ let bfs code entrypoint = begin
Queue.add entrypoint to_visit; Queue.add entrypoint to_visit;
while not (Queue.is_empty to_visit) do while not (Queue.is_empty to_visit) do
node := Queue.pop to_visit; node := Queue.pop to_visit;
if not (get_some @@ PTree.get !node !visited) then begin if (not (get_some @@ PTree.get !node !visited)) then begin
visited := PTree.set !node true !visited; visited := PTree.set !node true !visited;
match PTree.get !node code with if not (excluded !node) then begin
| None -> failwith "No such node" match PTree.get !node code with
| Some i -> | None -> failwith "No such node"
bfs_list := !node :: !bfs_list; | Some i ->
let succ = rtl_successors i in bfs_list := !node :: !bfs_list;
List.iter (fun n -> Queue.add n to_visit) succ if not (predicate !node) then
let succ = rtl_successors i in List.iter (fun n -> Queue.add n to_visit) succ
end
end end
done; done;
List.rev !bfs_list List.rev !bfs_list
end end
end end
let bfs code entrypoint = bfs_until code entrypoint (fun _ -> false) (fun _ -> false)
let optbool o = match o with Some _ -> true | None -> false let optbool o = match o with Some _ -> true | None -> false
let ptree_get_some n ptree = get_some @@ PTree.get n ptree let ptree_get_some n ptree = get_some @@ PTree.get n ptree
...@@ -81,15 +87,7 @@ end ...@@ -81,15 +87,7 @@ end
module PSet = Set.Make(PInt) module PSet = Set.Make(PInt)
let print_intlist oc l = let print_intlist = LICMaux.print_intlist
let rec f oc = function
| [] -> ()
| n::ln -> (Printf.fprintf oc "%d %a" (P.to_int n) f ln)
in begin
if !debug_flag then begin
Printf.fprintf oc "[%a]" f l
end
end
let print_intset s = let print_intset s =
let seq = PSet.to_seq s let seq = PSet.to_seq s
...@@ -627,7 +625,7 @@ let invert_iconds code = ...@@ -627,7 +625,7 @@ let invert_iconds code =
type innerLoop = { type innerLoop = {
preds: P.t list; preds: P.t list;
body: HashedSet.PSet.t; body: P.t list;
head: P.t; (* head of the loop *) head: P.t; (* head of the loop *)
final: P.t (* the final instruction, which loops back to the head *) final: P.t (* the final instruction, which loops back to the head *)
} }
...@@ -635,7 +633,7 @@ type innerLoop = { ...@@ -635,7 +633,7 @@ type innerLoop = {
let print_pset = LICMaux.pp_pset let print_pset = LICMaux.pp_pset
let print_inner_loop iloop = let print_inner_loop iloop =
debug "{preds: %a, body: %a}" print_intlist iloop.preds print_pset iloop.body debug "{preds: %a, body: %a}" print_intlist iloop.preds print_intlist iloop.body
let rec print_inner_loops = function let rec print_inner_loops = function
| [] -> () | [] -> ()
...@@ -657,6 +655,53 @@ let print_ptree printer pt = ...@@ -657,6 +655,53 @@ let print_ptree printer pt =
let print_pint oc i = if !debug_flag then Printf.fprintf oc "%d" (P.to_int i) else () let print_pint oc i = if !debug_flag then Printf.fprintf oc "%d" (P.to_int i) else ()
let cb_exit_node = function
| Icond (_,_,n1,n2,p) -> begin match p with
| Some true -> Some n2
| Some false -> Some n1
| None -> None
end
| _ -> None
let get_natural_loop code predmap n =
let is_final_node m =
let successors = rtl_successors @@ get_some @@ PTree.get m code in
List.exists (fun s -> (P.to_int s) == (P.to_int n)) successors
in
let excluded_node = cb_exit_node @@ get_some @@ PTree.get n code in
let is_excluded m = match excluded_node with
| None -> false
| Some ex -> P.to_int ex == P.to_int m
in
debug "get_natural_loop for %d\n" (P.to_int n);
let body = bfs_until code n is_final_node is_excluded in
debug "BODY: %a\n" print_intlist body;
let final = List.find is_final_node body in
debug "FINAL: %d\n" (P.to_int final);
let preds = List.filter (fun pred -> List.mem pred body) @@ get_some @@ PTree.get n predmap in
debug "PREDS: %a\n" print_intlist preds;
{ preds = preds; body = body; head = n; final = final }
let rec count_loop_headers is_loop_header = function
| [] -> 0
| n :: ln ->
let rem = count_loop_headers is_loop_header ln in
if (get_some @@ PTree.get n is_loop_header) then rem + 1 else rem
(* Alternative code to get inner_loops - use it if we suspect the other function to be bugged *)
(*
let get_inner_loops f code is_loop_header =
let predmap = get_predecessors_rtl code in
let iloops = ref [] in
List.iter (fun (n, ilh) -> if ilh then
let iloop = get_natural_loop code predmap n in
let nb_headers = count_loop_headers is_loop_header iloop.body in
if nb_headers == 1 then (* innermost loop *)
iloops := iloop :: !iloops
) (PTree.elements is_loop_header);
!iloops
*)
let get_inner_loops f code is_loop_header = let get_inner_loops f code is_loop_header =
let fake_f = { fn_sig = f.fn_sig; fn_params = f.fn_params; let fake_f = { fn_sig = f.fn_sig; fn_params = f.fn_params;
fn_stacksize = f.fn_stacksize; fn_code = code; fn_entrypoint = f.fn_entrypoint } in fn_stacksize = f.fn_stacksize; fn_code = code; fn_entrypoint = f.fn_entrypoint } in
...@@ -684,7 +729,7 @@ let get_inner_loops f code is_loop_header = ...@@ -684,7 +729,7 @@ let get_inner_loops f code is_loop_header =
assert (List.length filtered == 1); assert (List.length filtered == 1);
List.hd filtered List.hd filtered
end in end in
{ preds = preds; body = body; head = head; final = final } { preds = preds; body = (HashedSet.PSet.elements body); head = head; final = final }
) )
(* LICMaux.inner_loops also returns non-inner loops, but with a body of 1 instruction (* LICMaux.inner_loops also returns non-inner loops, but with a body of 1 instruction
* We remove those to get just the inner loops *) * We remove those to get just the inner loops *)
...@@ -769,7 +814,7 @@ let rec count_ignore_nops code = function ...@@ -769,7 +814,7 @@ let rec count_ignore_nops code = function
* 3) Links the last instruction of body' into the first instruction of body * 3) Links the last instruction of body' into the first instruction of body
*) *)
let unroll_inner_loop_single code revmap iloop = let unroll_inner_loop_single code revmap iloop =
let body = HashedSet.PSet.elements (iloop.body) in let body = iloop.body in
if count_ignore_nops code body > !Clflags.option_funrollsingle then begin if count_ignore_nops code body > !Clflags.option_funrollsingle then begin
debug "Too many nodes in the loop body (%d > %d)" (List.length body) !Clflags.option_funrollsingle; debug "Too many nodes in the loop body (%d > %d)" (List.length body) !Clflags.option_funrollsingle;
(code, revmap) (code, revmap)
...@@ -806,7 +851,7 @@ let unroll_inner_loops_single f code revmap = ...@@ -806,7 +851,7 @@ let unroll_inner_loops_single f code revmap =
* 3) Links the last instruction of body' into the first of body * 3) Links the last instruction of body' into the first of body
*) *)
let unroll_inner_loop_body code revmap iloop = let unroll_inner_loop_body code revmap iloop =
let body = HashedSet.PSet.elements (iloop.body) in let body = iloop.body in
let limit = !Clflags.option_funrollbody in let limit = !Clflags.option_funrollbody in
if count_ignore_nops code body > limit then begin if count_ignore_nops code body > limit then begin
debug "Too many nodes in the loop body (%d > %d)" (List.length body) limit; debug "Too many nodes in the loop body (%d > %d)" (List.length body) limit;
...@@ -824,7 +869,9 @@ let unroll_inner_loop_body code revmap iloop = ...@@ -824,7 +869,9 @@ let unroll_inner_loop_body code revmap iloop =
let unroll_inner_loops_body f code revmap = let unroll_inner_loops_body f code revmap =
let is_loop_header = get_loop_headers code (f.fn_entrypoint) in let is_loop_header = get_loop_headers code (f.fn_entrypoint) in
(* debug_flag := true; *)
let inner_loops = get_inner_loops f code is_loop_header in let inner_loops = get_inner_loops f code is_loop_header in
debug "Number of loops found: %d\n" (List.length inner_loops);
let code' = ref code in let code' = ref code in
let revmap' = ref revmap in let revmap' = ref revmap in
begin begin
...@@ -832,7 +879,7 @@ let unroll_inner_loops_body f code revmap = ...@@ -832,7 +879,7 @@ let unroll_inner_loops_body f code revmap =
List.iter (fun iloop -> List.iter (fun iloop ->
let (new_code, new_revmap) = unroll_inner_loop_body !code' !revmap' iloop in let (new_code, new_revmap) = unroll_inner_loop_body !code' !revmap' iloop in
code' := new_code; revmap' := new_revmap code' := new_code; revmap' := new_revmap
) inner_loops; ) inner_loops; (* debug_flag := false; *)
(!code', !revmap') (!code', !revmap')
end end
......
...@@ -39,6 +39,28 @@ let rtl_successors = function ...@@ -39,6 +39,28 @@ let rtl_successors = function
| Icond (_,_,n1,n2,_) -> [n1; n2] | Icond (_,_,n1,n2,_) -> [n1; n2]
| Ijumptable (_,ln) -> ln | Ijumptable (_,ln) -> ln
let print_ptree_bool oc pt =
if !debug_flag then
let elements = PTree.elements pt in
begin
Printf.fprintf oc "[";
List.iter (fun (n, b) ->
if b then Printf.fprintf oc "%d, " (P.to_int n)
) elements;
Printf.fprintf oc "]\n"
end
else ()
let print_intlist oc l =
let rec f oc = function
| [] -> ()
| n::ln -> (Printf.fprintf oc "%d %a" (P.to_int n) f ln)
in begin
if !debug_flag then begin
Printf.fprintf oc "[%a]" f l
end
end
(** Getting loop branches with a DFS visit : (** Getting loop branches with a DFS visit :
* Each node is either Unvisited, Visited, or Processed * Each node is either Unvisited, Visited, or Processed
* pre-order: node becomes Processed * pre-order: node becomes Processed
...@@ -53,23 +75,34 @@ let get_loop_headers code entrypoint = begin ...@@ -53,23 +75,34 @@ let get_loop_headers code entrypoint = begin
in let rec dfs_visit code = function in let rec dfs_visit code = function
| [] -> () | [] -> ()
| node :: ln -> | node :: ln ->
debug "ENTERING node %d, REM are %a\n" (P.to_int node) print_intlist ln;
match (get_some @@ PTree.get node !visited) with match (get_some @@ PTree.get node !visited) with
| Visited -> () | Visited -> begin
debug "\tNode %d is already Visited, skipping\n" (P.to_int node);
dfs_visit code ln
end
| Processed -> begin | Processed -> begin
debug "Node %d is a loop header\n" (P.to_int node); debug "Node %d is a loop header\n" (P.to_int node);
is_loop_header := PTree.set node true !is_loop_header; is_loop_header := PTree.set node true !is_loop_header;
visited := PTree.set node Visited !visited visited := PTree.set node Visited !visited;
dfs_visit code ln
end end
| Unvisited -> begin | Unvisited -> begin
visited := PTree.set node Processed !visited; visited := PTree.set node Processed !visited;
match PTree.get node code with debug "Node %d is Processed\n" (P.to_int node);
(match PTree.get node code with
| None -> failwith "No such node" | None -> failwith "No such node"
| Some i -> let next_visits = rtl_successors i in dfs_visit code next_visits; | Some i -> let next_visits = rtl_successors i in begin
debug "About to visit: %a\n" print_intlist next_visits;
dfs_visit code next_visits
end);
debug "Node %d is Visited!\n" (P.to_int node);
visited := PTree.set node Visited !visited; visited := PTree.set node Visited !visited;
dfs_visit code ln dfs_visit code ln
end end
in begin in begin
dfs_visit code [entrypoint]; dfs_visit code [entrypoint];
debug "LOOP HEADERS: %a\n" print_ptree_bool !is_loop_header;
!is_loop_header !is_loop_header
end end
end end
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment