Skip to content
Snippets Groups Projects
cpu.sch 1.19 KiB
Newer Older
// simpl!(X): reusable cleanup pipeline applied to the selection X.
// Runs these passes in this fixed order: ccp, simplify-cfg, lift-dc-math,
// gvn, phi-elim, dce, infer-schedules. It is invoked after most of the
// transformation steps further down in this script.
// NOTE(review): going by the pass names this looks like constant propagation,
// CFG simplification, value numbering and dead-code elimination — confirm
// against the scheduler's pass definitions.
macro simpl!(X) {
  ccp(X);
  simplify-cfg(X);
  lift-dc-math(X);
  gvn(X);
  phi-elim(X);
  dce(X);
  // Last step of every cleanup: re-run infer-schedules on X.
  infer-schedules(X);
}

// Initial preparation of `bfs`: run phi-elim on the whole function, then apply
// no-memset to `bfs@cost`.
// NOTE(review): no-memset presumably marks the `cost` value so that it is not
// zero-initialized — confirm against the scheduler's schedule list.
phi-elim(bfs);
no-memset(bfs@cost);
rarbore2's avatar
rarbore2 committed
// Outline three labeled parts of `bfs` (`cost_init`, `loop1`, `loop2`) and bind
// the results to `init`, `traverse` and `collect`; later steps refer to them
// by these names.
let init = outline(bfs@cost_init);
let traverse = outline(bfs@loop1);
let collect = outline(bfs@loop2);

// First global round on `*` (presumably every function — confirm): cleanup,
// then predication and const-inline.
simpl!(*);
predication(*);
const-inline(*);
rarbore2's avatar
rarbore2 committed
// Run loop-bound-canon on everything and clean up, then apply forkify and
// fork-guard-elim inside a `fixpoint` block, followed by another cleanup.
// NOTE(review): `fixpoint` presumably repeats its body until no pass reports a
// change — confirm against the scheduler semantics.
loop-bound-canon(*);
simpl!(*);
fixpoint {
  forkify(*);
  fork-guard-elim(*);
}
simpl!(*);
rarbore2's avatar
rarbore2 committed
// Second predication round (the first ran before forkify), followed by cleanup.
predication(*);
simpl!(*);
rarbore2's avatar
rarbore2 committed
// Run reduce-slf and then slf on everything, with a cleanup after each.
// NOTE(review): "slf" presumably stands for store-to-load forwarding — confirm.
reduce-slf(*);
simpl!(*);
slf(*);
simpl!(*);

// Repeat forkify + fork-guard-elim on `collect` only, then clean up `collect`.
fixpoint {
  forkify(collect);
  fork-guard-elim(collect);
}
simpl!(collect);

// Apply the parallel-fork and parallel-reduce schedules to both outlined loops.
parallel-fork(traverse, collect);
parallel-reduce(traverse, collect);
rarbore2's avatar
rarbore2 committed
// Apply fork-tile with [32, 0, false, true] to `traverse` and `collect`, then
// for each of them run fork-reshape, which yields an (outer, inner) pair, and
// outline the `inner` part as a separate body.
// NOTE(review): the meaning of the bracketed fork-tile / fork-reshape arguments
// is not visible in this file — confirm against the pass definitions.
fork-tile[32, 0, false, true](traverse, collect);
let (outer, inner) = fork-reshape[[1], [0]](traverse);
let traverse_body = outline(inner);
// `outer` and `inner` are rebound here; `outer` is not read anywhere in the
// visible part of this script.
let (outer, inner) = fork-reshape[[1], [0]](collect);
let collect_body = outline(inner);

// `init` is used directly as its own body, without tiling.
let init_body = init;
// The tiling sequence below is left disabled: it seems to generate breaking RT code
//fork-tile[32, 0, false, true](init);
//let (outer, inner) = fork-reshape[[1], [0]](init);
//let init_body = outline(inner);
//inline(bfs@cost_init);

// Run inline on `bfs@loop1` and `bfs@loop2`, then delete-uncalled and
// const-inline on everything.
inline(bfs@loop1, bfs@loop2);
delete-uncalled(*);
const-inline(*);

// Finally run unforkify on the three bodies and do a last global cleanup.
unforkify(init_body, traverse_body, collect_body);
simpl!(*);