Fix bugs in SSA renaming and improve phi insertion

This commit is contained in:
Andrzej Janik
2020-04-30 00:20:12 +02:00
parent 7d38992e08
commit 6700f8bcc2

View File

@ -151,9 +151,9 @@ fn ssa_legalize(
bbs: Vec<BasicBlock>, bbs: Vec<BasicBlock>,
doms: &Vec<BBIndex>, doms: &Vec<BBIndex>,
dom_fronts: &Vec<HashSet<BBIndex>>, dom_fronts: &Vec<HashSet<BBIndex>>,
) { ) -> Vec<Vec<PhiDef>> {
let phis = gather_phi_sets(&func, max_id, &bbs, dom_fronts); let phis = gather_phi_sets(&func, max_id, &bbs, dom_fronts);
apply_ssa_renaming(func, &bbs, doms, max_id, &phis); apply_ssa_renaming(func, &bbs, doms, max_id, &phis)
} }
// "Modern Compiler Implementation in Java" - Algorithm 19.7 // "Modern Compiler Implementation in Java" - Algorithm 19.7
@ -163,9 +163,9 @@ fn apply_ssa_renaming(
doms: &[BBIndex], doms: &[BBIndex],
max_id: spirv::Word, max_id: spirv::Word,
old_phi: &[HashSet<spirv::Word>], old_phi: &[HashSet<spirv::Word>],
) { ) -> Vec<Vec<PhiDef>> {
let mut dom_tree = vec![Vec::new(); bbs.len()]; let mut dom_tree = vec![Vec::new(); bbs.len()];
for (bb, idom) in doms.iter().enumerate() { for (bb, idom) in doms.iter().enumerate().skip(1) {
dom_tree[idom.0].push(BBIndex(bb)); dom_tree[idom.0].push(BBIndex(bb));
} }
let mut old_dst_id = vec![Vec::new(); bbs.len()]; let mut old_dst_id = vec![Vec::new(); bbs.len()];
@ -178,7 +178,7 @@ fn apply_ssa_renaming(
.iter() .iter()
.map(|ids| { .map(|ids| {
ids.iter() ids.iter()
.map(|id| (*id, Vec::new())) .map(|id| (*id, (u32::max_value(), HashSet::new())))
.collect::<HashMap<_, _>>() .collect::<HashMap<_, _>>()
}) })
.collect::<Vec<_>>(); .collect::<Vec<_>>();
@ -190,7 +190,7 @@ fn apply_ssa_renaming(
if let Some((BBIndex(bb), dom_succ_idx)) = state.last_mut() { if let Some((BBIndex(bb), dom_succ_idx)) = state.last_mut() {
let bb = *bb; let bb = *bb;
if *dom_succ_idx == 0 { if *dom_succ_idx == 0 {
rename_phi_dst(max_id, &mut ssa_state, &mut new_phi[bb]); rename_phi_dst(&mut ssa_state, &mut new_phi[bb]);
rename_bb_body(&mut ssa_state, func, bbs, BBIndex(bb)); rename_bb_body(&mut ssa_state, func, bbs, BBIndex(bb));
for BBIndex(succ_idx) in bbs[bb].succ.iter() { for BBIndex(succ_idx) in bbs[bb].succ.iter() {
rename_succesor_phi_src(&ssa_state, &mut new_phi[*succ_idx]); rename_succesor_phi_src(&ssa_state, &mut new_phi[*succ_idx]);
@ -207,22 +207,32 @@ fn apply_ssa_renaming(
break; break;
} }
} }
new_phi
.into_iter()
.map(|map| {
map.into_iter()
.map(|(_, (new_id, defs))| PhiDef {
dst: new_id,
src: defs,
})
.collect::<Vec<_>>()
})
.collect::<Vec<_>>()
}
// before ssa-renaming every phi is x <- phi(x,x,x,x)
#[derive(Debug, PartialEq)]
struct PhiDef {
dst: spirv::Word,
src: HashSet<spirv::Word>,
} }
fn rename_phi_dst( fn rename_phi_dst(
max_old_id: spirv::Word,
rewriter: &mut SSARewriteState, rewriter: &mut SSARewriteState,
phi: &mut HashMap<spirv::Word, Vec<spirv::Word>>, phi: &mut HashMap<spirv::Word, (spirv::Word, HashSet<spirv::Word>)>,
) { ) {
let old_keys = phi for (old_k, (new_k, _)) in phi.iter_mut() {
.keys() *new_k = rewriter.redefine(*old_k);
.copied()
.filter(|id| *id <= max_old_id)
.collect::<Vec<_>>();
for k in old_keys.into_iter() {
let remapped_id = rewriter.redefine(k);
let values = phi.remove(&k).unwrap();
phi.insert(remapped_id, values);
} }
} }
@ -245,10 +255,10 @@ fn rename_bb_body(
fn rename_succesor_phi_src( fn rename_succesor_phi_src(
ssa_state: &SSARewriteState, ssa_state: &SSARewriteState,
phi: &mut HashMap<spirv::Word, Vec<spirv::Word>>, phi: &mut HashMap<spirv::Word, (spirv::Word, HashSet<spirv::Word>)>,
) { ) {
for (id, v) in phi.iter_mut() { for (id, (_, v)) in phi.iter_mut() {
v.push(ssa_state.get(*id)); v.insert(ssa_state.get(*id));
} }
} }
@ -295,9 +305,10 @@ struct SSARewriteState {
impl SSARewriteState { impl SSARewriteState {
fn new(max: spirv::Word) -> Self { fn new(max: spirv::Word) -> Self {
let stack = vec![Vec::new(); max as usize]; let len = max + 1;
let stack = (0..len).map(|x| vec![x + len]).collect::<Vec<_>>();
SSARewriteState { SSARewriteState {
next: max + 1, next: 2 * len,
stack, stack,
} }
} }
@ -318,40 +329,50 @@ impl SSARewriteState {
} }
} }
// "Modern Compiler Implementation in Java" - Algorithm 19.6 // "Engineering a Compiler" - Figure 9.9
// Calculates semi-pruned phis
fn gather_phi_sets( fn gather_phi_sets(
func: &[Statement], func: &[Statement],
max_id: spirv::Word, max_id: spirv::Word,
bbs: &[BasicBlock], cfg: &[BasicBlock],
dom_fronts: &[HashSet<BBIndex>], dom_fronts: &[HashSet<BBIndex>],
) -> Vec<HashSet<spirv::Word>> { ) -> Vec<HashSet<spirv::Word>> {
let mut result = vec![HashSet::new(); bbs.len()]; let mut result = vec![HashSet::new(); cfg.len()];
let mut bb_dst_definitions = vec![HashSet::new(); bbs.len()]; let mut globals = HashSet::new();
let mut def_sites = vec![(HashSet::new(), Vec::new()); (max_id as usize) + 1]; let mut blocks = vec![(Vec::new(), HashSet::new()); (max_id as usize) + 1];
for bb in 0..bbs.len() { for bb in 0..cfg.len() {
let bb = BBIndex(bb); let mut var_kill = HashSet::new();
for s in get_bb_body(func, bbs, bb) { let mut visitor = |is_dst, id: &u32| {
s.for_dst_id(&mut |id| { if is_dst {
bb_dst_definitions[bb.0].insert(id); var_kill.insert(*id);
let (ref mut set, ref mut stack) = def_sites[id as usize]; let (ref mut stack, ref mut set) = blocks[*id as usize];
if set.insert(bb) { stack.push(BBIndex(bb));
stack.push(bb); set.insert(BBIndex(bb));
} else {
if !var_kill.contains(id) {
globals.insert(*id);
} }
}); }
};
for s in get_bb_body(func, cfg, BBIndex(bb)) {
match s {
Statement::Instruction(pred, inst) => {
pred.as_ref().map(|p| p.visit_id(&mut visitor));
inst.visit_id(&mut visitor);
}
Statement::Label(_) => (),
}
} }
} }
for (id, to_work) in def_sites.iter_mut().enumerate() { for id in globals {
let id = id as spirv::Word; let (ref mut work_stack, ref mut work_set) = &mut blocks[id as usize];
let (ref mut set, ref mut stack) = to_work;
loop { loop {
if let Some(bb) = stack.pop() { if let Some(bb) = work_stack.pop() {
set.remove(&bb); work_set.remove(&bb);
for y_bb in &dom_fronts[bb.0] { for d_bb in &dom_fronts[bb.0] {
if result[y_bb.0].insert(id) { if result[d_bb.0].insert(id) {
if !bb_dst_definitions[y_bb.0].contains(&id) { if work_set.insert(*d_bb) {
if set.insert(*y_bb) { work_stack.push(*d_bb);
stack.push(*y_bb);
}
} }
} }
} }
@ -596,6 +617,16 @@ impl Statement {
} }
} }
/// Read-only walk over every id mentioned by this statement.
///
/// `f` is called once per id; the `bool` is `true` when the id is being
/// defined and `false` otherwise. A label counts as a definition of its own
/// id. For an instruction the optional predicate is visited first, then the
/// instruction itself.
fn visit_id<F: FnMut(bool, &spirv::Word)>(&self, f: &mut F) {
    let (guard, instruction) = match self {
        Statement::Label(id) => return f(true, id),
        Statement::Instruction(pred, inst) => (pred, inst),
    };
    if let Some(guard) = guard {
        guard.visit_id(f);
    }
    instruction.visit_id(f);
}
fn visit_id_mut<F: FnMut(bool, &mut spirv::Word)>(&mut self, f: &mut F) { fn visit_id_mut<F: FnMut(bool, &mut spirv::Word)>(&mut self, f: &mut F) {
match self { match self {
Statement::Label(id) => f(true, id), Statement::Label(id) => f(true, id),
@ -615,6 +646,10 @@ impl<T> ast::PredAt<T> {
} }
} }
/// Reports the predicate's `label` id to `f`, flagged `false` (not a definition).
fn visit_id<F: FnMut(bool, &T)>(&self, f: &mut F) {
    let guard_id = &self.label;
    f(false, guard_id)
}
fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) { fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) {
f(false, &mut self.label) f(false, &mut self.label)
} }
@ -642,6 +677,23 @@ impl<T> ast::Instruction<T> {
} }
} }
/// Read-only walk over the ids referenced by this instruction.
///
/// Every variant that carries an argument struct forwards `f` to that
/// struct's own `visit_id`; the first field of each variant is ignored.
/// The `bool` passed to `f` is chosen by the argument struct, not here.
fn visit_id<F: FnMut(bool, &T)>(&self, f: &mut F) {
match self {
ast::Instruction::Ld(_, a) => a.visit_id(f),
ast::Instruction::Mov(_, a) => a.visit_id(f),
ast::Instruction::Mul(_, a) => a.visit_id(f),
ast::Instruction::Add(_, a) => a.visit_id(f),
ast::Instruction::Setp(_, a) => a.visit_id(f),
ast::Instruction::SetpBool(_, a) => a.visit_id(f),
ast::Instruction::Not(_, a) => a.visit_id(f),
ast::Instruction::Cvt(_, a) => a.visit_id(f),
ast::Instruction::Shl(_, a) => a.visit_id(f),
ast::Instruction::St(_, a) => a.visit_id(f),
ast::Instruction::Bra(_, a) => a.visit_id(f),
// Nothing is reported for `Ret`.
ast::Instruction::Ret(_) => (),
}
}
fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) { fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) {
match self { match self {
ast::Instruction::Ld(_, a) => a.visit_id_mut(f), ast::Instruction::Ld(_, a) => a.visit_id_mut(f),
@ -718,6 +770,10 @@ impl<T> ast::Arg1<T> {
ast::Arg1 { src: f(self.src) } ast::Arg1 { src: f(self.src) }
} }
fn visit_id<F: FnMut(bool, &T)>(&self, f: &mut F) {
f(false, &self.src);
}
fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) { fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) {
f(false, &mut self.src); f(false, &mut self.src);
} }
@ -731,6 +787,11 @@ impl<T> ast::Arg2<T> {
} }
} }
/// Read-only walk over the ids of a destination/source argument pair.
///
/// Ids reported by the source operand are delivered first, then the
/// destination is delivered with the flag set to `true`.
fn visit_id<F: FnMut(bool, &T)>(&self, f: &mut F) {
    // Sources go first. `gather_phi_sets` only treats a source as a global
    // name if the block has not yet recorded a write to it in `var_kill`;
    // reporting the destination first made `x = op(x)` hide the
    // upward-exposed read of `x`, so no phi was ever placed for it.
    self.src.visit_id(f);
    f(true, &self.dst);
}
fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) { fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) {
f(true, &mut self.dst); f(true, &mut self.dst);
self.src.visit_id_mut(f); self.src.visit_id_mut(f);
@ -751,6 +812,11 @@ impl<T> ast::Arg2Mov<T> {
} }
} }
/// Read-only walk over the ids of a `mov`-style destination/source pair.
///
/// Ids reported by the source operand are delivered first, then the
/// destination is delivered with the flag set to `true`.
fn visit_id<F: FnMut(bool, &T)>(&self, f: &mut F) {
    // Sources go first. `gather_phi_sets` only treats a source as a global
    // name if the block has not yet recorded a write to it in `var_kill`;
    // reporting the destination first made `mov x, x`-like self references
    // hide the upward-exposed read of `x`.
    self.src.visit_id(f);
    f(true, &self.dst);
}
fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) { fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) {
f(true, &mut self.dst); f(true, &mut self.dst);
self.src.visit_id_mut(f); self.src.visit_id_mut(f);
@ -772,6 +838,12 @@ impl<T> ast::Arg3<T> {
} }
} }
/// Read-only walk over the ids of a one-destination, two-source argument set.
///
/// Ids reported by `src1` and then `src2` are delivered first; the
/// destination follows with the flag set to `true`.
fn visit_id<F: FnMut(bool, &T)>(&self, f: &mut F) {
    // Sources go first. `gather_phi_sets` only treats a source as a global
    // name if the block has not yet recorded a write to it in `var_kill`;
    // with the destination reported first, `add x, x, 1` never exposed the
    // incoming value of `x` and the loop-carried phi was lost.
    self.src1.visit_id(f);
    self.src2.visit_id(f);
    f(true, &self.dst);
}
fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) { fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) {
f(true, &mut self.dst); f(true, &mut self.dst);
self.src1.visit_id_mut(f); self.src1.visit_id_mut(f);
@ -795,6 +867,13 @@ impl<T> ast::Arg4<T> {
} }
} }
/// Read-only walk over the ids of a two-destination, two-source argument set.
///
/// Ids reported by `src1` and `src2` are delivered first. Then `dst1` and,
/// when present, `dst2` are delivered with the flag set to `true`.
fn visit_id<F: FnMut(bool, &T)>(&self, f: &mut F) {
    // Sources go first. `gather_phi_sets` only treats a source as a global
    // name if the block has not yet recorded a write to it in `var_kill`;
    // reporting destinations first hid reads of an id that the same
    // instruction also writes.
    self.src1.visit_id(f);
    self.src2.visit_id(f);
    f(true, &self.dst1);
    // The second destination is optional.
    if let Some(dst2) = &self.dst2 {
        f(true, dst2);
    }
}
fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) { fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) {
f(true, &mut self.dst1); f(true, &mut self.dst1);
self.dst2.as_mut().map(|i| f(true, i)); self.dst2.as_mut().map(|i| f(true, i));
@ -821,6 +900,14 @@ impl<T> ast::Arg5<T> {
} }
} }
/// Read-only walk over the ids of a two-destination, three-source argument set.
///
/// Ids reported by `src1`, `src2` and `src3` are delivered first. Then
/// `dst1` and, when present, `dst2` are delivered with the flag set to `true`.
fn visit_id<F: FnMut(bool, &T)>(&self, f: &mut F) {
    // Sources go first. `gather_phi_sets` only treats a source as a global
    // name if the block has not yet recorded a write to it in `var_kill`;
    // reporting destinations first hid reads of an id that the same
    // instruction also writes.
    self.src1.visit_id(f);
    self.src2.visit_id(f);
    self.src3.visit_id(f);
    f(true, &self.dst1);
    // The second destination is optional.
    if let Some(dst2) = &self.dst2 {
        f(true, dst2);
    }
}
fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) { fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) {
f(true, &mut self.dst1); f(true, &mut self.dst1);
self.dst2.as_mut().map(|i| f(true, i)); self.dst2.as_mut().map(|i| f(true, i));
@ -846,6 +933,14 @@ impl<T> ast::Operand<T> {
} }
} }
/// Reports the register id of this operand, if it has one.
///
/// Both register forms pass their id to `f` flagged `false` (not a
/// definition); an immediate reports nothing.
fn visit_id<F: FnMut(bool, &T)>(&self, f: &mut F) {
    match self {
        ast::Operand::Imm(_) => (),
        ast::Operand::Reg(reg) | ast::Operand::RegOffset(reg, _) => f(false, reg),
    }
}
fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) { fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) {
match self { match self {
ast::Operand::Reg(i) => f(false, i), ast::Operand::Reg(i) => f(false, i),
@ -863,6 +958,13 @@ impl<T> ast::MovOperand<T> {
} }
} }
/// Read-only walk over the ids of a `mov` source operand.
///
/// A plain operand is forwarded to its own `visit_id`; the `Vec` variant
/// reports nothing.
fn visit_id<F: FnMut(bool, &T)>(&self, f: &mut F) {
    match self {
        // NOTE(review): no id is reported for `Vec`; confirm its fields do
        // not carry ids that callers need to see.
        ast::MovOperand::Vec(_, _) => (),
        ast::MovOperand::Op(operand) => operand.visit_id(f),
    }
}
fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) { fn visit_id_mut<F: FnMut(bool, &mut T)>(&mut self, f: &mut F) {
match self { match self {
ast::MovOperand::Op(o) => o.visit_id_mut(f), ast::MovOperand::Op(o) => o.visit_id_mut(f),
@ -1202,7 +1304,7 @@ mod tests {
} }
// page 403 // page 403
const fig_19_4: &'static str = "{ const FIG_19_4: &'static str = "{
mov.u32 i, 1; mov.u32 i, 1;
mov.u32 j, 1; mov.u32 j, 1;
mov.u32 k, 0; mov.u32 k, 0;
@ -1226,8 +1328,8 @@ mod tests {
}"; }";
#[test] #[test]
fn gather_phi_sets_fig_19_4() { fn get_basic_blocks_fig_19_4() {
let func = fig_19_4; let func = FIG_19_4;
let mut errors = Vec::new(); let mut errors = Vec::new();
let ast = ptx::FunctionBodyParser::new() let ast = ptx::FunctionBodyParser::new()
.parse(&mut errors, func) .parse(&mut errors, func)
@ -1348,7 +1450,6 @@ mod tests {
); );
} }
// page 403
#[test] #[test]
fn dominance_frontiers_fig_19_4() { fn dominance_frontiers_fig_19_4() {
let cfg = cfg_fig_19_4(); let cfg = cfg_fig_19_4();
@ -1369,4 +1470,45 @@ mod tests {
]; ];
assert_eq!(dom_fronts, should); assert_eq!(dom_fronts, should);
} }
// Runs the whole analysis pipeline on `FIG_19_4` and checks which ids
// `gather_phi_sets` asks a phi for in each of the seven basic blocks.
#[test]
fn gather_phi_sets_fig_19_4() {
    // The fixture must parse without any reported error.
    let mut parse_errors = Vec::new();
    let parsed_body = ptx::FunctionBodyParser::new()
        .parse(&mut parse_errors, FIG_19_4)
        .unwrap();
    assert_eq!(parse_errors.len(), 0);

    // Build each input of `gather_phi_sets` from the previous stage.
    let (statements, max_id) = normalize_identifiers(parsed_body);
    let cfg = get_basic_blocks(&statements);
    let visit_order = to_reverse_postorder(&cfg);
    let idoms = immediate_dominators(&cfg, &visit_order);
    let frontiers = dominance_frontiers(&cfg, &idoms);

    // Only blocks 1 and 5 are expected to need phis, both for ids 1 and 2
    // (presumably `j` and `k` after identifier normalization — TODO confirm).
    let no_phis = || HashSet::new();
    assert_eq!(
        gather_phi_sets(&statements, max_id, &cfg, &frontiers),
        vec![
            no_phis(),
            to_hashset(vec![1, 2]),
            no_phis(),
            no_phis(),
            no_phis(),
            to_hashset(vec![1, 2]),
            no_phis()
        ]
    );
}
/// Moves the elements of `v` into a `HashSet`; duplicates collapse into one entry.
fn to_hashset<T: std::hash::Hash + Eq>(v: Vec<T>) -> HashSet<T> {
    let mut unique = HashSet::with_capacity(v.len());
    unique.extend(v);
    unique
}
/// Panics if any destination id reported by `for_dst_id` shows up more than
/// once across the statements of `func`.
fn assert_dst_unique(func: &[Statement]) {
    let mut already_defined = HashSet::new();
    func.iter().for_each(|statement| {
        statement.for_dst_id(&mut |dst| {
            // `insert` returns false when the id was already recorded.
            assert!(already_defined.insert(dst));
        });
    });
}
} }