Skip to content

Commit

Permalink
ssa: empirically faster passRedundantPhiEliminationOpt (#2214)
Browse files Browse the repository at this point in the history
Signed-off-by: Takeshi Yoneda <t.y.mathetake@gmail.com>
  • Loading branch information
mathetake authored May 23, 2024
1 parent 3383f44 commit eb24363
Show file tree
Hide file tree
Showing 2 changed files with 11 additions and 3 deletions.
11 changes: 8 additions & 3 deletions internal/engine/wazevo/ssa/pass.go
Original file line number Diff line number Diff line change
Expand Up @@ -22,9 +22,9 @@ func (b *builder) RunPasses() {
func (b *builder) runPreBlockLayoutPasses() {
passSortSuccessors(b)
passDeadBlockEliminationOpt(b)
passRedundantPhiEliminationOpt(b)
// The result of passCalculateImmediateDominators will be used by various passes below.
passCalculateImmediateDominators(b)
passRedundantPhiEliminationOpt(b)
passNopInstElimination(b)

// TODO: implement either conversion of irreducible CFG into reducible one, or irreducible CFG detection where we panic.
Expand Down Expand Up @@ -109,6 +109,8 @@ func passDeadBlockEliminationOpt(b *builder) {
}

// passRedundantPhiEliminationOpt eliminates the redundant PHIs (in our terminology, parameters of a block).
// This requires the reverse post-order traversal to be calculated before calling this function,
// hence passCalculateImmediateDominators must be called before this.
func passRedundantPhiEliminationOpt(b *builder) {
redundantParameterIndexes := b.ints[:0] // reuse the slice from previous iterations.

Expand All @@ -118,11 +120,14 @@ func passRedundantPhiEliminationOpt(b *builder) {
// relatively small. For example, sqlite speedtest binary results in the large number of redundant PHIs,
// the maximum number of iteration was 22, which seems to be acceptable but not that small either since the
// complexity here is O(BlockNum * Iterations) at the worst case where BlockNum might be the order of thousands.
// -- Note --
// Currently, each iteration can run in an order of blocks, but it empirically converges quickly in practice when
// running on the reverse post-order. It might be possible to optimize this further by using the dominator tree.
for {
changed := false
_ = b.blockIteratorBegin() // skip entry block!
_ = b.blockIteratorReversePostOrderBegin() // skip entry block!
// Below, we intentionally use the named iteration variable name, as this comes with inevitable nested for loops!
for blk := b.blockIteratorNext(); blk != nil; blk = b.blockIteratorNext() {
for blk := b.blockIteratorReversePostOrderNext(); blk != nil; blk = b.blockIteratorReversePostOrderNext() {
paramNum := len(blk.params)

for paramIndex := 0; paramIndex < paramNum; paramIndex++ {
Expand Down
3 changes: 3 additions & 0 deletions internal/engine/wazevo/ssa/pass_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -167,6 +167,9 @@ blk3: () <-- (blk1,blk2)
ret.AsReturn(ValuesNil)
b.InsertInstruction(ret)
}

// passRedundantPhiEliminationOpt requires the reverse post-order traversal to be calculated.
passCalculateImmediateDominators(b)
return nil
},
before: `
Expand Down

0 comments on commit eb24363

Please sign in to comment.