// Copyright 2015 The Go Authors. All rights reserved.
|
// Use of this source code is governed by a BSD-style
|
// license that can be found in the LICENSE file.
|
|
package ssa
|
|
// mark values
|
type markKind uint8
|
|
const (
|
notFound markKind = 0 // block has not been discovered yet
|
notExplored markKind = 1 // discovered and in queue, outedges not processed yet
|
explored markKind = 2 // discovered and in queue, outedges processed
|
done markKind = 3 // all done, in output ordering
|
)
|
|
// This file contains code to compute the dominator tree
|
// of a control-flow graph.
|
|
// postorder computes a postorder traversal ordering for the
|
// basic blocks in f. Unreachable blocks will not appear.
|
func postorder(f *Func) []*Block {
|
return postorderWithNumbering(f, []int32{})
|
}
|
|
type blockAndIndex struct {
|
b *Block
|
index int // index is the number of successor edges of b that have already been explored.
|
}
|
|
// postorderWithNumbering provides a DFS postordering.
|
// This seems to make loop-finding more robust.
|
func postorderWithNumbering(f *Func, ponums []int32) []*Block {
|
mark := make([]markKind, f.NumBlocks())
|
|
// result ordering
|
var order []*Block
|
|
// stack of blocks and next child to visit
|
// A constant bound allows this to be stack-allocated. 32 is
|
// enough to cover almost every postorderWithNumbering call.
|
s := make([]blockAndIndex, 0, 32)
|
s = append(s, blockAndIndex{b: f.Entry})
|
mark[f.Entry.ID] = explored
|
for len(s) > 0 {
|
tos := len(s) - 1
|
x := s[tos]
|
b := x.b
|
i := x.index
|
if i < len(b.Succs) {
|
s[tos].index++
|
bb := b.Succs[i].Block()
|
if mark[bb.ID] == notFound {
|
mark[bb.ID] = explored
|
s = append(s, blockAndIndex{b: bb})
|
}
|
} else {
|
s = s[:tos]
|
if len(ponums) > 0 {
|
ponums[b.ID] = int32(len(order))
|
}
|
order = append(order, b)
|
}
|
}
|
return order
|
}
|
|
type linkedBlocks func(*Block) []Edge
|
|
const nscratchslices = 7
|
|
// experimentally, functions with 512 or fewer blocks account
|
// for 75% of memory (size) allocation for dominator computation
|
// in make.bash.
|
const minscratchblocks = 512
|
|
func (cache *Cache) scratchBlocksForDom(maxBlockID int) (a, b, c, d, e, f, g []ID) {
|
tot := maxBlockID * nscratchslices
|
scratch := cache.domblockstore
|
if len(scratch) < tot {
|
// req = min(1.5*tot, nscratchslices*minscratchblocks)
|
// 50% padding allows for graph growth in later phases.
|
req := (tot * 3) >> 1
|
if req < nscratchslices*minscratchblocks {
|
req = nscratchslices * minscratchblocks
|
}
|
scratch = make([]ID, req)
|
cache.domblockstore = scratch
|
} else {
|
// Clear as much of scratch as we will (re)use
|
scratch = scratch[0:tot]
|
for i := range scratch {
|
scratch[i] = 0
|
}
|
}
|
|
a = scratch[0*maxBlockID : 1*maxBlockID]
|
b = scratch[1*maxBlockID : 2*maxBlockID]
|
c = scratch[2*maxBlockID : 3*maxBlockID]
|
d = scratch[3*maxBlockID : 4*maxBlockID]
|
e = scratch[4*maxBlockID : 5*maxBlockID]
|
f = scratch[5*maxBlockID : 6*maxBlockID]
|
g = scratch[6*maxBlockID : 7*maxBlockID]
|
|
return
|
}
|
|
func dominators(f *Func) []*Block {
|
preds := func(b *Block) []Edge { return b.Preds }
|
succs := func(b *Block) []Edge { return b.Succs }
|
|
//TODO: benchmark and try to find criteria for swapping between
|
// dominatorsSimple and dominatorsLT
|
return f.dominatorsLTOrig(f.Entry, preds, succs)
|
}
|
|
// dominatorsLTOrig runs Lengauer-Tarjan to compute a dominator tree starting at
|
// entry and using predFn/succFn to find predecessors/successors to allow
|
// computing both dominator and post-dominator trees.
|
func (f *Func) dominatorsLTOrig(entry *Block, predFn linkedBlocks, succFn linkedBlocks) []*Block {
|
// Adapted directly from the original TOPLAS article's "simple" algorithm
|
|
maxBlockID := entry.Func.NumBlocks()
|
semi, vertex, label, parent, ancestor, bucketHead, bucketLink := f.Cache.scratchBlocksForDom(maxBlockID)
|
|
// This version uses integers for most of the computation,
|
// to make the work arrays smaller and pointer-free.
|
// fromID translates from ID to *Block where that is needed.
|
fromID := make([]*Block, maxBlockID)
|
for _, v := range f.Blocks {
|
fromID[v.ID] = v
|
}
|
idom := make([]*Block, maxBlockID)
|
|
// Step 1. Carry out a depth first search of the problem graph. Number
|
// the vertices from 1 to n as they are reached during the search.
|
n := f.dfsOrig(entry, succFn, semi, vertex, label, parent)
|
|
for i := n; i >= 2; i-- {
|
w := vertex[i]
|
|
// step2 in TOPLAS paper
|
for _, e := range predFn(fromID[w]) {
|
v := e.b
|
if semi[v.ID] == 0 {
|
// skip unreachable predecessor
|
// not in original, but we're using existing pred instead of building one.
|
continue
|
}
|
u := evalOrig(v.ID, ancestor, semi, label)
|
if semi[u] < semi[w] {
|
semi[w] = semi[u]
|
}
|
}
|
|
// add w to bucket[vertex[semi[w]]]
|
// implement bucket as a linked list implemented
|
// in a pair of arrays.
|
vsw := vertex[semi[w]]
|
bucketLink[w] = bucketHead[vsw]
|
bucketHead[vsw] = w
|
|
linkOrig(parent[w], w, ancestor)
|
|
// step3 in TOPLAS paper
|
for v := bucketHead[parent[w]]; v != 0; v = bucketLink[v] {
|
u := evalOrig(v, ancestor, semi, label)
|
if semi[u] < semi[v] {
|
idom[v] = fromID[u]
|
} else {
|
idom[v] = fromID[parent[w]]
|
}
|
}
|
}
|
// step 4 in toplas paper
|
for i := ID(2); i <= n; i++ {
|
w := vertex[i]
|
if idom[w].ID != vertex[semi[w]] {
|
idom[w] = idom[idom[w].ID]
|
}
|
}
|
|
return idom
|
}
|
|
// dfs performs a depth first search over the blocks starting at entry block
|
// (in arbitrary order). This is a de-recursed version of dfs from the
|
// original Tarjan-Lengauer TOPLAS article. It's important to return the
|
// same values for parent as the original algorithm.
|
func (f *Func) dfsOrig(entry *Block, succFn linkedBlocks, semi, vertex, label, parent []ID) ID {
|
n := ID(0)
|
s := make([]*Block, 0, 256)
|
s = append(s, entry)
|
|
for len(s) > 0 {
|
v := s[len(s)-1]
|
s = s[:len(s)-1]
|
// recursing on v
|
|
if semi[v.ID] != 0 {
|
continue // already visited
|
}
|
n++
|
semi[v.ID] = n
|
vertex[n] = v.ID
|
label[v.ID] = v.ID
|
// ancestor[v] already zero
|
for _, e := range succFn(v) {
|
w := e.b
|
// if it has a dfnum, we've already visited it
|
if semi[w.ID] == 0 {
|
// yes, w can be pushed multiple times.
|
s = append(s, w)
|
parent[w.ID] = v.ID // keep overwriting this till it is visited.
|
}
|
}
|
}
|
return n
|
}
|
|
// compressOrig is the "simple" compress function from LT paper
|
func compressOrig(v ID, ancestor, semi, label []ID) {
|
if ancestor[ancestor[v]] != 0 {
|
compressOrig(ancestor[v], ancestor, semi, label)
|
if semi[label[ancestor[v]]] < semi[label[v]] {
|
label[v] = label[ancestor[v]]
|
}
|
ancestor[v] = ancestor[ancestor[v]]
|
}
|
}
|
|
// evalOrig is the "simple" eval function from LT paper
|
func evalOrig(v ID, ancestor, semi, label []ID) ID {
|
if ancestor[v] == 0 {
|
return v
|
}
|
compressOrig(v, ancestor, semi, label)
|
return label[v]
|
}
|
|
func linkOrig(v, w ID, ancestor []ID) {
|
ancestor[w] = v
|
}
|
|
// dominators computes the dominator tree for f. It returns a slice
|
// which maps block ID to the immediate dominator of that block.
|
// Unreachable blocks map to nil. The entry block maps to nil.
|
func dominatorsSimple(f *Func) []*Block {
|
// A simple algorithm for now
|
// Cooper, Harvey, Kennedy
|
idom := make([]*Block, f.NumBlocks())
|
|
// Compute postorder walk
|
post := f.postorder()
|
|
// Make map from block id to order index (for intersect call)
|
postnum := make([]int, f.NumBlocks())
|
for i, b := range post {
|
postnum[b.ID] = i
|
}
|
|
// Make the entry block a self-loop
|
idom[f.Entry.ID] = f.Entry
|
if postnum[f.Entry.ID] != len(post)-1 {
|
f.Fatalf("entry block %v not last in postorder", f.Entry)
|
}
|
|
// Compute relaxation of idom entries
|
for {
|
changed := false
|
|
for i := len(post) - 2; i >= 0; i-- {
|
b := post[i]
|
var d *Block
|
for _, e := range b.Preds {
|
p := e.b
|
if idom[p.ID] == nil {
|
continue
|
}
|
if d == nil {
|
d = p
|
continue
|
}
|
d = intersect(d, p, postnum, idom)
|
}
|
if d != idom[b.ID] {
|
idom[b.ID] = d
|
changed = true
|
}
|
}
|
if !changed {
|
break
|
}
|
}
|
// Set idom of entry block to nil instead of itself.
|
idom[f.Entry.ID] = nil
|
return idom
|
}
|
|
// intersect finds the closest dominator of both b and c.
|
// It requires a postorder numbering of all the blocks.
|
func intersect(b, c *Block, postnum []int, idom []*Block) *Block {
|
// TODO: This loop is O(n^2). It used to be used in nilcheck,
|
// see BenchmarkNilCheckDeep*.
|
for b != c {
|
if postnum[b.ID] < postnum[c.ID] {
|
b = idom[b.ID]
|
} else {
|
c = idom[c.ID]
|
}
|
}
|
return b
|
}
|