Commit 073297ff authored by David Chase's avatar David Chase

cmd/compile: enhance postorder computation and repair loop finder

Replace derecursed postorder computation with one that
mimics DFS traversal.

Corrected outerinner function in loopfinder

Leave enhanced checks in place.

Change-Id: I657ba5e89c88941028d6d4c72e9f9056e30f1ce8
Reviewed-on: https://go-review.googlesource.com/40872
Run-TryBot: David Chase <drchase@google.com>
Reviewed-by: default avatarKeith Randall <khr@golang.org>
parent e956dcbd
...@@ -638,7 +638,6 @@ var knownFormats = map[string]string{ ...@@ -638,7 +638,6 @@ var knownFormats = map[string]string{
"cmd/compile/internal/ssa.Type %s": "", "cmd/compile/internal/ssa.Type %s": "",
"cmd/compile/internal/ssa.Type %v": "", "cmd/compile/internal/ssa.Type %v": "",
"cmd/compile/internal/ssa.ValAndOff %s": "", "cmd/compile/internal/ssa.ValAndOff %s": "",
"cmd/compile/internal/ssa.markKind %d": "",
"cmd/compile/internal/ssa.rbrank %d": "", "cmd/compile/internal/ssa.rbrank %d": "",
"cmd/compile/internal/ssa.regMask %d": "", "cmd/compile/internal/ssa.regMask %d": "",
"cmd/compile/internal/ssa.register %d": "", "cmd/compile/internal/ssa.register %d": "",
......
...@@ -273,6 +273,23 @@ func checkFunc(f *Func) { ...@@ -273,6 +273,23 @@ func checkFunc(f *Func) {
} }
} }
// Check loop construction
if f.RegAlloc == nil && f.pass != nil { // non-nil pass allows better-targeted debug printing
ln := f.loopnest()
po := f.postorder() // use po to avoid unreachable blocks.
for _, b := range po {
for _, s := range b.Succs {
bb := s.Block()
if ln.b2l[b.ID] == nil && ln.b2l[bb.ID] != nil && bb != ln.b2l[bb.ID].header {
f.Fatalf("block %s not in loop branches to non-header block %s in loop", b.String(), bb.String())
}
if ln.b2l[b.ID] != nil && ln.b2l[bb.ID] != nil && bb != ln.b2l[bb.ID].header && !ln.b2l[b.ID].isWithinOrEq(ln.b2l[bb.ID]) {
f.Fatalf("block %s in loop branches to non-header block %s in non-containing loop", b.String(), bb.String())
}
}
}
}
// Check use counts // Check use counts
uses := make([]int32, f.NumValues()) uses := make([]int32, f.NumValues())
for _, b := range f.Blocks { for _, b := range f.Blocks {
......
...@@ -22,40 +22,42 @@ const ( ...@@ -22,40 +22,42 @@ const (
func postorder(f *Func) []*Block { func postorder(f *Func) []*Block {
return postorderWithNumbering(f, []int32{}) return postorderWithNumbering(f, []int32{})
} }
type blockAndIndex struct {
b *Block
index int // index is the number of successor edges of b that have already been explored.
}
// postorderWithNumbering provides a DFS postordering.
// This seems to make loop-finding more robust.
func postorderWithNumbering(f *Func, ponums []int32) []*Block { func postorderWithNumbering(f *Func, ponums []int32) []*Block {
mark := make([]markKind, f.NumBlocks()) mark := make([]markKind, f.NumBlocks())
// result ordering // result ordering
var order []*Block var order []*Block
// stack of blocks // stack of blocks and next child to visit
var s []*Block var s []blockAndIndex
s = append(s, f.Entry) s = append(s, blockAndIndex{b: f.Entry})
mark[f.Entry.ID] = notExplored mark[f.Entry.ID] = explored
for len(s) > 0 { for len(s) > 0 {
b := s[len(s)-1] tos := len(s) - 1
switch mark[b.ID] { x := s[tos]
case explored: b := x.b
// Children have all been visited. Pop & output block. i := x.index
s = s[:len(s)-1] if i < len(b.Succs) {
mark[b.ID] = done s[tos].index++
bb := b.Succs[i].Block()
if mark[bb.ID] == notFound {
mark[bb.ID] = explored
s = append(s, blockAndIndex{b: bb})
}
} else {
s = s[:tos]
if len(ponums) > 0 { if len(ponums) > 0 {
ponums[b.ID] = int32(len(order)) ponums[b.ID] = int32(len(order))
} }
order = append(order, b) order = append(order, b)
case notExplored:
// Children have not been visited yet. Mark as explored
// and queue any children we haven't seen yet.
mark[b.ID] = explored
for _, e := range b.Succs {
c := e.b
if mark[c.ID] == notFound {
mark[c.ID] = notExplored
s = append(s, c)
}
}
default:
b.Fatalf("bad stack state %v %d", b, mark[b.ID])
} }
} }
return order return order
......
...@@ -454,7 +454,39 @@ func generateDominatorMap(fut fun) map[string]string { ...@@ -454,7 +454,39 @@ func generateDominatorMap(fut fun) map[string]string {
return doms return doms
} }
func TestDominatorsPostTricky(t *testing.T) { func TestDominatorsPostTrickyA(t *testing.T) {
testDominatorsPostTricky(t, "b8", "b11", "b10", "b8", "b14", "b15")
}
func TestDominatorsPostTrickyB(t *testing.T) {
testDominatorsPostTricky(t, "b11", "b8", "b10", "b8", "b14", "b15")
}
func TestDominatorsPostTrickyC(t *testing.T) {
testDominatorsPostTricky(t, "b8", "b11", "b8", "b10", "b14", "b15")
}
func TestDominatorsPostTrickyD(t *testing.T) {
testDominatorsPostTricky(t, "b11", "b8", "b8", "b10", "b14", "b15")
}
func TestDominatorsPostTrickyE(t *testing.T) {
testDominatorsPostTricky(t, "b8", "b11", "b10", "b8", "b15", "b14")
}
func TestDominatorsPostTrickyF(t *testing.T) {
testDominatorsPostTricky(t, "b11", "b8", "b10", "b8", "b15", "b14")
}
func TestDominatorsPostTrickyG(t *testing.T) {
testDominatorsPostTricky(t, "b8", "b11", "b8", "b10", "b15", "b14")
}
func TestDominatorsPostTrickyH(t *testing.T) {
testDominatorsPostTricky(t, "b11", "b8", "b8", "b10", "b15", "b14")
}
func testDominatorsPostTricky(t *testing.T, b7then, b7else, b12then, b12else, b13then, b13else string) {
c := testConfig(t) c := testConfig(t)
fun := c.Fun("b1", fun := c.Fun("b1",
Bloc("b1", Bloc("b1",
...@@ -466,11 +498,11 @@ func TestDominatorsPostTricky(t *testing.T) { ...@@ -466,11 +498,11 @@ func TestDominatorsPostTricky(t *testing.T) {
Bloc("b5", Bloc("b5",
Goto("b7")), Goto("b7")),
Bloc("b7", Bloc("b7",
If("p", "b8", "b11")), If("p", b7then, b7else)),
Bloc("b8", Bloc("b8",
Goto("b13")), Goto("b13")),
Bloc("b13", Bloc("b13",
If("p", "b14", "b15")), If("p", b13then, b13else)),
Bloc("b14", Bloc("b14",
Goto("b10")), Goto("b10")),
Bloc("b15", Bloc("b15",
...@@ -482,7 +514,7 @@ func TestDominatorsPostTricky(t *testing.T) { ...@@ -482,7 +514,7 @@ func TestDominatorsPostTricky(t *testing.T) {
Bloc("b11", Bloc("b11",
Goto("b12")), Goto("b12")),
Bloc("b12", Bloc("b12",
If("p", "b10", "b8")), If("p", b12then, b12else)),
Bloc("b10", Bloc("b10",
Goto("b6")), Goto("b6")),
Bloc("b6", Bloc("b6",
......
...@@ -35,6 +35,9 @@ type loop struct { ...@@ -35,6 +35,9 @@ type loop struct {
func (sdom SparseTree) outerinner(outer, inner *loop) { func (sdom SparseTree) outerinner(outer, inner *loop) {
// There could be other outer loops found in some random order, // There could be other outer loops found in some random order,
// locate the new outer loop appropriately among them. // locate the new outer loop appropriately among them.
// Outer loop headers dominate inner loop headers.
// Use this to put the "new" "outer" loop in the right place.
oldouter := inner.outer oldouter := inner.outer
for oldouter != nil && sdom.isAncestor(outer.header, oldouter.header) { for oldouter != nil && sdom.isAncestor(outer.header, oldouter.header) {
inner = oldouter inner = oldouter
...@@ -44,7 +47,7 @@ func (sdom SparseTree) outerinner(outer, inner *loop) { ...@@ -44,7 +47,7 @@ func (sdom SparseTree) outerinner(outer, inner *loop) {
return return
} }
if oldouter != nil { if oldouter != nil {
outer.outer = oldouter sdom.outerinner(oldouter, outer)
} }
inner.outer = outer inner.outer = outer
...@@ -259,6 +262,18 @@ func (l *loop) LongString() string { ...@@ -259,6 +262,18 @@ func (l *loop) LongString() string {
return fmt.Sprintf("hdr:%s%s%s", l.header, i, o) return fmt.Sprintf("hdr:%s%s%s", l.header, i, o)
} }
func (l *loop) isWithinOrEq(ll *loop) bool {
if ll == nil { // nil means whole program
return true
}
for ; l != nil; l = l.outer {
if l == ll {
return true
}
}
return false
}
// nearestOuterLoop returns the outer loop of loop most nearly // nearestOuterLoop returns the outer loop of loop most nearly
// containing block b; the header must dominate b. loop itself // containing block b; the header must dominate b. loop itself
// is assumed to not be that loop. For acceptable performance, // is assumed to not be that loop. For acceptable performance,
...@@ -278,8 +293,8 @@ func loopnestfor(f *Func) *loopnest { ...@@ -278,8 +293,8 @@ func loopnestfor(f *Func) *loopnest {
// Reducible-loop-nest-finding. // Reducible-loop-nest-finding.
for _, b := range po { for _, b := range po {
if f.pass.debug > 3 { if f.pass != nil && f.pass.debug > 3 {
fmt.Printf("loop finding (0) at %s\n", b) fmt.Printf("loop finding at %s\n", b)
} }
var innermost *loop // innermost header reachable from this block var innermost *loop // innermost header reachable from this block
...@@ -299,6 +314,9 @@ func loopnestfor(f *Func) *loopnest { ...@@ -299,6 +314,9 @@ func loopnestfor(f *Func) *loopnest {
l := b2l[bb.ID] l := b2l[bb.ID]
if sdom.isAncestorEq(bb, b) { // Found a loop header if sdom.isAncestorEq(bb, b) { // Found a loop header
if f.pass != nil && f.pass.debug > 4 {
fmt.Printf("loop finding succ %s of %s is header\n", bb.String(), b.String())
}
if l == nil { if l == nil {
l = &loop{header: bb, isInner: true} l = &loop{header: bb, isInner: true}
loops = append(loops, l) loops = append(loops, l)
...@@ -311,6 +329,13 @@ func loopnestfor(f *Func) *loopnest { ...@@ -311,6 +329,13 @@ func loopnestfor(f *Func) *loopnest {
if l != nil && !sdom.isAncestorEq(l.header, b) { if l != nil && !sdom.isAncestorEq(l.header, b) {
l = l.nearestOuterLoop(sdom, b) l = l.nearestOuterLoop(sdom, b)
} }
if f.pass != nil && f.pass.debug > 4 {
if l == nil {
fmt.Printf("loop finding succ %s of %s has no loop\n", bb.String(), b.String())
} else {
fmt.Printf("loop finding succ %s of %s provides loop with header %s\n", bb.String(), b.String(), l.header.String())
}
}
} }
if l == nil || innermost == l { if l == nil || innermost == l {
...@@ -340,7 +365,7 @@ func loopnestfor(f *Func) *loopnest { ...@@ -340,7 +365,7 @@ func loopnestfor(f *Func) *loopnest {
ln := &loopnest{f: f, b2l: b2l, po: po, sdom: sdom, loops: loops} ln := &loopnest{f: f, b2l: b2l, po: po, sdom: sdom, loops: loops}
// Curious about the loopiness? "-d=ssa/likelyadjust/stats" // Curious about the loopiness? "-d=ssa/likelyadjust/stats"
if f.pass.stats > 0 && len(loops) > 0 { if f.pass != nil && f.pass.stats > 0 && len(loops) > 0 {
ln.assembleChildren() ln.assembleChildren()
ln.calculateDepths() ln.calculateDepths()
ln.findExits() ln.findExits()
...@@ -365,7 +390,7 @@ func loopnestfor(f *Func) *loopnest { ...@@ -365,7 +390,7 @@ func loopnestfor(f *Func) *loopnest {
} }
} }
if f.pass.debug > 1 && len(loops) > 0 { if f.pass != nil && f.pass.debug > 1 && len(loops) > 0 {
fmt.Printf("Loops in %s:\n", f.Name) fmt.Printf("Loops in %s:\n", f.Name)
for _, l := range loops { for _, l := range loops {
fmt.Printf("%s, b=", l.LongString()) fmt.Printf("%s, b=", l.LongString())
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment