cmd/compile: insert scheduling checks on loop backedges

author David Chase <drchase@google.com>

Thu, 10 Nov 2016 21:03:47 +0000 (16:03 -0500)

committer David Chase <drchase@google.com>

Mon, 9 Jan 2017 21:01:29 +0000 (21:01 +0000)
author David Chase <drchase@google.com>
Thu, 10 Nov 2016 21:03:47 +0000 (16:03 -0500)
committer David Chase <drchase@google.com>
Mon, 9 Jan 2017 21:01:29 +0000 (21:01 +0000)
diff --git a/src/cmd/compile/internal/gc/builtin.go b/src/cmd/compile/internal/gc/builtin.go

index e02e2feb016b6498866aeda2462dbae383dddd27..71b323f8a1d1b2796b079578e3b05346d1a6e6dc 100644 (file)
--- a/src/cmd/compile/internal/gc/builtin.go
+++ b/src/cmd/compile/internal/gc/builtin.go
@@ -15,6 +15,7 @@ var runtimeDecls = [...]struct {
         {"panicwrap", funcTag, 7},
         {"gopanic", funcTag, 9},
         {"gorecover", funcTag, 12},
+       {"goschedguarded", funcTag, 5},
         {"printbool", funcTag, 14},
         {"printfloat", funcTag, 16},
         {"printint", funcTag, 18},
diff --git a/src/cmd/compile/internal/gc/builtin/runtime.go b/src/cmd/compile/internal/gc/builtin/runtime.go

index 98e25fefb899c710c28b14f36748be88f5aa9cf5..69511155f4728b431531d51f14139861e9f84b13 100644 (file)
--- a/src/cmd/compile/internal/gc/builtin/runtime.go
+++ b/src/cmd/compile/internal/gc/builtin/runtime.go
@@ -21,6 +21,7 @@ func panicwrap(string, string, string)
  
  func gopanic(interface{})
  func gorecover(*int32) interface{}
+func goschedguarded()
  
  func printbool(bool)
  func printfloat(float64)
diff --git a/src/cmd/compile/internal/gc/ssa.go b/src/cmd/compile/internal/gc/ssa.go

index 55ee3c01dcc50e99dd1b53f84a2387f8c2fc056b..bf483f8416c118860faab62de85a22f8457499e6 100644 (file)
--- a/src/cmd/compile/internal/gc/ssa.go
+++ b/src/cmd/compile/internal/gc/ssa.go
@@ -64,6 +64,9 @@ func buildssa(fn *Node) *ssa.Func {
         s.config = initssa()
         s.f = s.config.NewFunc()
         s.f.Name = name
+       if fn.Func.Pragma&Nosplit != 0 {
+               s.f.NoSplit = true
+       }
         s.exitCode = fn.Func.Exit
         s.panics = map[funcLine]*ssa.Block{}
         s.config.DebugTest = s.config.DebugHashMatch("GOSSAHASH", name)
diff --git a/src/cmd/compile/internal/ssa/compile.go b/src/cmd/compile/internal/ssa/compile.go

index b9ec7eb6b7bddf22b1d712f5812e24f9e12b2367..5b461bac4874476b4cfc8811e17c36d23bac9cff 100644 (file)
--- a/src/cmd/compile/internal/ssa/compile.go
+++ b/src/cmd/compile/internal/ssa/compile.go
@@ -5,6 +5,7 @@
  package ssa
  
  import (
+       "cmd/internal/obj"
         "fmt"
         "log"
         "os"
@@ -349,6 +350,8 @@ var passes = [...]pass{
         {name: "writebarrier", fn: writebarrier, required: true}, // expand write barrier ops
         {name: "fuse", fn: fuse},
         {name: "dse", fn: dse},
+       {name: "insert resched checks", fn: insertLoopReschedChecks,
+               disabled: obj.Preemptibleloops_enabled == 0}, // insert resched checks in loops.
         {name: "tighten", fn: tighten}, // move values closer to their uses
         {name: "lower", fn: lower, required: true},
         {name: "lowered cse", fn: cse},
@@ -378,7 +381,13 @@ type constraint struct {
  }
  
  var passOrder = [...]constraint{
-       // prove reliese on common-subexpression elimination for maximum benefits.
+       // "insert resched checks" uses mem, better to clean out stores first.
+       {"dse", "insert resched checks"},
+       // insert resched checks adds new blocks containing generic instructions
+       {"insert resched checks", "lower"},
+       {"insert resched checks", "tighten"},
+
+       // prove relies on common-subexpression elimination for maximum benefits.
         {"generic cse", "prove"},
         // deadcode after prove to eliminate all new dead blocks.
         {"prove", "generic deadcode"},
diff --git a/src/cmd/compile/internal/ssa/func.go b/src/cmd/compile/internal/ssa/func.go

index 7b2097bcae71aedda8fbbfcc690aa8316dc3038f..df29aa36064f19edd61d93d41858b910923bdced 100644 (file)
--- a/src/cmd/compile/internal/ssa/func.go
+++ b/src/cmd/compile/internal/ssa/func.go
@@ -24,6 +24,7 @@ type Func struct {
         vid        idAlloc     // value ID allocator
  
         scheduled bool // Values in Blocks are in final order
+       NoSplit   bool // true if function is marked as nosplit.  Used by schedule check pass.
  
         // when register allocation is done, maps value ids to locations
         RegAlloc []Location
diff --git a/src/cmd/compile/internal/ssa/loopreschedchecks.go b/src/cmd/compile/internal/ssa/loopreschedchecks.go

new file mode 100644 (file)

index 0000000..8f8055e
--- /dev/null
+++ b/src/cmd/compile/internal/ssa/loopreschedchecks.go
@@ -0,0 +1,517 @@
+// Copyright 2016 The Go Authors. All rights reserved.
+// Use of this source code is governed by a BSD-style
+// license that can be found in the LICENSE file.
+
+package ssa
+
+import "fmt"
+
+// an edgeMemCtr records a backedge, together with the memory and
+// counter phi functions at the target of the backedge that must
+// be updated when a rescheduling check replaces the backedge.
+type edgeMemCtr struct {
+       e Edge
+       m *Value // phi for memory at dest of e
+       c *Value // phi for counter at dest of e
+}
+
+// a rewriteTarget is a a value-argindex pair indicating
+// where a rewrite is applied.  Note that this is for values,
+// not for block controls, because block controls are not targets
+// for the rewrites performed in inserting rescheduling checks.
+type rewriteTarget struct {
+       v *Value
+       i int
+}
+
+type rewrite struct {
+       before, after *Value          // before is the expected value before rewrite, after is the new value installed.
+       rewrites      []rewriteTarget // all the targets for this rewrite.
+}
+
+func (r *rewrite) String() string {
+       s := "\n\tbefore=" + r.before.String() + ", after=" + r.after.String()
+       for _, rw := range r.rewrites {
+               s += ", (i=" + fmt.Sprint(rw.i) + ", v=" + rw.v.LongString() + ")"
+       }
+       s += "\n"
+       return s
+}
+
+const initialRescheduleCounterValue = 1021 // Largest 10-bit prime. 97 nSec loop bodies will check every 100 uSec.
+
+// insertLoopReschedChecks inserts rescheduling checks on loop backedges.
+func insertLoopReschedChecks(f *Func) {
+       // TODO: when split information is recorded in export data, insert checks only on backedges that can be reached on a split-call-free path.
+
+       // Loop reschedule checks decrement a per-function counter
+       // shared by all loops, and when the counter becomes non-positive
+       // a call is made to a rescheduling check in the runtime.
+       //
+       // Steps:
+       // 1. locate backedges.
+       // 2. Record memory definitions at block end so that
+       //    the SSA graph for mem can be prperly modified.
+       // 3. Define a counter and record its future uses (at backedges)
+       //    (Same process as 2, applied to a single definition of the counter.
+       //     difference for mem is that there are zero-to-many existing mem
+       //     definitions, versus exactly one for the new counter.)
+       // 4. Ensure that phi functions that will-be-needed for mem and counter
+       //    are present in the graph, initially with trivial inputs.
+       // 5. Record all to-be-modified uses of mem and counter;
+       //    apply modifications (split into two steps to simplify and
+       //    avoided nagging order-dependences).
+       // 6. Rewrite backedges to include counter check, reschedule check,
+       //    and modify destination phi function appropriately with new
+       //    definitions for mem and counter.
+
+       if f.NoSplit { // nosplit functions don't reschedule.
+               return
+       }
+
+       backedges := backedges(f)
+       if len(backedges) == 0 { // no backedges means no rescheduling checks.
+               return
+       }
+
+       lastMems := findLastMems(f)
+
+       idom := f.Idom()
+       sdom := f.sdom()
+
+       if f.pass.debug > 2 {
+               fmt.Printf("before %s = %s\n", f.Name, sdom.treestructure(f.Entry))
+       }
+
+       tofixBackedges := []edgeMemCtr{}
+
+       for _, e := range backedges { // TODO: could filter here by calls in loops, if declared and inferred nosplit are recorded in export data.
+               tofixBackedges = append(tofixBackedges, edgeMemCtr{e, nil, nil})
+       }
+
+       // It's possible that there is no memory state (no global/pointer loads/stores or calls)
+       if lastMems[f.Entry.ID] == nil {
+               lastMems[f.Entry.ID] = f.Entry.NewValue0(f.Entry.Line, OpInitMem, TypeMem)
+       }
+
+       memDefsAtBlockEnds := make([]*Value, f.NumBlocks()) // For each block, the mem def seen at its bottom. Could be from earlier block.
+
+       // Propagate last mem definitions forward through successor blocks.
+       po := f.postorder()
+       for i := len(po) - 1; i >= 0; i-- {
+               b := po[i]
+               mem := lastMems[b.ID]
+               for j := 0; mem == nil; j++ { // if there's no def, then there's no phi, so the visible mem is identical in all predecessors.
+                       // loop because there might be backedges that haven't been visited yet.
+                       mem = memDefsAtBlockEnds[b.Preds[j].b.ID]
+               }
+               memDefsAtBlockEnds[b.ID] = mem
+       }
+
+       // Set up counter.  There are no phis etc pre-existing for it.
+       counter0 := f.Entry.NewValue0I(f.Entry.Line, OpConst32, f.Config.fe.TypeInt32(), initialRescheduleCounterValue)
+       ctrDefsAtBlockEnds := make([]*Value, f.NumBlocks()) // For each block, def visible at its end, if that def will be used.
+
+       // There's a minor difference between memDefsAtBlockEnds and ctrDefsAtBlockEnds;
+       // because the counter only matter for loops and code that reaches them, it is nil for blocks where the ctr is no
+       // longer live.  This will avoid creation of dead phi functions.  This optimization is ignored for the mem variable
+       // because it is harder and also less likely to be helpful, though dead code elimination ought to clean this out anyhow.
+
+       for _, emc := range tofixBackedges {
+               e := emc.e
+               // set initial uses of counter zero (note available-at-bottom and use are the same thing initially.)
+               // each back-edge will be rewritten to include a reschedule check, and that will use the counter.
+               src := e.b.Preds[e.i].b
+               ctrDefsAtBlockEnds[src.ID] = counter0
+       }
+
+       // Push uses towards root
+       for _, b := range f.postorder() {
+               bd := ctrDefsAtBlockEnds[b.ID]
+               if bd == nil {
+                       continue
+               }
+               for _, e := range b.Preds {
+                       p := e.b
+                       if ctrDefsAtBlockEnds[p.ID] == nil {
+                               ctrDefsAtBlockEnds[p.ID] = bd
+                       }
+               }
+       }
+
+       // Maps from block to newly-inserted phi function in block.
+       newmemphis := make(map[*Block]rewrite)
+       newctrphis := make(map[*Block]rewrite)
+
+       // Insert phi functions as necessary for future changes to flow graph.
+       for i, emc := range tofixBackedges {
+               e := emc.e
+               h := e.b
+
+               // find the phi function for the memory input at "h", if there is one.
+               var headerMemPhi *Value // look for header mem phi
+
+               for _, v := range h.Values {
+                       if v.Op == OpPhi && v.Type.IsMemory() {
+                               headerMemPhi = v
+                       }
+               }
+
+               if headerMemPhi == nil {
+                       // if the header is nil, make a trivial phi from the dominator
+                       mem0 := memDefsAtBlockEnds[idom[h.ID].ID]
+                       headerMemPhi = newPhiFor(h, mem0)
+                       newmemphis[h] = rewrite{before: mem0, after: headerMemPhi}
+                       addDFphis(mem0, h, h, f, memDefsAtBlockEnds, newmemphis)
+
+               }
+               tofixBackedges[i].m = headerMemPhi
+
+               var headerCtrPhi *Value
+               rw, ok := newctrphis[h]
+               if !ok {
+                       headerCtrPhi = newPhiFor(h, counter0)
+                       newctrphis[h] = rewrite{before: counter0, after: headerCtrPhi}
+                       addDFphis(counter0, h, h, f, ctrDefsAtBlockEnds, newctrphis)
+               } else {
+                       headerCtrPhi = rw.after
+               }
+               tofixBackedges[i].c = headerCtrPhi
+       }
+
+       rewriteNewPhis(f.Entry, f.Entry, f, memDefsAtBlockEnds, newmemphis)
+       rewriteNewPhis(f.Entry, f.Entry, f, ctrDefsAtBlockEnds, newctrphis)
+
+       if f.pass.debug > 0 {
+               for b, r := range newmemphis {
+                       fmt.Printf("b=%s, rewrite=%s\n", b, r.String())
+               }
+
+               for b, r := range newctrphis {
+                       fmt.Printf("b=%s, rewrite=%s\n", b, r.String())
+               }
+       }
+
+       // Apply collected rewrites.
+       for _, r := range newmemphis {
+               for _, rw := range r.rewrites {
+                       rw.v.SetArg(rw.i, r.after)
+               }
+       }
+
+       for _, r := range newctrphis {
+               for _, rw := range r.rewrites {
+                       rw.v.SetArg(rw.i, r.after)
+               }
+       }
+
+       zero := f.Entry.NewValue0I(f.Entry.Line, OpConst32, f.Config.fe.TypeInt32(), 0)
+       one := f.Entry.NewValue0I(f.Entry.Line, OpConst32, f.Config.fe.TypeInt32(), 1)
+
+       // Rewrite backedges to include reschedule checks.
+       for _, emc := range tofixBackedges {
+               e := emc.e
+               headerMemPhi := emc.m
+               headerCtrPhi := emc.c
+               h := e.b
+               i := e.i
+               p := h.Preds[i]
+               bb := p.b
+               mem0 := headerMemPhi.Args[i]
+               ctr0 := headerCtrPhi.Args[i]
+               // bb e->p h,
+               // Because we're going to insert a rare-call, make sure the
+               // looping edge still looks likely.
+               likely := BranchLikely
+               if p.i != 0 {
+                       likely = BranchUnlikely
+               }
+               bb.Likely = likely
+
+               // rewrite edge to include reschedule check
+               // existing edges:
+               //
+               // bb.Succs[p.i] == Edge{h, i}
+               // h.Preds[i] == p == Edge{bb,p.i}
+               //
+               // new block(s):
+               // test:
+               //    ctr1 := ctr0 - 1
+               //    if ctr1 <= 0 { goto sched }
+               //    goto join
+               // sched:
+               //    mem1 := call resched (mem0)
+               //    goto join
+               // join:
+               //    ctr2 := phi(ctr1, counter0) // counter0 is the constant
+               //    mem2 := phi(mem0, mem1)
+               //    goto h
+               //
+               // and correct arg i of headerMemPhi and headerCtrPhi
+               //
+               // EXCEPT: block containing only phi functions is bad
+               // for the register allocator.  Therefore, there is no
+               // join, and instead branches targeting join instead target
+               // the header, and the other phi functions within header are
+               // adjusted for the additional input.
+
+               test := f.NewBlock(BlockIf)
+               sched := f.NewBlock(BlockPlain)
+
+               test.Line = bb.Line
+               sched.Line = bb.Line
+
+               //    ctr1 := ctr0 - 1
+               //    if ctr1 <= 0 { goto sched }
+               //    goto header
+               ctr1 := test.NewValue2(bb.Line, OpSub32, f.Config.fe.TypeInt32(), ctr0, one)
+               cmp := test.NewValue2(bb.Line, OpLeq32, f.Config.fe.TypeBool(), ctr1, zero)
+               test.SetControl(cmp)
+               test.AddEdgeTo(sched) // if true
+               // if false -- rewrite edge to header.
+               // do NOT remove+add, because that will perturb all the other phi functions
+               // as well as messing up other edges to the header.
+               test.Succs = append(test.Succs, Edge{h, i})
+               h.Preds[i] = Edge{test, 1}
+               headerMemPhi.SetArg(i, mem0)
+               headerCtrPhi.SetArg(i, ctr1)
+
+               test.Likely = BranchUnlikely
+
+               // sched:
+               //    mem1 := call resched (mem0)
+               //    goto header
+               resched := f.Config.fe.Syslook("goschedguarded")
+               mem1 := sched.NewValue1A(bb.Line, OpStaticCall, TypeMem, resched, mem0)
+               sched.AddEdgeTo(h)
+               headerMemPhi.AddArg(mem1)
+               headerCtrPhi.AddArg(counter0)
+
+               bb.Succs[p.i] = Edge{test, 0}
+               test.Preds = append(test.Preds, Edge{bb, p.i})
+
+               // Must correct all the other phi functions in the header for new incoming edge.
+               // Except for mem and counter phis, it will be the same value seen on the original
+               // backedge at index i.
+               for _, v := range h.Values {
+                       if v.Op == OpPhi && v != headerMemPhi && v != headerCtrPhi {
+                               v.AddArg(v.Args[i])
+                       }
+               }
+       }
+
+       f.invalidateCFG()
+
+       if f.pass.debug > 2 {
+               sdom = newSparseTree(f, f.Idom())
+               fmt.Printf("after %s = %s\n", f.Name, sdom.treestructure(f.Entry))
+       }
+
+       return
+}
+
+// newPhiFor inserts a new Phi function into b,
+// with all inputs set to v.
+func newPhiFor(b *Block, v *Value) *Value {
+       phiV := b.NewValue0(b.Line, OpPhi, v.Type)
+
+       for range b.Preds {
+               phiV.AddArg(v)
+       }
+       return phiV
+}
+
+// rewriteNewPhis updates newphis[h] to record all places where the new phi function inserted
+// in block h will replace a previous definition.  Block b is the block currently being processed;
+// if b has its own phi definition then it takes the place of h.
+// defsForUses provides information about other definitions of the variable that are present
+// (and if nil, indicates that the variable is no longer live)
+func rewriteNewPhis(h, b *Block, f *Func, defsForUses []*Value, newphis map[*Block]rewrite) {
+       // If b is a block with a new phi, then a new rewrite applies below it in the dominator tree.
+       if _, ok := newphis[b]; ok {
+               h = b
+       }
+       change := newphis[h]
+       x := change.before
+       y := change.after
+
+       // Apply rewrites to this block
+       if x != nil { // don't waste time on the common case of no definition.
+               p := &change.rewrites
+               for _, v := range b.Values {
+                       if v == y { // don't rewrite self -- phi inputs are handled below.
+                               continue
+                       }
+                       for i, w := range v.Args {
+                               if w != x {
+                                       continue
+                               }
+                               *p = append(*p, rewriteTarget{v, i})
+                       }
+               }
+
+               // Rewrite appropriate inputs of phis reached in successors
+               // in dominance frontier, self, and dominated.
+               // If the variable def reaching uses in b is itself defined in b, then the new phi function
+               // does not reach the successors of b.  (This assumes a bit about the structure of the
+               // phi use-def graph, but it's true for memory and the inserted counter.)
+               if dfu := defsForUses[b.ID]; dfu != nil && dfu.Block != b {
+                       for _, e := range b.Succs {
+                               s := e.b
+                               if sphi, ok := newphis[s]; ok { // saves time to find the phi this way.
+                                       *p = append(*p, rewriteTarget{sphi.after, e.i})
+                                       continue
+                               }
+                               for _, v := range s.Values {
+                                       if v.Op == OpPhi && v.Args[e.i] == x {
+                                               *p = append(*p, rewriteTarget{v, e.i})
+                                               break
+                                       }
+                               }
+                       }
+               }
+               newphis[h] = change
+       }
+
+       sdom := f.sdom()
+
+       for c := sdom[b.ID].child; c != nil; c = sdom[c.ID].sibling {
+               rewriteNewPhis(h, c, f, defsForUses, newphis) // TODO: convert to explicit stack from recursion.
+       }
+}
+
+// addDFphis creates new trivial phis that are necessary to correctly reflect (within SSA)
+// a new definition for variable "x" inserted at h (usually but not necessarily a phi).
+// These new phis can only occur at the dominance frontier of h; block s is in the dominance
+// frontier of h if h does not strictly dominate s and if s is a successor of a block b where
+// either b = h or h strictly dominates b.
+// These newly created phis are themselves new definitions that may require addition of their
+// own trivial phi functions in their own dominance frontier, and this is handled recursively.
+func addDFphis(x *Value, h, b *Block, f *Func, defForUses []*Value, newphis map[*Block]rewrite) {
+       oldv := defForUses[b.ID]
+       if oldv != x { // either a new definition replacing x, or nil if it is proven that there are no uses reachable from b
+               return
+       }
+       sdom := f.sdom()
+       idom := f.Idom()
+outer:
+       for _, e := range b.Succs {
+               s := e.b
+               // check phi functions in the dominance frontier
+               if sdom.isAncestor(h, s) {
+                       continue // h dominates s, successor of b, therefore s is not in the frontier.
+               }
+               if _, ok := newphis[s]; ok {
+                       continue // successor s of b already has a new phi function, so there is no need to add another.
+               }
+               if x != nil {
+                       for _, v := range s.Values {
+                               if v.Op == OpPhi && v.Args[e.i] == x {
+                                       continue outer // successor s of b has an old phi function, so there is no need to add another.
+                               }
+                       }
+               }
+
+               old := defForUses[idom[s.ID].ID] // new phi function is correct-but-redundant, combining value "old" on all inputs.
+               headerPhi := newPhiFor(s, old)
+               // the new phi will replace "old" in block s and all blocks dominated by s.
+               newphis[s] = rewrite{before: old, after: headerPhi} // record new phi, to have inputs labeled "old" rewritten to "headerPhi"
+               addDFphis(old, s, s, f, defForUses, newphis)        // the new definition may also create new phi functions.
+       }
+       for c := sdom[b.ID].child; c != nil; c = sdom[c.ID].sibling {
+               addDFphis(x, h, c, f, defForUses, newphis) // TODO: convert to explicit stack from recursion.
+       }
+}
+
+// findLastMems maps block ids to last memory-output op in a block, if any
+func findLastMems(f *Func) []*Value {
+
+       var stores []*Value
+       lastMems := make([]*Value, f.NumBlocks())
+       storeUse := f.newSparseSet(f.NumValues())
+       defer f.retSparseSet(storeUse)
+       for _, b := range f.Blocks {
+               // Find all the stores in this block. Categorize their uses:
+               //  storeUse contains stores which are used by a subsequent store.
+               storeUse.clear()
+               stores = stores[:0]
+               var memPhi *Value
+               for _, v := range b.Values {
+                       if v.Op == OpPhi {
+                               if v.Type.IsMemory() {
+                                       memPhi = v
+                               }
+                               continue
+                       }
+                       if v.Type.IsMemory() {
+                               stores = append(stores, v)
+                               if v.Op == OpSelect1 {
+                                       // Use the arg of the tuple-generating op.
+                                       v = v.Args[0]
+                               }
+                               for _, a := range v.Args {
+                                       if a.Block == b && a.Type.IsMemory() {
+                                               storeUse.add(a.ID)
+                                       }
+                               }
+                       }
+               }
+               if len(stores) == 0 {
+                       lastMems[b.ID] = memPhi
+                       continue
+               }
+
+               // find last store in the block
+               var last *Value
+               for _, v := range stores {
+                       if storeUse.contains(v.ID) {
+                               continue
+                       }
+                       if last != nil {
+                               b.Fatalf("two final stores - simultaneous live stores %s %s", last, v)
+                       }
+                       last = v
+               }
+               if last == nil {
+                       b.Fatalf("no last store found - cycle?")
+               }
+               lastMems[b.ID] = last
+       }
+       return lastMems
+}
+
+type backedgesState struct {
+       b *Block
+       i int
+}
+
+// backedges returns a slice of successor edges that are back
+// edges.  For reducible loops, edge.b is the header.
+func backedges(f *Func) []Edge {
+       edges := []Edge{}
+       mark := make([]markKind, f.NumBlocks())
+       stack := []backedgesState{}
+
+       mark[f.Entry.ID] = notExplored
+       stack = append(stack, backedgesState{f.Entry, 0})
+
+       for len(stack) > 0 {
+               l := len(stack)
+               x := stack[l-1]
+               if x.i < len(x.b.Succs) {
+                       e := x.b.Succs[x.i]
+                       stack[l-1].i++
+                       s := e.b
+                       if mark[s.ID] == notFound {
+                               mark[s.ID] = notExplored
+                               stack = append(stack, backedgesState{s, 0})
+                       } else if mark[s.ID] == notExplored {
+                               edges = append(edges, e)
+                       }
+               } else {
+                       mark[x.b.ID] = done
+                       stack = stack[0 : l-1]
+               }
+       }
+       return edges
+}
diff --git a/src/cmd/compile/internal/ssa/sparsetree.go b/src/cmd/compile/internal/ssa/sparsetree.go

index 7c82a60d0fa8fc1e26e4660e4370e4d4ca59645e..8e5b9f3e5bd68023bffdcd81beb0ab4b41fecbd1 100644 (file)
--- a/src/cmd/compile/internal/ssa/sparsetree.go
+++ b/src/cmd/compile/internal/ssa/sparsetree.go
@@ -4,7 +4,10 @@
  
  package ssa
  
-import "fmt"
+import (
+       "fmt"
+       "strings"
+)
  
  type SparseTreeNode struct {
         child   *Block
@@ -67,6 +70,34 @@ func newSparseTree(f *Func, parentOf []*Block) SparseTree {
         return t
  }
  
+// treestructure provides a string description of the dominator
+// tree and flow structure of block b and all blocks that it
+// dominates.
+func (t SparseTree) treestructure(b *Block) string {
+       return t.treestructure1(b, 0)
+}
+func (t SparseTree) treestructure1(b *Block, i int) string {
+       s := "\n" + strings.Repeat("\t", i) + b.String() + "->["
+       for i, e := range b.Succs {
+               if i > 0 {
+                       s = s + ","
+               }
+               s = s + e.b.String()
+       }
+       s += "]"
+       if c0 := t[b.ID].child; c0 != nil {
+               s += "("
+               for c := c0; c != nil; c = t[c.ID].sibling {
+                       if c != c0 {
+                               s += " "
+                       }
+                       s += t.treestructure1(c, i+1)
+               }
+               s += ")"
+       }
+       return s
+}
+
  // numberBlock assigns entry and exit numbers for b and b's
  // children in an in-order walk from a gappy sequence, where n
  // is the first number not yet assigned or reserved. N should
diff --git a/src/cmd/internal/obj/go.go b/src/cmd/internal/obj/go.go

index 1852dc74f63b7d4e0f014932d38c9d8f87316210..732ce1963477618250bf68b0cfbba9a1d40d95ee 100644 (file)
--- a/src/cmd/internal/obj/go.go
+++ b/src/cmd/internal/obj/go.go
@@ -13,8 +13,9 @@ import (
  // go-specific code shared across loaders (5l, 6l, 8l).
  
  var (
-       framepointer_enabled int
-       Fieldtrack_enabled   int
+       framepointer_enabled     int
+       Fieldtrack_enabled       int
+       Preemptibleloops_enabled int
  )
  
  // Toolchain experiments.
@@ -27,6 +28,7 @@ var exper = []struct {
  }{
         {"fieldtrack", &Fieldtrack_enabled},
         {"framepointer", &framepointer_enabled},
+       {"preemptibleloops", &Preemptibleloops_enabled},
  }
  
  func addexp(s string) {
diff --git a/src/runtime/proc.go b/src/runtime/proc.go

index 756ce63c2421f13fcf19e0b1e5fdf50400fb15d7..f41672de73a67876b036f6a89068152c8cdf0742 100644 (file)
--- a/src/runtime/proc.go
+++ b/src/runtime/proc.go
@@ -240,6 +240,16 @@ func Gosched() {
         mcall(gosched_m)
  }
  
+var alwaysFalse bool
+
+// goschedguarded does nothing, but is written in a way that guarantees a preemption check in its prologue.
+// Calls to this function are inserted by the compiler in otherwise uninterruptible loops (see insertLoopReschedChecks).
+func goschedguarded() {
+       if alwaysFalse {
+               goschedguarded()
+       }
+}
+
  // Puts the current goroutine into a waiting state and calls unlockf.
  // If unlockf returns false, the goroutine is resumed.
  // unlockf must not access this G's stack, as it may be moved between
diff --git a/test/fixedbugs/issue10958.go b/test/fixedbugs/issue10958.go

new file mode 100644 (file)

index 0000000..abbd649
--- /dev/null
+++ b/test/fixedbugs/issue10958.go
@@ -0,0 +1,86 @@
+// +build !nacl
+// buildrun -t 2  -gcflags=-d=ssa/insert_resched_checks/on,ssa/check/on
+
+// Copyright 2016 The Go Authors. All rights reserved.
+// Use of this source code is governed by a BSD-style
+// license that can be found in the LICENSE file.
+
+// This checks to see that call-free infinite loops do not
+// block garbage collection.
+
+package main
+
+import (
+       "runtime"
+)
+
+var someglobal1 int
+var someglobal2 int
+var someglobal3 int
+
+//go:noinline
+func f() {}
+
+func standinacorner1() {
+       for someglobal1&1 == 0 {
+               someglobal1++
+               someglobal1++
+       }
+}
+
+func standinacorner2(i int) {
+       // contains an irreducible loop containing changes to memory
+       if i != 0 {
+               goto midloop
+       }
+
+loop:
+       if someglobal2&1 != 0 {
+               goto done
+       }
+       someglobal2++
+midloop:
+       someglobal2++
+       goto loop
+
+done:
+       return
+}
+
+func standinacorner3() {
+       for someglobal3&1 == 0 {
+               if someglobal3&2 != 0 {
+                       for someglobal3&3 == 2 {
+                               someglobal3++
+                               someglobal3++
+                               someglobal3++
+                               someglobal3++
+                       }
+               }
+               someglobal3++
+               someglobal3++
+               someglobal3++
+               someglobal3++
+       }
+}
+
+func main() {
+       go standinacorner1()
+       go standinacorner2(0)
+       go standinacorner3()
+       // println("About to stand in a corner1")
+       for someglobal1 == 0 {
+               runtime.Gosched()
+       }
+       // println("About to stand in a corner2")
+       for someglobal2 == 0 {
+               runtime.Gosched()
+       }
+       // println("About to stand in a corner3")
+       for someglobal3 == 0 {
+               runtime.Gosched()
+       }
+       // println("About to GC")
+       runtime.GC()
+       // println("Success")
+}
diff --git a/test/live.go b/test/live.go

index 4fb231cfef9df5838471690da26a1f45ac489232..b23e1509e01da640e33a0023dd41817e02f2116d 100644 (file)
--- a/test/live.go
+++ b/test/live.go
@@ -1,6 +1,7 @@
-// errorcheckwithauto -0 -l -live -wb=0
+// errorcheckwithauto -0 -l -live -wb=0 -d=ssa/insert_resched_checks/off
  // +build !ppc64,!ppc64le
  // ppc64 needs a better tighten pass to make f18 pass
+// rescheduling checks need to be turned off because there are some live variables across the inserted check call
  
  // Copyright 2014 The Go Authors. All rights reserved.
  // Use of this source code is governed by a BSD-style
diff --git a/test/opt_branchlikely.go b/test/opt_branchlikely.go

index 5781253e3edf589770b4973ca951f6d9b82ddad4..84de32179f38a0a4b8e99e729c48a1b1cf8acc44 100644 (file)
--- a/test/opt_branchlikely.go
+++ b/test/opt_branchlikely.go
@@ -1,5 +1,6 @@
  // +build amd64
-// errorcheck -0 -d=ssa/likelyadjust/debug=1
+// errorcheck -0 -d=ssa/likelyadjust/debug=1,ssa/insert_resched_checks/off
+// rescheduling check insertion is turend off because the inserted conditional branches perturb the errorcheck
  
  // Copyright 2016 The Go Authors. All rights reserved.
  // Use of this source code is governed by a BSD-style
diff --git a/test/run.go b/test/run.go

index 0dee6b5caab41a96fde48b1a75ac4bef1f53ecbe..19ca3287651388d34ef71171930e708b6dd9a4af 100644 (file)
--- a/test/run.go
+++ b/test/run.go
@@ -463,6 +463,7 @@ func (t *test) run() {
         }
  
         var args, flags []string
+       var tim int
         wantError := false
         wantAuto := false
         singlefilepkgs := false
@@ -478,7 +479,7 @@ func (t *test) run() {
                 action = "rundir"
         case "cmpout":
                 action = "run" // the run case already looks for <dir>/<test>.out files
-       case "compile", "compiledir", "build", "run", "runoutput", "rundir":
+       case "compile", "compiledir", "build", "run", "buildrun", "runoutput", "rundir":
                 // nothing to do
         case "errorcheckandrundir":
                 wantError = false // should be no error if also will run
@@ -505,6 +506,14 @@ func (t *test) run() {
                         wantError = false
                 case "-s":
                         singlefilepkgs = true
+               case "-t": // timeout in seconds
+                       args = args[1:]
+                       var err error
+                       tim, err = strconv.Atoi(args[0])
+                       if err != nil {
+                               t.err = fmt.Errorf("need number of seconds for -t timeout, got %s instead", args[0])
+                       }
+
                 default:
                         flags = append(flags, args[0])
                 }
@@ -539,7 +548,31 @@ func (t *test) run() {
                 } else {
                         cmd.Env = os.Environ()
                 }
-               err := cmd.Run()
+
+               var err error
+
+               if tim != 0 {
+                       err = cmd.Start()
+                       // This command-timeout code adapted from cmd/go/test.go
+                       if err == nil {
+                               tick := time.NewTimer(time.Duration(tim) * time.Second)
+                               done := make(chan error)
+                               go func() {
+                                       done <- cmd.Wait()
+                               }()
+                               select {
+                               case err = <-done:
+                                       // ok
+                               case <-tick.C:
+                                       cmd.Process.Kill()
+                                       err = <-done
+                                       // err = errors.New("Test timeout")
+                               }
+                               tick.Stop()
+                       }
+               } else {
+                       err = cmd.Run()
+               }
                 if err != nil {
                         err = fmt.Errorf("%s\n%s", err, buf.Bytes())
                 }
@@ -671,6 +704,32 @@ func (t *test) run() {
                         t.err = err
                 }
  
+       case "buildrun": // build binary, then run binary, instead of go run. Useful for timeout tests where failure mode is infinite loop.
+               // TODO: not supported on NaCl
+               useTmp = true
+               cmd := []string{"go", "build", "-o", "a.exe"}
+               if *linkshared {
+                       cmd = append(cmd, "-linkshared")
+               }
+               longdirgofile := filepath.Join(filepath.Join(cwd, t.dir), t.gofile)
+               cmd = append(cmd, flags...)
+               cmd = append(cmd, longdirgofile)
+               out, err := runcmd(cmd...)
+               if err != nil {
+                       t.err = err
+                       return
+               }
+               cmd = []string{"./a.exe"}
+               out, err = runcmd(append(cmd, args...)...)
+               if err != nil {
+                       t.err = err
+                       return
+               }
+
+               if strings.Replace(string(out), "\r\n", "\n", -1) != t.expectedOutput() {
+                       t.err = fmt.Errorf("incorrect output\n%s", out)
+               }
+
         case "run":
                 useTmp = false
                 cmd := []string{"go", "run"}
author	David Chase <drchase@google.com>
	Thu, 10 Nov 2016 21:03:47 +0000 (16:03 -0500)
committer	David Chase <drchase@google.com>
	Mon, 9 Jan 2017 21:01:29 +0000 (21:01 +0000)
src/cmd/compile/internal/gc/builtin.go		patch \| blob \| history
src/cmd/compile/internal/gc/builtin/runtime.go		patch \| blob \| history
src/cmd/compile/internal/gc/ssa.go		patch \| blob \| history
src/cmd/compile/internal/ssa/compile.go		patch \| blob \| history
src/cmd/compile/internal/ssa/func.go		patch \| blob \| history
src/cmd/compile/internal/ssa/loopreschedchecks.go	[new file with mode: 0644]	patch \| blob
src/cmd/compile/internal/ssa/sparsetree.go		patch \| blob \| history
src/cmd/internal/obj/go.go		patch \| blob \| history
src/runtime/proc.go		patch \| blob \| history
test/fixedbugs/issue10958.go	[new file with mode: 0644]	patch \| blob
test/live.go		patch \| blob \| history
test/opt_branchlikely.go		patch \| blob \| history
test/run.go		patch \| blob \| history