runtime: make runtime.GC() trigger a concurrent GC

author Austin Clements <austin@google.com>

Fri, 24 Feb 2017 02:50:19 +0000 (21:50 -0500)

committer Austin Clements <austin@google.com>

Fri, 31 Mar 2017 01:15:21 +0000 (01:15 +0000)
author Austin Clements <austin@google.com>
Fri, 24 Feb 2017 02:50:19 +0000 (21:50 -0500)
committer Austin Clements <austin@google.com>
Fri, 31 Mar 2017 01:15:21 +0000 (01:15 +0000)
diff --git a/src/runtime/mgc.go b/src/runtime/mgc.go

index 9f59d8fa75fff04800864fd2c1a66dc68d5ceadd..03a58c3b27755c4642485da21df0b1b63ce67755 100644 (file)
--- a/src/runtime/mgc.go
+++ b/src/runtime/mgc.go
@@ -884,6 +884,19 @@ var work struct {
                 head, tail guintptr
         }
  
+       // sweepWaiters is a list of blocked goroutines to wake when
+       // we transition from mark termination to sweep.
+       sweepWaiters struct {
+               lock mutex
+               head guintptr
+       }
+
+       // cycles is the number of completed GC cycles, where a GC
+       // cycle is sweep termination, mark, mark termination, and
+       // sweep. This differs from memstats.numgc, which is
+       // incremented at mark termination.
+       cycles uint32
+
         // Timing/utilization stats for this cycle.
         stwprocs, maxprocs                 int32
         tSweepTerm, tMark, tMarkTerm, tEnd int64 // nanotime() of phase start
@@ -899,7 +912,94 @@ var work struct {
  // garbage collection is complete. It may also block the entire
  // program.
  func GC() {
-       gcStart(gcForceBlockMode, gcTrigger{kind: gcTriggerAlways})
+       // We consider a cycle to be: sweep termination, mark, mark
+       // termination, and sweep. This function shouldn't return
+       // until a full cycle has been completed, from beginning to
+       // end. Hence, we always want to finish up the current cycle
+       // and start a new one. That means:
+       //
+       // 1. In sweep termination, mark, or mark termination of cycle
+       // N, wait until mark termination N completes and transitions
+       // to sweep N.
+       //
+       // 2. In sweep N, help with sweep N.
+       //
+       // At this point we can begin a full cycle N+1.
+       //
+       // 3. Trigger cycle N+1 by starting sweep termination N+1.
+       //
+       // 4. Wait for mark termination N+1 to complete.
+       //
+       // 5. Help with sweep N+1 until it's done.
+       //
+       // This all has to be written to deal with the fact that the
+       // GC may move ahead on its own. For example, when we block
+       // until mark termination N, we may wake up in cycle N+2.
+
+       gp := getg()
+
+       // Prevent the GC phase or cycle count from changing.
+       lock(&work.sweepWaiters.lock)
+       n := atomic.Load(&work.cycles)
+       if gcphase == _GCmark {
+               // Wait until sweep termination, mark, and mark
+               // termination of cycle N complete.
+               gp.schedlink = work.sweepWaiters.head
+               work.sweepWaiters.head.set(gp)
+               goparkunlock(&work.sweepWaiters.lock, "wait for GC cycle", traceEvGoBlock, 1)
+       } else {
+               // We're in sweep N already.
+               unlock(&work.sweepWaiters.lock)
+       }
+
+       // We're now in sweep N or later. Trigger GC cycle N+1, which
+       // will first finish sweep N if necessary and then enter sweep
+       // termination N+1.
+       gcStart(gcBackgroundMode, gcTrigger{kind: gcTriggerCycle, n: n + 1})
+
+       // Wait for mark termination N+1 to complete.
+       lock(&work.sweepWaiters.lock)
+       if gcphase == _GCmark && atomic.Load(&work.cycles) == n+1 {
+               gp.schedlink = work.sweepWaiters.head
+               work.sweepWaiters.head.set(gp)
+               goparkunlock(&work.sweepWaiters.lock, "wait for GC cycle", traceEvGoBlock, 1)
+       } else {
+               unlock(&work.sweepWaiters.lock)
+       }
+
+       // Finish sweep N+1 before returning. We do this both to
+       // complete the cycle and because runtime.GC() is often used
+       // as part of tests and benchmarks to get the system into a
+       // relatively stable and isolated state.
+       for atomic.Load(&work.cycles) == n+1 && gosweepone() != ^uintptr(0) {
+               sweep.nbgsweep++
+               Gosched()
+       }
+
+       // Callers may assume that the heap profile reflects the
+       // just-completed cycle when this returns (historically this
+       // happened because this was a STW GC), but right now the
+       // profile still reflects mark termination N, not N+1.
+       //
+       // As soon as all of the sweep frees from cycle N+1 are done,
+       // we can go ahead and publish the heap profile.
+       //
+       // First, wait for sweeping to finish. (We know there are no
+       // more spans on the sweep queue, but we may be concurrently
+       // sweeping spans, so we have to wait.)
+       for atomic.Load(&work.cycles) == n+1 && atomic.Load(&mheap_.sweepers) != 0 {
+               Gosched()
+       }
+
+       // Now we're really done with sweeping, so we can publish the
+       // stable heap profile. Only do this if we haven't already hit
+       // another mark termination.
+       mp := acquirem()
+       cycle := atomic.Load(&work.cycles)
+       if cycle == n+1 || (gcphase == _GCmark && cycle == n+2) {
+               mProf_PostSweep()
+       }
+       releasem(mp)
  }
  
  // gcMode indicates how concurrent a GC cycle should be.
@@ -915,7 +1015,8 @@ const (
  // it is an exit condition for the _GCoff phase.
  type gcTrigger struct {
         kind gcTriggerKind
-       now  int64 // gcTriggerTime: current time
+       now  int64  // gcTriggerTime: current time
+       n    uint32 // gcTriggerCycle: cycle number to start
  }
  
  type gcTriggerKind int
@@ -935,6 +1036,11 @@ const (
         // it's been more than forcegcperiod nanoseconds since the
         // previous GC cycle.
         gcTriggerTime
+
+       // gcTriggerCycle indicates that a cycle should be started if
+       // we have not yet started cycle number gcTrigger.n (relative
+       // to work.cycles).
+       gcTriggerCycle
  )
  
  // test returns true if the trigger condition is satisfied, meaning
@@ -956,6 +1062,9 @@ func (t gcTrigger) test() bool {
         case gcTriggerTime:
                 lastgc := int64(atomic.Load64(&memstats.last_gc_nanotime))
                 return lastgc != 0 && t.now-lastgc > forcegcperiod
+       case gcTriggerCycle:
+               // t.n > work.cycles, but accounting for wraparound.
+               return int32(t.n-work.cycles) > 0
         }
         return true
  }
@@ -1003,7 +1112,7 @@ func gcStart(mode gcMode, trigger gcTrigger) {
         }
  
         // For stats, check if this GC was forced by the user.
-       work.userForced = trigger.kind == gcTriggerAlways
+       work.userForced = trigger.kind == gcTriggerAlways || trigger.kind == gcTriggerCycle
  
         // In gcstoptheworld debug mode, upgrade the mode accordingly.
         // We do this after re-checking the transition condition so
@@ -1047,6 +1156,7 @@ func gcStart(mode gcMode, trigger gcTrigger) {
         // reclaimed until the next GC cycle.
         clearpools()
  
+       work.cycles++
         if mode == gcBackgroundMode { // Do as much work concurrently as possible
                 gcController.startCycle()
                 work.heapGoal = memstats.next_gc
@@ -1331,8 +1441,6 @@ func gcMarkTermination() {
         totalCpu := sched.totaltime + (now-sched.procresizetime)*int64(gomaxprocs)
         memstats.gc_cpu_fraction = float64(work.totaltime) / float64(totalCpu)
  
-       memstats.numgc++
-
         // Reset sweep state.
         sweep.nbgsweep = 0
         sweep.npausesweep = 0
@@ -1341,6 +1449,13 @@ func gcMarkTermination() {
                 memstats.numforcedgc++
         }
  
+       // Bump GC cycle count and wake goroutines waiting on sweep.
+       lock(&work.sweepWaiters.lock)
+       memstats.numgc++
+       injectglist(work.sweepWaiters.head.ptr())
+       work.sweepWaiters.head = 0
+       unlock(&work.sweepWaiters.lock)
+
         // Finish the current heap profiling cycle and start a new
         // heap profiling cycle. We do this before starting the world
         // so events don't leak into the wrong cycle.
diff --git a/src/runtime/mprof.go b/src/runtime/mprof.go

index cd781c4416f971ef4608c5060d2aec270c2bc703..2bd09b6a2659a95a4d56a0aa1b0547e8feda9d5d 100644 (file)
--- a/src/runtime/mprof.go
+++ b/src/runtime/mprof.go
@@ -315,6 +315,27 @@ func mProf_FlushLocked() {
         }
  }
  
+// mProf_PostSweep records that all sweep frees for this GC cycle have
+// completed. This has the effect of publishing the heap profile
+// snapshot as of the last mark termination without advancing the heap
+// profile cycle.
+func mProf_PostSweep() {
+       lock(&proflock)
+       // Flush cycle C+1 to the active profile so everything as of
+       // the last mark termination becomes visible. *Don't* advance
+       // the cycle, since we're still accumulating allocs in cycle
+       // C+2, which have to become C+1 in the next mark termination
+       // and so on.
+       c := mProf.cycle
+       for b := mbuckets; b != nil; b = b.allnext {
+               mp := b.mp()
+               mpc := &mp.future[(c+1)%uint32(len(mp.future))]
+               mp.active.add(mpc)
+               *mpc = memRecordCycle{}
+       }
+       unlock(&proflock)
+}
+
  // Called by malloc to record a profiled block.
  func mProf_Malloc(p unsafe.Pointer, size uintptr) {
         var stk [maxStack]uintptr
author	Austin Clements <austin@google.com>
	Fri, 24 Feb 2017 02:50:19 +0000 (21:50 -0500)
committer	Austin Clements <austin@google.com>
	Fri, 31 Mar 2017 01:15:21 +0000 (01:15 +0000)
src/runtime/mgc.go		patch \| blob \| history
src/runtime/mprof.go		patch \| blob \| history