// Copyright 2017 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.

// This implements the write barrier buffer. The write barrier itself
// is gcWriteBarrier and is implemented in assembly.
//
// See mbarrier.go for algorithmic details on the write barrier. This
// file deals only with the buffer.
//
// The write barrier has a fast path and a slow path. The fast path
// simply enqueues to a per-P write barrier buffer. It's written in
// assembly and doesn't clobber any general purpose registers, so it
// doesn't have the usual overheads of a Go call.
//
// When the buffer fills up, the write barrier invokes the slow path
// (wbBufFlush) to flush the buffer to the GC work queues. In this
// path, since the compiler didn't spill registers, we spill *all*
// registers and disallow any GC safe points that could observe the
// stack frame (since we don't know the types of the spilled
// registers).
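
// In Go-like pseudocode, the fast path behaves roughly like get1
// below (a sketch only; the real gcWriteBarrier is per-architecture
// assembly and its exact shape varies):
//
//	buf := &getg().m.p.ptr().wbBuf
//	if buf.next+goarch.PtrSize > buf.end {
//		wbBufFlush() // slow path: spill and flush
//	}
//	*(*uintptr)(unsafe.Pointer(buf.next)) = ptr // enqueue pointer
//	buf.next += goarch.PtrSize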
27 "runtime/internal/atomic"

// testSmallBuf forces a small write barrier buffer to stress write
// barrier flushing.
const testSmallBuf = false

// wbBuf is a per-P buffer of pointers queued by the write barrier.
// This buffer is flushed to the GC workbufs when it fills up and on
// various GC transitions.
//
// This is closely related to a "sequential store buffer" (SSB),
// except that SSBs are usually used for maintaining remembered sets,
// while this is used for marking.
type wbBuf struct {
	// next points to the next slot in buf. It must not be a
	// pointer type because it can point past the end of buf and
	// must be updated without write barriers.
	//
	// This is a pointer rather than an index to optimize the
	// write barrier assembly.
	next uintptr

	// end points to just past the end of buf. It must not be a
	// pointer type because it points past the end of buf and must
	// be updated without write barriers.
	end uintptr

	// buf stores a series of pointers to execute write barriers
	// on.
	buf [wbBufEntries]uintptr
}
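
// As a sketch of how the "various GC transitions" above drain the
// buffers (not the actual transition code, which lives elsewhere in
// the runtime), a transition might do, for each P pp:
//
//	if !pp.wbBuf.empty() {
//		wbBufFlush1(pp)
//	}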

const (
	// wbBufEntries is the maximum number of pointers that can be
	// stored in the write barrier buffer.
	//
	// This trades latency for throughput amortization. Higher
	// values amortize flushing overhead more, but increase the
	// latency of flushing. Higher values also increase the cache
	// footprint of the buffer.
	//
	// TODO: What is the latency cost of this? Tune this value.
	wbBufEntries = 512

	// Maximum number of entries that we need to ask from the
	// buffer in a single call.
	wbMaxEntriesPerCall = 8
)
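
// With wbBufEntries = 512, the buffer itself occupies 512 * 8 = 4096
// bytes (4KiB) per P on 64-bit systems, or 2KiB on 32-bit systems;
// this is the cache footprint the comment above refers to.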

// reset empties b by resetting its next and end pointers.
func (b *wbBuf) reset() {
	start := uintptr(unsafe.Pointer(&b.buf[0]))
	b.next = start
	if testSmallBuf {
		// For testing, make the buffer smaller but more than
		// 1 write barrier's worth, so it tests both the
		// immediate flush and delayed flush cases.
		b.end = uintptr(unsafe.Pointer(&b.buf[wbMaxEntriesPerCall+1]))
	} else {
		b.end = start + uintptr(len(b.buf))*unsafe.Sizeof(b.buf[0])
	}

	if (b.end-b.next)%unsafe.Sizeof(b.buf[0]) != 0 {
		throw("bad write barrier buffer bounds")
	}
}

// discard resets b's next pointer, but not its end pointer.
//
// This must be nosplit because it's called by wbBufFlush.
//
//go:nosplit
func (b *wbBuf) discard() {
	b.next = uintptr(unsafe.Pointer(&b.buf[0]))
}

// empty reports whether b contains no pointers.
func (b *wbBuf) empty() bool {
	return b.next == uintptr(unsafe.Pointer(&b.buf[0]))
}

// getX returns space in the write barrier buffer to store X pointers.
// getX will flush the buffer if necessary. Callers should use this as:
//
//	buf := &getg().m.p.ptr().wbBuf
//	p := buf.get2()
//	p[0], p[1] = old, new
//	... actual memory write ...
//
// The caller must ensure there are no preemption points during the
// above sequence. There must be no preemption points while buf is in
// use because it is a per-P resource. There must be no preemption
// points between the buffer put and the write to memory because this
// could allow a GC phase change, which could result in missed write
// barriers.
//
// getX must be nowritebarrierrec because write barriers here would
// corrupt the write barrier buffer. It (and everything it calls, if
// it called anything) has to be nosplit to avoid scheduling on to a
// different P and a different buffer.
//
//go:nowritebarrierrec
//go:nosplit
func (b *wbBuf) get1() *[1]uintptr {
	if b.next+goarch.PtrSize > b.end {
		wbBufFlush()
	}
	p := (*[1]uintptr)(unsafe.Pointer(b.next))
	b.next += goarch.PtrSize
	return p
}

//go:nowritebarrierrec
//go:nosplit
func (b *wbBuf) get2() *[2]uintptr {
	if b.next+2*goarch.PtrSize > b.end {
		wbBufFlush()
	}
	p := (*[2]uintptr)(unsafe.Pointer(b.next))
	b.next += 2 * goarch.PtrSize
	return p
}

// wbBufFlush flushes the current P's write barrier buffer to the GC
// workbufs.
//
// This must not have write barriers because it is part of the write
// barrier implementation.
//
// This and everything it calls must be nosplit because 1) the stack
// contains untyped slots from gcWriteBarrier and 2) there must not be
// a GC safe point between the write barrier test in the caller and
// flushing the buffer.
//
// TODO: A "go:nosplitrec" annotation would be perfect for this.
//
//go:nowritebarrierrec
//go:nosplit
func wbBufFlush() {
	// Note: Every possible return from this function must reset
	// the buffer's next pointer to prevent buffer overflow.

	if getg().m.dying > 0 {
		// We're going down. Not much point in write barriers
		// and this way we can allow write barriers in the
		// panic path.
		getg().m.p.ptr().wbBuf.discard()
		return
	}

	// Switch to the system stack so we don't have to worry about
	// safe points.
	systemstack(func() {
		wbBufFlush1(getg().m.p.ptr())
	})
}

// wbBufFlush1 flushes p's write barrier buffer to the GC work queue.
//
// This must not have write barriers because it is part of the write
// barrier implementation, so this may lead to infinite loops or
// buffer corruption.
//
// This must be non-preemptible because it uses the P's workbuf.
//
//go:nowritebarrierrec
//go:systemstack
func wbBufFlush1(pp *p) {
	// Get the buffered pointers.
	start := uintptr(unsafe.Pointer(&pp.wbBuf.buf[0]))
	n := (pp.wbBuf.next - start) / unsafe.Sizeof(pp.wbBuf.buf[0])
	ptrs := pp.wbBuf.buf[:n]
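	// (For example, if next points just past buf[4], then n is 5
	// and ptrs covers buf[0] through buf[4].)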

	// Poison the buffer to make extra sure nothing is enqueued
	// while we're processing the buffer.
	pp.wbBuf.next = 0

	if useCheckmark {
		// Slow path for checkmark mode.
		for _, ptr := range ptrs {
			shade(ptr)
		}
		pp.wbBuf.reset()
		return
	}

	// Mark all of the pointers in the buffer and record only the
	// pointers we greyed. We use the buffer itself to temporarily
	// record greyed pointers.
	//
	// TODO: Should scanobject/scanblock just stuff pointers into
	// the wbBuf? Then this would become the sole greying path.
	//
	// TODO: We could avoid shading any of the "new" pointers in
	// the buffer if the stack has been shaded, or even avoid
	// putting them in the buffer at all (which would double its
	// capacity). This is slightly complicated with the buffer; we
	// could track whether any un-shaded goroutine has used the
	// buffer, or just track globally whether there are any
	// un-shaded stacks and flush after each stack scan.
	gcw := &pp.gcw
	pos := 0
	for _, ptr := range ptrs {
		if ptr < minLegalPointer {
			// nil pointers are very common, especially
			// for the "old" values. Filter out these and
			// other "obvious" non-heap pointers ASAP.
			//
			// TODO: Should we filter out nils in the fast
			// path to reduce the rate of flushes?
			continue
		}
		obj, span, objIndex := findObject(ptr, 0, 0)
		if obj == 0 {
			continue
		}
		// TODO: Consider making two passes where the first
		// just prefetches the mark bits.
		mbits := span.markBitsForIndex(objIndex)
		if mbits.isMarked() {
			continue
		}
		mbits.setMarked()

		// Mark span.
		arena, pageIdx, pageMask := pageIndexOf(span.base())
		if arena.pageMarks[pageIdx]&pageMask == 0 {
			atomic.Or8(&arena.pageMarks[pageIdx], pageMask)
		}

		if span.spanclass.noscan() {
			gcw.bytesMarked += uint64(span.elemsize)
			continue
		}
		ptrs[pos] = obj
		pos++
	}

	// Enqueue the greyed objects.
	gcw.putBatch(ptrs[:pos])

	pp.wbBuf.reset()
}