1 // Copyright 2017 The Go Authors. All rights reserved. 2 // Use of this source code is governed by a BSD-style 3 // license that can be found in the LICENSE file. 4 5 // This implements the write barrier buffer. The write barrier itself 6 // is gcWriteBarrier and is implemented in assembly. 7 // 8 // See mbarrier.go for algorithmic details on the write barrier. This 9 // file deals only with the buffer. 10 // 11 // The write barrier has a fast path and a slow path. The fast path 12 // simply enqueues to a per-P write barrier buffer. It's written in 13 // assembly and doesn't clobber any general purpose registers, so it 14 // doesn't have the usual overheads of a Go call. 15 // 16 // When the buffer fills up, the write barrier invokes the slow path 17 // (wbBufFlush) to flush the buffer to the GC work queues. In this 18 // path, since the compiler didn't spill registers, we spill *all* 19 // registers and disallow any GC safe points that could observe the 20 // stack frame (since we don't know the types of the spilled 21 // registers). 22 23 package runtime 24 25 import ( 26 "internal/goarch" 27 "runtime/internal/atomic" 28 "unsafe" 29 ) 30 31 // testSmallBuf forces a small write barrier buffer to stress write 32 // barrier flushing. 33 const testSmallBuf = false 34 35 // wbBuf is a per-P buffer of pointers queued by the write barrier. 36 // This buffer is flushed to the GC workbufs when it fills up and on 37 // various GC transitions. 38 // 39 // This is closely related to a "sequential store buffer" (SSB), 40 // except that SSBs are usually used for maintaining remembered sets, 41 // while this is used for marking. 42 type wbBuf struct { 43 // next points to the next slot in buf. It must not be a 44 // pointer type because it can point past the end of buf and 45 // must be updated without write barriers. 46 // 47 // This is a pointer rather than an index to optimize the 48 // write barrier assembly. 49 next uintptr 50 51 // end points to just past the end of buf. It must not be a 52 // pointer type because it points past the end of buf and must 53 // be updated without write barriers. 54 end uintptr 55 56 // buf stores a series of pointers to execute write barriers on. 57 buf [wbBufEntries]uintptr 58 } 59 60 const ( 61 // wbBufEntries is the maximum number of pointers that can be 62 // stored in the write barrier buffer. 63 // 64 // This trades latency for throughput amortization. Higher 65 // values amortize flushing overhead more, but increase the 66 // latency of flushing. Higher values also increase the cache 67 // footprint of the buffer. 68 // 69 // TODO: What is the latency cost of this? Tune this value. 70 wbBufEntries = 512 71 72 // Maximum number of entries that we need to ask from the 73 // buffer in a single call. 74 wbMaxEntriesPerCall = 8 75 ) 76 77 // reset empties b by resetting its next and end pointers. 78 func (b *wbBuf) reset() { 79 start := uintptr(unsafe.Pointer(&b.buf[0])) 80 b.next = start 81 if testSmallBuf { 82 // For testing, make the buffer smaller but more than 83 // 1 write barrier's worth, so it tests both the 84 // immediate flush and delayed flush cases. 85 b.end = uintptr(unsafe.Pointer(&b.buf[wbMaxEntriesPerCall+1])) 86 } else { 87 b.end = start + uintptr(len(b.buf))*unsafe.Sizeof(b.buf[0]) 88 } 89 90 if (b.end-b.next)%unsafe.Sizeof(b.buf[0]) != 0 { 91 throw("bad write barrier buffer bounds") 92 } 93 } 94 95 // discard resets b's next pointer, but not its end pointer. 96 // 97 // This must be nosplit because it's called by wbBufFlush. 98 // 99 //go:nosplit 100 func (b *wbBuf) discard() { 101 b.next = uintptr(unsafe.Pointer(&b.buf[0])) 102 } 103 104 // empty reports whether b contains no pointers. 105 func (b *wbBuf) empty() bool { 106 return b.next == uintptr(unsafe.Pointer(&b.buf[0])) 107 } 108 109 // getX returns space in the write barrier buffer to store X pointers. 110 // getX will flush the buffer if necessary. Callers should use this as: 111 // 112 // buf := &getg().m.p.ptr().wbBuf 113 // p := buf.get2() 114 // p[0], p[1] = old, new 115 // ... actual memory write ... 116 // 117 // The caller must ensure there are no preemption points during the 118 // above sequence. There must be no preemption points while buf is in 119 // use because it is a per-P resource. There must be no preemption 120 // points between the buffer put and the write to memory because this 121 // could allow a GC phase change, which could result in missed write 122 // barriers. 123 // 124 // getX must be nowritebarrierrec to because write barriers here would 125 // corrupt the write barrier buffer. It (and everything it calls, if 126 // it called anything) has to be nosplit to avoid scheduling on to a 127 // different P and a different buffer. 128 // 129 //go:nowritebarrierrec 130 //go:nosplit 131 func (b *wbBuf) get1() *[1]uintptr { 132 if b.next+goarch.PtrSize > b.end { 133 wbBufFlush() 134 } 135 p := (*[1]uintptr)(unsafe.Pointer(b.next)) 136 b.next += goarch.PtrSize 137 return p 138 } 139 140 //go:nowritebarrierrec 141 //go:nosplit 142 func (b *wbBuf) get2() *[2]uintptr { 143 if b.next+2*goarch.PtrSize > b.end { 144 wbBufFlush() 145 } 146 p := (*[2]uintptr)(unsafe.Pointer(b.next)) 147 b.next += 2 * goarch.PtrSize 148 return p 149 } 150 151 // wbBufFlush flushes the current P's write barrier buffer to the GC 152 // workbufs. 153 // 154 // This must not have write barriers because it is part of the write 155 // barrier implementation. 156 // 157 // This and everything it calls must be nosplit because 1) the stack 158 // contains untyped slots from gcWriteBarrier and 2) there must not be 159 // a GC safe point between the write barrier test in the caller and 160 // flushing the buffer. 161 // 162 // TODO: A "go:nosplitrec" annotation would be perfect for this. 163 // 164 //go:nowritebarrierrec 165 //go:nosplit 166 func wbBufFlush() { 167 // Note: Every possible return from this function must reset 168 // the buffer's next pointer to prevent buffer overflow. 169 170 if getg().m.dying > 0 { 171 // We're going down. Not much point in write barriers 172 // and this way we can allow write barriers in the 173 // panic path. 174 getg().m.p.ptr().wbBuf.discard() 175 return 176 } 177 178 // Switch to the system stack so we don't have to worry about 179 // safe points. 180 systemstack(func() { 181 wbBufFlush1(getg().m.p.ptr()) 182 }) 183 } 184 185 // wbBufFlush1 flushes p's write barrier buffer to the GC work queue. 186 // 187 // This must not have write barriers because it is part of the write 188 // barrier implementation, so this may lead to infinite loops or 189 // buffer corruption. 190 // 191 // This must be non-preemptible because it uses the P's workbuf. 192 // 193 //go:nowritebarrierrec 194 //go:systemstack 195 func wbBufFlush1(pp *p) { 196 // Get the buffered pointers. 197 start := uintptr(unsafe.Pointer(&pp.wbBuf.buf[0])) 198 n := (pp.wbBuf.next - start) / unsafe.Sizeof(pp.wbBuf.buf[0]) 199 ptrs := pp.wbBuf.buf[:n] 200 201 // Poison the buffer to make extra sure nothing is enqueued 202 // while we're processing the buffer. 203 pp.wbBuf.next = 0 204 205 if useCheckmark { 206 // Slow path for checkmark mode. 207 for _, ptr := range ptrs { 208 shade(ptr) 209 } 210 pp.wbBuf.reset() 211 return 212 } 213 214 // Mark all of the pointers in the buffer and record only the 215 // pointers we greyed. We use the buffer itself to temporarily 216 // record greyed pointers. 217 // 218 // TODO: Should scanobject/scanblock just stuff pointers into 219 // the wbBuf? Then this would become the sole greying path. 220 // 221 // TODO: We could avoid shading any of the "new" pointers in 222 // the buffer if the stack has been shaded, or even avoid 223 // putting them in the buffer at all (which would double its 224 // capacity). This is slightly complicated with the buffer; we 225 // could track whether any un-shaded goroutine has used the 226 // buffer, or just track globally whether there are any 227 // un-shaded stacks and flush after each stack scan. 228 gcw := &pp.gcw 229 pos := 0 230 for _, ptr := range ptrs { 231 if ptr < minLegalPointer { 232 // nil pointers are very common, especially 233 // for the "old" values. Filter out these and 234 // other "obvious" non-heap pointers ASAP. 235 // 236 // TODO: Should we filter out nils in the fast 237 // path to reduce the rate of flushes? 238 continue 239 } 240 obj, span, objIndex := findObject(ptr, 0, 0) 241 if obj == 0 { 242 continue 243 } 244 // TODO: Consider making two passes where the first 245 // just prefetches the mark bits. 246 mbits := span.markBitsForIndex(objIndex) 247 if mbits.isMarked() { 248 continue 249 } 250 mbits.setMarked() 251 252 // Mark span. 253 arena, pageIdx, pageMask := pageIndexOf(span.base()) 254 if arena.pageMarks[pageIdx]&pageMask == 0 { 255 atomic.Or8(&arena.pageMarks[pageIdx], pageMask) 256 } 257 258 if span.spanclass.noscan() { 259 gcw.bytesMarked += uint64(span.elemsize) 260 continue 261 } 262 ptrs[pos] = obj 263 pos++ 264 } 265 266 // Enqueue the greyed objects. 267 gcw.putBatch(ptrs[:pos]) 268 269 pp.wbBuf.reset() 270 } 271