Commit fe67ea32 authored by Michael Anthony Knyszek, committed by Michael Knyszek

runtime: add background scavenger

This change adds a background scavenging goroutine whose pacing is
determined when the heap goal changes. The scavenger is paced to use
at most 1% of the mutator's time for most systems. Furthermore, the
scavenger's pacing is computed based on the estimated number of
scavengable huge pages to take advantage of optimizations provided by
the OS.
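
For intuition, the pacing described above can be sketched as a back-of-the-envelope rate
calculation. The snippet below is an illustrative model only, not the gcPaceScavenger
implementation added by this change; the names and constants (paceScavenger,
costPerHugePageNS, mutatorTimeFraction) are hypothetical.

	// Illustrative only: a simplified model of a time-based scavenge rate.
	// All names and constants here are assumptions for the sketch, not the
	// runtime's actual pacing code.
	package main

	import "fmt"

	const (
		hugePageSize        = 2 << 20 // assumed 2 MiB huge pages
		costPerHugePageNS   = 10e3    // assumed cost to scavenge one huge page, in ns
		mutatorTimeFraction = 0.01    // scavenger may use at most ~1% of the mutator's time
	)

	// paceScavenger returns a bytes-per-nanosecond rate that would release the
	// excess retained memory (retained - goal) while keeping the scavenger's
	// CPU usage near mutatorTimeFraction.
	func paceScavenger(retainedBytes, goalBytes uint64) float64 {
		if retainedBytes <= goalBytes {
			return 0 // at or below the goal RSS; nothing to do
		}
		excess := retainedBytes - goalBytes
		// Estimate the work in huge pages, since the OS-level cost scales with
		// the number of release calls rather than the number of pages.
		hugePages := float64(excess) / hugePageSize
		workNS := hugePages * costPerHugePageNS
		// Spread that work over enough wall-clock time to stay within the CPU
		// budget, then express it as bytes per nanosecond.
		totalNS := workNS / mutatorTimeFraction
		return float64(excess) / totalNS
	}

	func main() {
		// Example: 64 MiB retained against a 32 MiB goal.
		rate := paceScavenger(64<<20, 32<<20)
		fmt.Printf("scavenge at %.2f bytes/ns\n", rate)
	}

The key idea is that the work is estimated in huge pages, because the cost of scavenging
is proportional to the number of sysUnused calls rather than the number of pages released,
and that work is then spread over enough wall-clock time to stay within the roughly 1% CPU
budget.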

The purpose of this scavenger is to deal with a shrinking heap: if the
heap goal is falling over time, the scavenger should kick in and start
returning free pages from the heap to the OS.

Also, now that we have a pacing system, the credit system used by
scavengeLocked has become redundant. Replace it with a mechanism which
only scavenges on the allocation path if it makes sense to do so with
respect to the new pacing system.

Fixes #30333.

Change-Id: I6203f8dc84affb26c3ab04528889dd9663530edc
Reviewed-on: https://go-review.googlesource.com/c/go/+/142960
Run-TryBot: Michael Knyszek <mknyszek@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Austin Clements <austin@google.com>
parent eaa1c87b
src/runtime/mgc.go
@@ -202,10 +202,14 @@ func readgogc() int32 {
 
 // gcenable is called after the bulk of the runtime initialization,
 // just before we're about to start letting user code run.
-// It kicks off the background sweeper goroutine and enables GC.
+// It kicks off the background sweeper goroutine, the background
+// scavenger goroutine, and enables GC.
 func gcenable() {
-	c := make(chan int, 1)
+	// Kick off sweeping and scavenging.
+	c := make(chan int, 2)
 	go bgsweep(c)
+	go bgscavenge(c)
+	<-c
 	<-c
 	memstats.enablegc = true // now that runtime is initialized, GC is okay
 }
@@ -850,6 +854,8 @@ func gcSetTriggerRatio(triggerRatio float64) {
 			atomic.Store64(&mheap_.pagesSweptBasis, pagesSwept)
 		}
 	}
+
+	gcPaceScavenger()
 }
 
 // gcEffectiveGrowthRatio returns the current effective heap growth
(The diff for the new file implementing the background scavenger is collapsed.)
src/runtime/mheap.go
@@ -87,6 +87,25 @@ type mheap struct {
 	// TODO(austin): pagesInUse should be a uintptr, but the 386
 	// compiler can't 8-byte align fields.
 
+	// Scavenger pacing parameters
+	//
+	// The two basis parameters and the scavenge ratio parallel the proportional
+	// sweeping implementation, the primary differences being that:
+	//  * Scavenging concerns itself with RSS, estimated as heapRetained()
+	//  * Rather than pacing the scavenger to the GC, it is paced to a
+	//    time-based rate computed in gcPaceScavenger.
+	//
+	// scavengeRetainedGoal represents our goal RSS.
+	//
+	// All fields must be accessed with lock.
+	//
+	// TODO(mknyszek): Consider abstracting the basis fields and the scavenge ratio
+	// into its own type so that this logic may be shared with proportional sweeping.
+	scavengeTimeBasis     int64
+	scavengeRetainedBasis uint64
+	scavengeBytesPerNS    float64
+	scavengeRetainedGoal  uint64
+
 	// Page reclaimer state
 
 	// reclaimIndex is the page index in allArenas of next page to
@@ -106,14 +125,6 @@ type mheap struct {
 	// This is accessed atomically.
 	reclaimCredit uintptr
 
-	// scavengeCredit is spare credit for extra bytes scavenged.
-	// Since the scavenging mechanisms operate on spans, it may
-	// scavenge more than requested. Any spare pages released
-	// go to this credit pool.
-	//
-	// This is protected by the mheap lock.
-	scavengeCredit uintptr
-
 	// Malloc stats.
 	largealloc  uint64 // bytes allocated for large objects
 	nlargealloc uint64 // number of large object allocations
@@ -172,7 +183,7 @@ type mheap struct {
 	// simply blocking GC (by disabling preemption).
 	sweepArenas []arenaIdx
 
-	// _ uint32 // ensure 64-bit alignment of central
+	_ uint32 // ensure 64-bit alignment of central
 
 	// central free lists for small size classes.
 	// the padding makes sure that the mcentrals are
@@ -1203,12 +1214,12 @@ HaveSpan:
 		// Since we allocated out of a scavenged span, we just
 		// grew the RSS. Mitigate this by scavenging enough free
-		// space to make up for it.
+		// space to make up for it but only if we need to.
 		//
-		// Also, scavenge may cause coalescing, so prevent
+		// scavengeLocked may cause coalescing, so prevent
 		// coalescing with s by temporarily changing its state.
 		s.state = mSpanManual
-		h.scavengeLocked(s.npages*pageSize, true)
+		h.scavengeIfNeededLocked(s.npages * pageSize)
 		s.state = mSpanFree
 	}
@@ -1236,12 +1247,9 @@ func (h *mheap) grow(npage uintptr) bool {
 	}
 
 	// Scavenge some pages out of the free treap to make up for
-	// the virtual memory space we just allocated. We prefer to
-	// scavenge the largest spans first since the cost of scavenging
-	// is proportional to the number of sysUnused() calls rather than
-	// the number of pages released, so we make fewer of those calls
-	// with larger spans.
-	h.scavengeLocked(size, true)
+	// the virtual memory space we just allocated, but only if
+	// we need to.
+	h.scavengeIfNeededLocked(size)
 
 	// Create a fake "in use" span and free it, so that the
 	// right coalescing happens.
@@ -1346,22 +1354,8 @@ func (h *mheap) freeSpanLocked(s *mspan, acctinuse, acctidle bool) {
 // starting from the span with the highest base address and working down.
 // It then takes those spans and places them in scav.
 //
-// useCredit determines whether a scavenging call should use the credit
-// system. In general, useCredit should be true except in special
-// circumstances.
-//
 // Returns the amount of memory scavenged in bytes. h must be locked.
-func (h *mheap) scavengeLocked(nbytes uintptr, useCredit bool) uintptr {
-	// Use up scavenge credit if there's any available.
-	if useCredit {
-		if nbytes > h.scavengeCredit {
-			nbytes -= h.scavengeCredit
-			h.scavengeCredit = 0
-		} else {
-			h.scavengeCredit -= nbytes
-			return nbytes
-		}
-	}
+func (h *mheap) scavengeLocked(nbytes uintptr) uintptr {
 	released := uintptr(0)
 	// Iterate over spans with huge pages first, then spans without.
 	const mask = treapIterScav | treapIterHuge
@@ -1387,13 +1381,24 @@ func (h *mheap) scavengeLocked(nbytes uintptr, useCredit bool) uintptr {
 			h.free.insert(s)
 		}
 	}
-	if useCredit {
-		// If we over-scavenged, turn that extra amount into credit.
-		if released > nbytes {
-			h.scavengeCredit += released - nbytes
-		}
-	}
 	return released
 }
 
+// scavengeIfNeededLocked calls scavengeLocked if we're currently above the
+// scavenge goal in order to prevent the mutator from out-running the
+// scavenger.
+//
+// h must be locked.
+func (h *mheap) scavengeIfNeededLocked(size uintptr) {
+	if r := heapRetained(); r+uint64(size) > h.scavengeRetainedGoal {
+		todo := uint64(size)
+		// If we're only going to go a little bit over, just request what
+		// we actually need done.
+		if overage := r + uint64(size) - h.scavengeRetainedGoal; overage < todo {
+			todo = overage
+		}
+		h.scavengeLocked(uintptr(todo))
+	}
+}
+
 // scavengeAll visits each node in the free treap and scavenges the
@@ -1406,7 +1411,7 @@ func (h *mheap) scavengeAll() {
 	gp := getg()
 	gp.m.mallocing++
 	lock(&h.lock)
-	released := h.scavengeLocked(^uintptr(0), false)
+	released := h.scavengeLocked(^uintptr(0))
 	unlock(&h.lock)
 	gp.m.mallocing--
src/runtime/runtime2.go
@@ -852,6 +852,7 @@ const (
 	waitReasonSelectNoCases   // "select (no cases)"
 	waitReasonGCAssistWait    // "GC assist wait"
 	waitReasonGCSweepWait     // "GC sweep wait"
+	waitReasonGCScavengeWait  // "GC scavenge wait"
 	waitReasonChanReceive     // "chan receive"
 	waitReasonChanSend        // "chan send"
 	waitReasonFinalizerWait   // "finalizer wait"
@@ -879,6 +880,7 @@ var waitReasonStrings = [...]string{
 	waitReasonSelectNoCases:  "select (no cases)",
 	waitReasonGCAssistWait:   "GC assist wait",
 	waitReasonGCSweepWait:    "GC sweep wait",
+	waitReasonGCScavengeWait: "GC scavenge wait",
 	waitReasonChanReceive:    "chan receive",
 	waitReasonChanSend:       "chan send",
 	waitReasonFinalizerWait:  "finalizer wait",