Commit 1b1fbb31 authored by Michael Anthony Knyszek, committed by Michael Knyszek

runtime: use inUse ranges to map in summary memory only as needed

Prior to this change, if the heap was very discontiguous (such as in
TestArenaCollision) it's possible we could map a large amount of memory
as R/W and commit it. We would use only the start and end to track what
should be mapped, and we would extend that mapping as needed to
accommodate a potentially fragmented address space.

After this change, we only map exactly the part of the summary arrays
that we need by using the inUse ranges from the previous change. This
reduces the GCSys footprint of TestArenaCollision from 300 MiB to 18
MiB.

Because summaries are no longer mapped contiguously, this means the
scavenger can no longer iterate directly. This change also updates the
scavenger to borrow ranges out of inUse and iterate over only the
parts of the heap which are actually currently in use. This is both an
optimization and necessary for correctness.

Fixes #35514.

Change-Id: I96bf0c73ed0d2d89a00202ece7b9d089a53bac90
Reviewed-on: https://go-review.googlesource.com/c/go/+/207758
Run-TryBot: Michael Knyszek <mknyszek@google.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Austin Clements <austin@google.com>
parent 6f2b8347
...@@ -578,6 +578,7 @@ func RunGetgThreadSwitchTest() { ...@@ -578,6 +578,7 @@ func RunGetgThreadSwitchTest() {
const ( const (
PageSize = pageSize PageSize = pageSize
PallocChunkPages = pallocChunkPages PallocChunkPages = pallocChunkPages
PageAlloc64Bit = pageAlloc64Bit
) )
// Expose pallocSum for testing. // Expose pallocSum for testing.
......
...@@ -405,15 +405,14 @@ func (s *pageAlloc) scavengeOne(max uintptr, locked bool) uintptr { ...@@ -405,15 +405,14 @@ func (s *pageAlloc) scavengeOne(max uintptr, locked bool) uintptr {
} }
lockHeap() lockHeap()
top := chunkIndex(s.scavAddr) ci := chunkIndex(s.scavAddr)
if top < s.start { if ci < s.start {
unlockHeap() unlockHeap()
return 0 return 0
} }
// Check the chunk containing the scav addr, starting at the addr // Check the chunk containing the scav addr, starting at the addr
// and see if there are any free and unscavenged pages. // and see if there are any free and unscavenged pages.
ci := chunkIndex(s.scavAddr)
if s.summary[len(s.summary)-1][ci].max() >= uint(minPages) { if s.summary[len(s.summary)-1][ci].max() >= uint(minPages) {
// We only bother looking for a candidate if there at least // We only bother looking for a candidate if there at least
// minPages free pages at all. It's important that we only // minPages free pages at all. It's important that we only
...@@ -429,21 +428,50 @@ func (s *pageAlloc) scavengeOne(max uintptr, locked bool) uintptr { ...@@ -429,21 +428,50 @@ func (s *pageAlloc) scavengeOne(max uintptr, locked bool) uintptr {
return uintptr(npages) * pageSize return uintptr(npages) * pageSize
} }
} }
// getInUseRange returns the highest range in the
// intersection of [0, addr] and s.inUse.
//
// s.mheapLock must be held.
getInUseRange := func(addr uintptr) addrRange {
top := s.inUse.findSucc(addr)
if top == 0 {
return addrRange{}
}
r := s.inUse.ranges[top-1]
// addr is inclusive, so treat it as such when
// updating the limit, which is exclusive.
if r.limit > addr+1 {
r.limit = addr + 1
}
return r
}
// Slow path: iterate optimistically over the in-use address space
// looking for any free and unscavenged page. If we think we see something,
// lock and verify it!
//
// We iterate over the address space by taking ranges from inUse.
newRange:
for {
r := getInUseRange(s.scavAddr)
if r.size() == 0 {
break
}
unlockHeap() unlockHeap()
// Slow path: iterate optimistically looking for any free and unscavenged page. // Iterate over all of the chunks described by r.
// If we think we see something, stop and verify it! // Note that r.limit is the exclusive upper bound, but what
for i := top - 1; i >= s.start; i-- { // we want is the top chunk instead, inclusive, so subtract 1.
bot, top := chunkIndex(r.base), chunkIndex(r.limit-1)
for i := top; i >= bot; i-- {
// If this chunk is totally in-use or has no unscavenged pages, don't bother // If this chunk is totally in-use or has no unscavenged pages, don't bother
// doing a more sophisticated check. // doing a more sophisticated check.
// //
// Note we're accessing the summary and the chunks without a lock, but // Note we're accessing the summary and the chunks without a lock, but
// that's fine. We're being optimistic anyway. // that's fine. We're being optimistic anyway.
// Check if there are enough free pages at all. It's imperative that we // Check quickly if there are enough free pages at all.
// check this before the chunk itself so that we quickly skip over
// unused parts of the address space, which may have a cleared bitmap
// but a zero'd summary which indicates not to allocate from there.
if s.summary[len(s.summary)-1][i].max() < uint(minPages) { if s.summary[len(s.summary)-1][i].max() < uint(minPages) {
continue continue
} }
...@@ -467,6 +495,7 @@ func (s *pageAlloc) scavengeOne(max uintptr, locked bool) uintptr { ...@@ -467,6 +495,7 @@ func (s *pageAlloc) scavengeOne(max uintptr, locked bool) uintptr {
base, npages := chunk.findScavengeCandidate(pallocChunkPages-1, minPages, maxPages) base, npages := chunk.findScavengeCandidate(pallocChunkPages-1, minPages, maxPages)
if npages > 0 { if npages > 0 {
// We found memory to scavenge! Mark the bits and report that up. // We found memory to scavenge! Mark the bits and report that up.
// scavengeRangeLocked will update scavAddr for us, also.
s.scavengeRangeLocked(i, base, npages) s.scavengeRangeLocked(i, base, npages)
unlockHeap() unlockHeap()
return uintptr(npages) * pageSize return uintptr(npages) * pageSize
...@@ -474,14 +503,22 @@ func (s *pageAlloc) scavengeOne(max uintptr, locked bool) uintptr { ...@@ -474,14 +503,22 @@ func (s *pageAlloc) scavengeOne(max uintptr, locked bool) uintptr {
// We were fooled, let's take this opportunity to move the scavAddr // We were fooled, let's take this opportunity to move the scavAddr
// all the way down to where we searched as scavenged for future calls // all the way down to where we searched as scavenged for future calls
// and keep iterating. // and keep iterating. Then, go get a new range.
s.scavAddr = chunkBase(i-1) + pallocChunkPages*pageSize - 1 s.scavAddr = chunkBase(i-1) + pallocChunkPages*pageSize - 1
unlockHeap() continue newRange
} }
lockHeap() lockHeap()
// We couldn't find anything, so signal that there's nothing left
// to scavenge. // Move the scavenger down the heap, past everything we just searched.
// Since we don't check if scavAddr moved while we let go of the heap lock,
// it's possible that it moved down and we're moving it up here. This
// raciness could result in us searching parts of the heap unnecessarily.
// TODO(mknyszek): Remove this racy behavior through explicit address
// space reservations, which are difficult to do with just scavAddr.
s.scavAddr = r.base - 1
}
// We reached the end of the in-use address space and couldn't find anything,
// so signal that there's nothing left to scavenge.
s.scavAddr = minScavAddr s.scavAddr = minScavAddr
unlockHeap() unlockHeap()
......
...@@ -182,6 +182,10 @@ type pageAlloc struct { ...@@ -182,6 +182,10 @@ type pageAlloc struct {
// runtime segmentation fault, we get a much friendlier out-of-bounds // runtime segmentation fault, we get a much friendlier out-of-bounds
// error. // error.
// //
// To iterate over a summary level, use inUse to determine which ranges
// are currently available. Otherwise one might try to access
// memory which is only Reserved which may result in a hard fault.
//
// We may still get segmentation faults < len since some of that // We may still get segmentation faults < len since some of that
// memory may not be committed yet. // memory may not be committed yet.
summary [summaryLevels][]pallocSum summary [summaryLevels][]pallocSum
...@@ -212,12 +216,9 @@ type pageAlloc struct { ...@@ -212,12 +216,9 @@ type pageAlloc struct {
// making the impact on BSS too high (note the L1 is stored directly // making the impact on BSS too high (note the L1 is stored directly
// in pageAlloc). // in pageAlloc).
// //
// summary[len(s.summary)-1][i] should always be checked, at least // To iterate over the bitmap, use inUse to determine which ranges
// for a zero max value, before accessing chunks[i]. It's possible the // are currently available. Otherwise one might iterate over unused
// bitmap at that index is mapped in and zeroed, indicating that it // ranges.
// contains free space, but in actuality it is unused since its
// corresponding summary was never updated. Tests may ignore this
// and assume the zero value (and that it is mapped).
// //
// TODO(mknyszek): Consider changing the definition of the bitmap // TODO(mknyszek): Consider changing the definition of the bitmap
// such that 1 means free and 0 means in-use so that summaries and // such that 1 means free and 0 means in-use so that summaries and
...@@ -297,53 +298,6 @@ func (s *pageAlloc) init(mheapLock *mutex, sysStat *uint64) { ...@@ -297,53 +298,6 @@ func (s *pageAlloc) init(mheapLock *mutex, sysStat *uint64) {
s.mheapLock = mheapLock s.mheapLock = mheapLock
} }
// extendMappedRegion makes sure the memory in [base+nbase, base+nlimit)
// is in the Ready state, given that [base+mbase, base+mlimit) has
// already been mapped. base must point at the start of a region that
// is in the Reserved state and must be aligned to the physical page
// size; otherwise this function throws.
//
// All four offsets are widened to physical-page boundaries before any
// comparison is made. Only the portion of the new range that falls
// outside the existing mapping is mapped, and if the new range lies
// entirely inside the existing mapping nothing is done.
//
// A mapping can be extended in one direction only. Asking for a range
// that sticks out past both ends of the existing mapping
// (nbase < mbase && nlimit > mlimit) is invalid and throws.
func extendMappedRegion(base unsafe.Pointer, mbase, mlimit, nbase, nlimit uintptr, sysStat *uint64) {
	if uintptr(base)%physPageSize != 0 {
		print("runtime: base = ", base, "\n")
		throw("extendMappedRegion: base not page-aligned")
	}

	// Widen both ranges outward to physical page boundaries.
	mbase, mlimit = alignDown(mbase, physPageSize), alignUp(mlimit, physPageSize)
	nbase, nlimit = alignDown(nbase, physPageSize), alignUp(nlimit, physPageSize)

	// When nothing is mapped yet the whole new range needs mapping, so
	// there is nothing to trim.
	if mbase != mlimit {
		// Trim the new range down to the part not already mapped.
		switch growsDown, growsUp := nbase < mbase, nlimit > mlimit; {
		case growsDown && growsUp:
			// TODO(mknyszek): Consider supporting this case. It can't
			// ever happen currently in the page allocator, but may be
			// useful in the future. Also, it would make this function's
			// purpose simpler to explain.
			throw("mapped region extended in two directions")
		case growsDown:
			// Extends below the mapping only: stop where it begins.
			nlimit = mbase
		case growsUp:
			// Extends above the mapping only: start where it ends.
			nbase = mlimit
		default:
			// Entirely inside the existing mapping.
			return
		}
	}

	// Transition from Reserved to Ready.
	start, size := add(base, nbase), nlimit-nbase
	sysMap(start, size, sysStat)
	sysUsed(start, size)
}
// compareSearchAddrTo compares an address against s.searchAddr in a linearized // compareSearchAddrTo compares an address against s.searchAddr in a linearized
// view of the address space on systems with discontinuous process address spaces. // view of the address space on systems with discontinuous process address spaces.
// This linearized view is the same one generated by chunkIndex and arenaIndex, // This linearized view is the same one generated by chunkIndex and arenaIndex,
......
...@@ -102,42 +102,79 @@ func (s *pageAlloc) sysGrow(base, limit uintptr) { ...@@ -102,42 +102,79 @@ func (s *pageAlloc) sysGrow(base, limit uintptr) {
throw("sysGrow bounds not aligned to pallocChunkBytes") throw("sysGrow bounds not aligned to pallocChunkBytes")
} }
// addrRangeToSummaryRange converts a range of addresses into a range
// of summary indices which must be mapped to support those addresses
// in the summary range.
addrRangeToSummaryRange := func(level int, r addrRange) (int, int) {
sumIdxBase, sumIdxLimit := addrsToSummaryRange(level, r.base, r.limit)
return blockAlignSummaryRange(level, sumIdxBase, sumIdxLimit)
}
// summaryRangeToSumAddrRange converts a range of indices in any
// level of s.summary into page-aligned addresses which cover that
// range of indices.
summaryRangeToSumAddrRange := func(level, sumIdxBase, sumIdxLimit int) addrRange {
baseOffset := alignDown(uintptr(sumIdxBase)*pallocSumBytes, physPageSize)
limitOffset := alignUp(uintptr(sumIdxLimit)*pallocSumBytes, physPageSize)
base := unsafe.Pointer(&s.summary[level][0])
return addrRange{
uintptr(add(base, baseOffset)),
uintptr(add(base, limitOffset)),
}
}
// addrRangeToSumAddrRange is a convenience function that converts
// an address range r to the address range of the given summary level
// that stores the summaries for r.
addrRangeToSumAddrRange := func(level int, r addrRange) addrRange {
sumIdxBase, sumIdxLimit := addrRangeToSummaryRange(level, r)
return summaryRangeToSumAddrRange(level, sumIdxBase, sumIdxLimit)
}
// Find the first inUse index which is strictly greater than base.
//
// Because this function will never be asked to remap the same memory
// twice, this index is effectively the index at which we would insert
// this new growth, and base will never overlap/be contained within
// any existing range.
//
// This will be used to look at what memory in the summary array is already
// mapped before and after this new range.
inUseIndex := s.inUse.findSucc(base)
// Walk up the radix tree and map summaries in as needed. // Walk up the radix tree and map summaries in as needed.
cbase, climit := chunkBase(s.start), chunkBase(s.end) for l := range s.summary {
for l := len(s.summary) - 1; l >= 0; l-- {
// Figure out what part of the summary array this new address space needs. // Figure out what part of the summary array this new address space needs.
// Note that we need to align the ranges to the block width (1<<levelBits[l]) needIdxBase, needIdxLimit := addrRangeToSummaryRange(l, addrRange{base, limit})
// at this level because the full block is needed to compute the summary for
// the next level.
lo, hi := addrsToSummaryRange(l, base, limit)
lo, hi = blockAlignSummaryRange(l, lo, hi)
// Update the summary slices with a new upper-bound. This ensures // Update the summary slices with a new upper-bound. This ensures
// we get tight bounds checks on at least the top bound. // we get tight bounds checks on at least the top bound.
// //
// We must do this regardless of whether we map new memory, because we // We must do this regardless of whether we map new memory.
// may be extending further into the mapped memory. if needIdxLimit > len(s.summary[l]) {
if hi > len(s.summary[l]) { s.summary[l] = s.summary[l][:needIdxLimit]
s.summary[l] = s.summary[l][:hi]
} }
// Figure out what part of the summary array is already mapped. // Compute the needed address range in the summary array for level l.
// If we're doing our first growth, just pass zero. need := summaryRangeToSumAddrRange(l, needIdxBase, needIdxLimit)
// addrsToSummaryRange won't accept cbase == climit.
var mlo, mhi int // Prune need down to what needs to be newly mapped. Some parts of it may
if s.start != 0 { // already be mapped by what inUse describes due to page alignment requirements
mlo, mhi = addrsToSummaryRange(l, cbase, climit) // for mapping. prune's invariants are guaranteed by the fact that this
mlo, mhi = blockAlignSummaryRange(l, mlo, mhi) // function will never be asked to remap the same memory twice.
if inUseIndex > 0 {
need = need.subtract(addrRangeToSumAddrRange(l, s.inUse.ranges[inUseIndex-1]))
}
if inUseIndex < len(s.inUse.ranges) {
need = need.subtract(addrRangeToSumAddrRange(l, s.inUse.ranges[inUseIndex]))
}
// It's possible that after our pruning above, there's nothing new to map.
if need.size() == 0 {
continue
} }
// Extend the mappings for this summary level. // Map and commit need.
extendMappedRegion( sysMap(unsafe.Pointer(need.base), need.size(), s.sysStat)
unsafe.Pointer(&s.summary[l][0]), sysUsed(unsafe.Pointer(need.base), need.size())
uintptr(mlo)*pallocSumBytes,
uintptr(mhi)*pallocSumBytes,
uintptr(lo)*pallocSumBytes,
uintptr(hi)*pallocSumBytes,
s.sysStat,
)
} }
} }
...@@ -41,10 +41,11 @@ func checkPageAlloc(t *testing.T, want, got *PageAlloc) { ...@@ -41,10 +41,11 @@ func checkPageAlloc(t *testing.T, want, got *PageAlloc) {
} }
func TestPageAllocGrow(t *testing.T) { func TestPageAllocGrow(t *testing.T) {
tests := map[string]struct { type test struct {
chunks []ChunkIdx chunks []ChunkIdx
inUse []AddrRange inUse []AddrRange
}{ }
tests := map[string]test{
"One": { "One": {
chunks: []ChunkIdx{ chunks: []ChunkIdx{
BaseChunkIdx, BaseChunkIdx,
...@@ -112,6 +113,18 @@ func TestPageAllocGrow(t *testing.T) { ...@@ -112,6 +113,18 @@ func TestPageAllocGrow(t *testing.T) {
}, },
}, },
} }
if PageAlloc64Bit != 0 {
tests["ExtremelyDiscontiguous"] = test{
chunks: []ChunkIdx{
BaseChunkIdx,
BaseChunkIdx + 0x100000, // constant translates to O(TiB)
},
inUse: []AddrRange{
{PageBase(BaseChunkIdx, 0), PageBase(BaseChunkIdx+1, 0)},
{PageBase(BaseChunkIdx+0x100000, 0), PageBase(BaseChunkIdx+0x100001, 0)},
},
}
}
for name, v := range tests { for name, v := range tests {
v := v v := v
t.Run(name, func(t *testing.T) { t.Run(name, func(t *testing.T) {
......
...@@ -21,6 +21,31 @@ type addrRange struct { ...@@ -21,6 +21,31 @@ type addrRange struct {
base, limit uintptr base, limit uintptr
} }
// size reports how many bytes the range covers. A range whose limit
// does not lie above its base is considered empty and has size 0.
func (a addrRange) size() uintptr {
	if a.base < a.limit {
		return a.limit - a.base
	}
	return 0
}
// subtract returns what is left of a after removing any part of it
// that overlaps b.
//
// subtract assumes that a and b are disjoint, overlap at only one end
// of a, or that b covers a entirely (which includes the two being
// equal); in that last case the zero addrRange is returned. If b lies
// strictly inside a, removing it would split a into two pieces, which
// a single addrRange cannot represent, so subtract throws.
func (a addrRange) subtract(b addrRange) addrRange {
	switch {
	case b.base <= a.base && a.limit <= b.limit:
		// b covers all of a, so nothing remains.
		return addrRange{}
	case a.base < b.base && b.limit < a.limit:
		// b would punch a hole in the middle of a.
		throw("bad prune")
	case b.limit < a.limit && a.base < b.limit:
		// b overlaps the low end of a; keep the part above b.
		a.base = b.limit
	case a.base < b.base && b.base < a.limit:
		// b overlaps the high end of a; keep the part below b.
		a.limit = b.base
	}
	return a
}
// addrRanges is a data structure holding a collection of ranges of // addrRanges is a data structure holding a collection of ranges of
// address space. // address space.
// //
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment