Commit 9dc6764d authored by Keith Randall's avatar Keith Randall

runtime: a few optimizations of scanblock.

Lowers gc pause time by 5-10% on test/bench/garbage

LGTM=rsc, dvyukov
R=rsc, dvyukov
CC=golang-codereviews
https://golang.org/cl/157810043
parent 64bed3f5
...@@ -215,8 +215,7 @@ scanblock(byte *b, uintptr n, byte *ptrmask) ...@@ -215,8 +215,7 @@ scanblock(byte *b, uintptr n, byte *ptrmask)
for(i = 0; i < nelem(scanbuf); i++) { for(i = 0; i < nelem(scanbuf); i++) {
b = scanbuf[scanbufpos]; b = scanbuf[scanbufpos];
scanbuf[scanbufpos++] = nil; scanbuf[scanbufpos++] = nil;
if(scanbufpos == nelem(scanbuf)) scanbufpos %= nelem(scanbuf);
scanbufpos = 0;
if(b != nil) { if(b != nil) {
n = arena_used - b; // scan until bitBoundary or BitsDead n = arena_used - b; // scan until bitBoundary or BitsDead
ptrmask = nil; // use GC bitmap for pointer info ptrmask = nil; // use GC bitmap for pointer info
...@@ -267,10 +266,13 @@ scanblock(byte *b, uintptr n, byte *ptrmask) ...@@ -267,10 +266,13 @@ scanblock(byte *b, uintptr n, byte *ptrmask)
break; break;
// Consult GC bitmap. // Consult GC bitmap.
bits = *ptrbitp; bits = *ptrbitp;
if((((uintptr)b+i)%(PtrSize*wordsPerBitmapByte)) != 0) {
ptrbitp--; if(wordsPerBitmapByte != 2)
bits >>= gcBits; runtime·throw("alg doesn't work for wordsPerBitmapByte != 2");
} j = ((uintptr)b+i)/PtrSize & 1;
ptrbitp -= j;
bits >>= gcBits*j;
if((bits&bitBoundary) != 0 && i != 0) if((bits&bitBoundary) != 0 && i != 0)
break; // reached beginning of the next object break; // reached beginning of the next object
bits = (bits>>2)&BitsMask; bits = (bits>>2)&BitsMask;
...@@ -293,10 +295,9 @@ scanblock(byte *b, uintptr n, byte *ptrmask) ...@@ -293,10 +295,9 @@ scanblock(byte *b, uintptr n, byte *ptrmask)
// Find the next pair of bits. // Find the next pair of bits.
if(ptrmask == nil) { if(ptrmask == nil) {
bits = *ptrbitp; bits = *ptrbitp;
if((((uintptr)b+i)%(PtrSize*wordsPerBitmapByte)) == 0) { j = ((uintptr)b+i+PtrSize)/PtrSize & 1;
ptrbitp--; ptrbitp -= j;
bits >>= gcBits; bits >>= gcBits*j;
}
bits = (bits>>2)&BitsMask; bits = (bits>>2)&BitsMask;
} else } else
bits = (ptrmask[((i+PtrSize)/PtrSize)/4]>>((((i+PtrSize)/PtrSize)%4)*BitsPerPointer))&BitsMask; bits = (ptrmask[((i+PtrSize)/PtrSize)/4]>>((((i+PtrSize)/PtrSize)%4)*BitsPerPointer))&BitsMask;
...@@ -328,12 +329,13 @@ scanblock(byte *b, uintptr n, byte *ptrmask) ...@@ -328,12 +329,13 @@ scanblock(byte *b, uintptr n, byte *ptrmask)
// Check if it points into heap. // Check if it points into heap.
if(obj == nil) if(obj == nil)
continue; continue;
if((uintptr)obj < PhysPageSize) { if(obj < arena_start || obj >= arena_used) {
s = nil; if((uintptr)obj < PhysPageSize) {
goto badobj; s = nil;
} goto badobj;
if(obj < arena_start || obj >= arena_used) }
continue; continue;
}
// Mark the object. // Mark the object.
obj = (byte*)((uintptr)obj & ~(PtrSize-1)); obj = (byte*)((uintptr)obj & ~(PtrSize-1));
off = (uintptr*)obj - (uintptr*)arena_start; off = (uintptr*)obj - (uintptr*)arena_start;
...@@ -442,8 +444,7 @@ scanblock(byte *b, uintptr n, byte *ptrmask) ...@@ -442,8 +444,7 @@ scanblock(byte *b, uintptr n, byte *ptrmask)
PREFETCH(obj); PREFETCH(obj);
p = scanbuf[scanbufpos]; p = scanbuf[scanbufpos];
scanbuf[scanbufpos++] = obj; scanbuf[scanbufpos++] = obj;
if(scanbufpos == nelem(scanbuf)) scanbufpos %= nelem(scanbuf);
scanbufpos = 0;
if(p == nil) if(p == nil)
continue; continue;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment