Commit b0392159 authored by Austin Clements's avatar Austin Clements

runtime,cmd/trace: trace GC STW events

Right now we only kind of sort of trace GC STW events. We emit events
around mark termination, but those start well after stopping the world
and end before starting it again, and we don't emit any events for
sweep termination.

Fix this by generalizing EvGCScanStart/EvGCScanDone. These were
already re-purposed to indicate mark termination (despite the names).
This commit renames them to EvGCSTWStart/EvGCSTWDone, adds an argument
to indicate the STW reason, and shuffles the runtime to generate them
right before stopping the world and right after starting the world,
respectively.

These events will make it possible to generate precise minimum mutator
utilization (MMU) graphs and could be useful in detecting
non-preemptible goroutines (e.g., #20792).

Change-Id: If95783f370781d8ef66addd94886028103a7c26f
Reviewed-on: https://go-review.googlesource.com/55411Reviewed-by: default avatarRick Hudson <rlh@golang.org>
parent 4a5c3779
...@@ -478,12 +478,12 @@ func generateTrace(params *traceParams) (ViewerData, error) { ...@@ -478,12 +478,12 @@ func generateTrace(params *traceParams) (ViewerData, error) {
case trace.EvGCStart: case trace.EvGCStart:
ctx.emitSlice(ev, "GC") ctx.emitSlice(ev, "GC")
case trace.EvGCDone: case trace.EvGCDone:
case trace.EvGCScanStart: case trace.EvGCSTWStart:
if ctx.gtrace { if ctx.gtrace {
continue continue
} }
ctx.emitSlice(ev, "MARK TERMINATION") ctx.emitSlice(ev, fmt.Sprintf("STW (%s)", ev.SArgs[0]))
case trace.EvGCScanDone: case trace.EvGCSTWDone:
case trace.EvGCMarkAssistStart: case trace.EvGCMarkAssistStart:
// Mark assists can continue past preemptions, so truncate to the // Mark assists can continue past preemptions, so truncate to the
// whichever comes first. We'll synthesize another slice if // whichever comes first. We'll synthesize another slice if
......
...@@ -31,7 +31,7 @@ type Event struct { ...@@ -31,7 +31,7 @@ type Event struct {
SArgs []string // event-type-specific string args SArgs []string // event-type-specific string args
// linked event (can be nil), depends on event type: // linked event (can be nil), depends on event type:
// for GCStart: the GCStop // for GCStart: the GCStop
// for GCScanStart: the GCScanDone // for GCSTWStart: the GCSTWDone
// for GCSweepStart: the GCSweepDone // for GCSweepStart: the GCSweepDone
// for GoCreate: first GoStart of the created goroutine // for GoCreate: first GoStart of the created goroutine
// for GoStart/GoStartLabel: the associated GoEnd, GoBlock or other blocking event // for GoStart/GoStartLabel: the associated GoEnd, GoBlock or other blocking event
...@@ -128,7 +128,7 @@ func readTrace(r io.Reader) (ver int, events []rawEvent, strings map[uint64]stri ...@@ -128,7 +128,7 @@ func readTrace(r io.Reader) (ver int, events []rawEvent, strings map[uint64]stri
return return
} }
switch ver { switch ver {
case 1005, 1007, 1008, 1009: case 1005, 1007, 1008, 1009, 1010:
// Note: When adding a new version, add canned traces // Note: When adding a new version, add canned traces
// from the old version to the test suite using mkcanned.bash. // from the old version to the test suite using mkcanned.bash.
break break
...@@ -373,7 +373,18 @@ func parseEvents(ver int, rawEvents []rawEvent, strings map[uint64]string) (even ...@@ -373,7 +373,18 @@ func parseEvents(ver int, rawEvents []rawEvent, strings map[uint64]string) (even
if raw.typ == EvGoStartLabel { if raw.typ == EvGoStartLabel {
e.SArgs = []string{strings[e.Args[2]]} e.SArgs = []string{strings[e.Args[2]]}
} }
case EvGCStart, EvGCDone, EvGCScanStart, EvGCScanDone: case EvGCSTWStart:
e.G = 0
switch e.Args[0] {
case 0:
e.SArgs = []string{"mark termination"}
case 1:
e.SArgs = []string{"sweep termination"}
default:
err = fmt.Errorf("unknown STW kind %d", e.Args[0])
return
}
case EvGCStart, EvGCDone, EvGCSTWDone:
e.G = 0 e.G = 0
case EvGoEnd, EvGoStop, EvGoSched, EvGoPreempt, case EvGoEnd, EvGoStop, EvGoSched, EvGoPreempt,
EvGoSleep, EvGoBlock, EvGoBlockSend, EvGoBlockRecv, EvGoSleep, EvGoBlock, EvGoBlockSend, EvGoBlockRecv,
...@@ -511,14 +522,14 @@ func postProcessTrace(ver int, events []*Event) error { ...@@ -511,14 +522,14 @@ func postProcessTrace(ver int, events []*Event) error {
type pdesc struct { type pdesc struct {
running bool running bool
g uint64 g uint64
evScan *Event evSTW *Event
evSweep *Event evSweep *Event
} }
gs := make(map[uint64]gdesc) gs := make(map[uint64]gdesc)
ps := make(map[int]pdesc) ps := make(map[int]pdesc)
gs[0] = gdesc{state: gRunning} gs[0] = gdesc{state: gRunning}
var evGC *Event var evGC, evSTW *Event
checkRunning := func(p pdesc, g gdesc, ev *Event, allowG0 bool) error { checkRunning := func(p pdesc, g gdesc, ev *Event, allowG0 bool) error {
name := EventDescriptions[ev.Type].Name name := EventDescriptions[ev.Type].Name
...@@ -565,17 +576,27 @@ func postProcessTrace(ver int, events []*Event) error { ...@@ -565,17 +576,27 @@ func postProcessTrace(ver int, events []*Event) error {
} }
evGC.Link = ev evGC.Link = ev
evGC = nil evGC = nil
case EvGCScanStart: case EvGCSTWStart:
if p.evScan != nil { evp := &evSTW
return fmt.Errorf("previous scanning is not ended before a new one (offset %v, time %v)", ev.Off, ev.Ts) if ver < 1010 {
} // Before 1.10, EvGCSTWStart was per-P.
p.evScan = ev evp = &p.evSTW
case EvGCScanDone: }
if p.evScan == nil { if *evp != nil {
return fmt.Errorf("bogus scanning end (offset %v, time %v)", ev.Off, ev.Ts) return fmt.Errorf("previous STW is not ended before a new one (offset %v, time %v)", ev.Off, ev.Ts)
} }
p.evScan.Link = ev *evp = ev
p.evScan = nil case EvGCSTWDone:
evp := &evSTW
if ver < 1010 {
// Before 1.10, EvGCSTWDone was per-P.
evp = &p.evSTW
}
if *evp == nil {
return fmt.Errorf("bogus STW end (offset %v, time %v)", ev.Off, ev.Ts)
}
(*evp).Link = ev
*evp = nil
case EvGCSweepStart: case EvGCSweepStart:
if p.evSweep != nil { if p.evSweep != nil {
return fmt.Errorf("previous sweeping is not ended before a new one (offset %v, time %v)", ev.Off, ev.Ts) return fmt.Errorf("previous sweeping is not ended before a new one (offset %v, time %v)", ev.Off, ev.Ts)
...@@ -864,6 +885,10 @@ func argNum(raw rawEvent, ver int) int { ...@@ -864,6 +885,10 @@ func argNum(raw rawEvent, ver int) int {
if ver < 1007 { if ver < 1007 {
narg-- // 1.7 added an additional seq arg narg-- // 1.7 added an additional seq arg
} }
case EvGCSTWStart:
if ver < 1010 {
narg-- // 1.10 added an argument
}
} }
return narg return narg
} }
...@@ -883,8 +908,8 @@ const ( ...@@ -883,8 +908,8 @@ const (
EvProcStop = 6 // stop of P [timestamp] EvProcStop = 6 // stop of P [timestamp]
EvGCStart = 7 // GC start [timestamp, seq, stack id] EvGCStart = 7 // GC start [timestamp, seq, stack id]
EvGCDone = 8 // GC done [timestamp] EvGCDone = 8 // GC done [timestamp]
EvGCScanStart = 9 // GC mark termination start [timestamp] EvGCSTWStart = 9 // GC mark termination start [timestamp, kind]
EvGCScanDone = 10 // GC mark termination done [timestamp] EvGCSTWDone = 10 // GC mark termination done [timestamp]
EvGCSweepStart = 11 // GC sweep start [timestamp, stack id] EvGCSweepStart = 11 // GC sweep start [timestamp, stack id]
EvGCSweepDone = 12 // GC sweep done [timestamp, swept, reclaimed] EvGCSweepDone = 12 // GC sweep done [timestamp, swept, reclaimed]
EvGoCreate = 13 // goroutine creation [timestamp, new goroutine id, new stack id, stack id] EvGoCreate = 13 // goroutine creation [timestamp, new goroutine id, new stack id, stack id]
...@@ -937,8 +962,8 @@ var EventDescriptions = [EvCount]struct { ...@@ -937,8 +962,8 @@ var EventDescriptions = [EvCount]struct {
EvProcStop: {"ProcStop", 1005, false, []string{}}, EvProcStop: {"ProcStop", 1005, false, []string{}},
EvGCStart: {"GCStart", 1005, true, []string{"seq"}}, // in 1.5 format it was {} EvGCStart: {"GCStart", 1005, true, []string{"seq"}}, // in 1.5 format it was {}
EvGCDone: {"GCDone", 1005, false, []string{}}, EvGCDone: {"GCDone", 1005, false, []string{}},
EvGCScanStart: {"GCScanStart", 1005, false, []string{}}, EvGCSTWStart: {"GCSTWStart", 1005, false, []string{"kind"}}, // <= 1.9, args was {} (implicitly {0})
EvGCScanDone: {"GCScanDone", 1005, false, []string{}}, EvGCSTWDone: {"GCSTWDone", 1005, false, []string{}},
EvGCSweepStart: {"GCSweepStart", 1005, true, []string{}}, EvGCSweepStart: {"GCSweepStart", 1005, true, []string{}},
EvGCSweepDone: {"GCSweepDone", 1005, false, []string{"swept", "reclaimed"}}, // before 1.9, format was {} EvGCSweepDone: {"GCSweepDone", 1005, false, []string{"swept", "reclaimed"}}, // before 1.9, format was {}
EvGoCreate: {"GoCreate", 1005, true, []string{"g", "stack"}}, EvGoCreate: {"GoCreate", 1005, true, []string{"g", "stack"}},
......
...@@ -1256,6 +1256,9 @@ func gcStart(mode gcMode, trigger gcTrigger) { ...@@ -1256,6 +1256,9 @@ func gcStart(mode gcMode, trigger gcTrigger) {
now := nanotime() now := nanotime()
work.tSweepTerm = now work.tSweepTerm = now
work.pauseStart = now work.pauseStart = now
if trace.enabled {
traceGCSTWStart(1)
}
systemstack(stopTheWorldWithSema) systemstack(stopTheWorldWithSema)
// Finish sweep before we start concurrent scan. // Finish sweep before we start concurrent scan.
systemstack(func() { systemstack(func() {
...@@ -1309,11 +1312,16 @@ func gcStart(mode gcMode, trigger gcTrigger) { ...@@ -1309,11 +1312,16 @@ func gcStart(mode gcMode, trigger gcTrigger) {
// Concurrent mark. // Concurrent mark.
systemstack(func() { systemstack(func() {
now = startTheWorldWithSema() now = startTheWorldWithSema(trace.enabled)
}) })
work.pauseNS += now - work.pauseStart work.pauseNS += now - work.pauseStart
work.tMark = now work.tMark = now
} else { } else {
if trace.enabled {
// Switch to mark termination STW.
traceGCSTWDone()
traceGCSTWStart(0)
}
t := nanotime() t := nanotime()
work.tMark, work.tMarkTerm = t, t work.tMark, work.tMarkTerm = t, t
work.heapGoal = work.heap0 work.heapGoal = work.heap0
...@@ -1414,6 +1422,9 @@ top: ...@@ -1414,6 +1422,9 @@ top:
work.tMarkTerm = now work.tMarkTerm = now
work.pauseStart = now work.pauseStart = now
getg().m.preemptoff = "gcing" getg().m.preemptoff = "gcing"
if trace.enabled {
traceGCSTWStart(0)
}
systemstack(stopTheWorldWithSema) systemstack(stopTheWorldWithSema)
// The gcphase is _GCmark, it will transition to _GCmarktermination // The gcphase is _GCmark, it will transition to _GCmarktermination
// below. The important thing is that the wb remains active until // below. The important thing is that the wb remains active until
...@@ -1574,7 +1585,7 @@ func gcMarkTermination(nextTriggerRatio float64) { ...@@ -1574,7 +1585,7 @@ func gcMarkTermination(nextTriggerRatio float64) {
// so events don't leak into the wrong cycle. // so events don't leak into the wrong cycle.
mProf_NextCycle() mProf_NextCycle()
systemstack(func() { startTheWorldWithSema() }) systemstack(func() { startTheWorldWithSema(true) })
// Flush the heap profile so we can start a new cycle next GC. // Flush the heap profile so we can start a new cycle next GC.
// This is relatively expensive, so we don't do it with the // This is relatively expensive, so we don't do it with the
...@@ -1915,10 +1926,6 @@ func gcMark(start_time int64) { ...@@ -1915,10 +1926,6 @@ func gcMark(start_time int64) {
work.helperDrainBlock = true work.helperDrainBlock = true
} }
if trace.enabled {
traceGCScanStart()
}
if work.nproc > 1 { if work.nproc > 1 {
noteclear(&work.alldone) noteclear(&work.alldone)
helpgc(int32(work.nproc)) helpgc(int32(work.nproc))
...@@ -1962,10 +1969,6 @@ func gcMark(start_time int64) { ...@@ -1962,10 +1969,6 @@ func gcMark(start_time int64) {
} }
} }
if trace.enabled {
traceGCScanDone()
}
cachestats() cachestats()
// Update the marked heap stat. // Update the marked heap stat.
...@@ -2103,10 +2106,6 @@ func gchelper() { ...@@ -2103,10 +2106,6 @@ func gchelper() {
_g_.m.traceback = 2 _g_.m.traceback = 2
gchelperstart() gchelperstart()
if trace.enabled {
traceGCScanStart()
}
// Parallel mark over GC roots and heap // Parallel mark over GC roots and heap
if gcphase == _GCmarktermination { if gcphase == _GCmarktermination {
gcw := &_g_.m.p.ptr().gcw gcw := &_g_.m.p.ptr().gcw
...@@ -2118,10 +2117,6 @@ func gchelper() { ...@@ -2118,10 +2117,6 @@ func gchelper() {
gcw.dispose() gcw.dispose()
} }
if trace.enabled {
traceGCScanDone()
}
nproc := atomic.Load(&work.nproc) // work.nproc can change right after we increment work.ndone nproc := atomic.Load(&work.nproc) // work.nproc can change right after we increment work.ndone
if atomic.Xadd(&work.ndone, +1) == nproc-1 { if atomic.Xadd(&work.ndone, +1) == nproc-1 {
notewakeup(&work.alldone) notewakeup(&work.alldone)
......
...@@ -948,7 +948,7 @@ func stopTheWorld(reason string) { ...@@ -948,7 +948,7 @@ func stopTheWorld(reason string) {
// startTheWorld undoes the effects of stopTheWorld. // startTheWorld undoes the effects of stopTheWorld.
func startTheWorld() { func startTheWorld() {
systemstack(func() { startTheWorldWithSema() }) systemstack(func() { startTheWorldWithSema(false) })
// worldsema must be held over startTheWorldWithSema to ensure // worldsema must be held over startTheWorldWithSema to ensure
// gomaxprocs cannot change while worldsema is held. // gomaxprocs cannot change while worldsema is held.
semrelease(&worldsema) semrelease(&worldsema)
...@@ -1064,7 +1064,7 @@ func mhelpgc() { ...@@ -1064,7 +1064,7 @@ func mhelpgc() {
_g_.m.helpgc = -1 _g_.m.helpgc = -1
} }
func startTheWorldWithSema() int64 { func startTheWorldWithSema(emitTraceEvent bool) int64 {
_g_ := getg() _g_ := getg()
_g_.m.locks++ // disable preemption because it can be holding p in a local var _g_.m.locks++ // disable preemption because it can be holding p in a local var
...@@ -1106,6 +1106,9 @@ func startTheWorldWithSema() int64 { ...@@ -1106,6 +1106,9 @@ func startTheWorldWithSema() int64 {
// Capture start-the-world time before doing clean-up tasks. // Capture start-the-world time before doing clean-up tasks.
startTime := nanotime() startTime := nanotime()
if emitTraceEvent {
traceGCSTWDone()
}
// Wakeup an additional proc in case we have excessive runnable goroutines // Wakeup an additional proc in case we have excessive runnable goroutines
// in local queues or in the global queue. If we don't, the proc will park itself. // in local queues or in the global queue. If we don't, the proc will park itself.
......
...@@ -28,8 +28,8 @@ const ( ...@@ -28,8 +28,8 @@ const (
traceEvProcStop = 6 // stop of P [timestamp] traceEvProcStop = 6 // stop of P [timestamp]
traceEvGCStart = 7 // GC start [timestamp, seq, stack id] traceEvGCStart = 7 // GC start [timestamp, seq, stack id]
traceEvGCDone = 8 // GC done [timestamp] traceEvGCDone = 8 // GC done [timestamp]
traceEvGCScanStart = 9 // GC mark termination start [timestamp] traceEvGCSTWStart = 9 // GC STW start [timestamp, kind]
traceEvGCScanDone = 10 // GC mark termination done [timestamp] traceEvGCSTWDone = 10 // GC STW done [timestamp]
traceEvGCSweepStart = 11 // GC sweep start [timestamp, stack id] traceEvGCSweepStart = 11 // GC sweep start [timestamp, stack id]
traceEvGCSweepDone = 12 // GC sweep done [timestamp, swept, reclaimed] traceEvGCSweepDone = 12 // GC sweep done [timestamp, swept, reclaimed]
traceEvGoCreate = 13 // goroutine creation [timestamp, new goroutine id, new stack id, stack id] traceEvGoCreate = 13 // goroutine creation [timestamp, new goroutine id, new stack id, stack id]
...@@ -382,7 +382,7 @@ func ReadTrace() []byte { ...@@ -382,7 +382,7 @@ func ReadTrace() []byte {
trace.headerWritten = true trace.headerWritten = true
trace.lockOwner = nil trace.lockOwner = nil
unlock(&trace.lock) unlock(&trace.lock)
return []byte("go 1.9 trace\x00\x00\x00\x00") return []byte("go 1.10 trace\x00\x00\x00")
} }
// Wait for new data. // Wait for new data.
if trace.fullHead == 0 && !trace.shutdown { if trace.fullHead == 0 && !trace.shutdown {
...@@ -924,12 +924,12 @@ func traceGCDone() { ...@@ -924,12 +924,12 @@ func traceGCDone() {
traceEvent(traceEvGCDone, -1) traceEvent(traceEvGCDone, -1)
} }
func traceGCScanStart() { func traceGCSTWStart(kind int) {
traceEvent(traceEvGCScanStart, -1) traceEvent(traceEvGCSTWStart, -1, uint64(kind))
} }
func traceGCScanDone() { func traceGCSTWDone() {
traceEvent(traceEvGCScanDone, -1) traceEvent(traceEvGCSTWDone, -1)
} }
// traceGCSweepStart prepares to trace a sweep loop. This does not // traceGCSweepStart prepares to trace a sweep loop. This does not
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment