mirror of
https://github.com/golang/go
synced 2024-11-17 22:14:43 -07:00
runtime: fix missing pprof labels
Use gp.m.curg instead of the gp when recording cpu profiler stack traces. This ensures profiler labels are captured when systemstack or similar is executing on behalf of the current goroutine. After this there are still rare cases of samples containing the labelHog function, so more work might be needed. This patch should fix ~99% of the problem. Fixes #48577. Change-Id: I27132110e3d09721ec3b3ef417122bc70d8f3279 Reviewed-on: https://go-review.googlesource.com/c/go/+/351751 Reviewed-by: Michael Pratt <mpratt@google.com> Run-TryBot: Michael Pratt <mpratt@google.com> TryBot-Result: Go Bot <gobot@golang.org> Trust: Michael Knyszek <mknyszek@google.com>
This commit is contained in:
parent
4d7bf41beb
commit
da7173a2ed
@ -89,7 +89,7 @@ func SetCPUProfileRate(hz int) {
|
|||||||
// held at the time of the signal, nor can it use substantial amounts
|
// held at the time of the signal, nor can it use substantial amounts
|
||||||
// of stack.
|
// of stack.
|
||||||
//go:nowritebarrierrec
|
//go:nowritebarrierrec
|
||||||
func (p *cpuProfile) add(gp *g, stk []uintptr) {
|
func (p *cpuProfile) add(tagPtr *unsafe.Pointer, stk []uintptr) {
|
||||||
// Simple cas-lock to coordinate with setcpuprofilerate.
|
// Simple cas-lock to coordinate with setcpuprofilerate.
|
||||||
for !atomic.Cas(&prof.signalLock, 0, 1) {
|
for !atomic.Cas(&prof.signalLock, 0, 1) {
|
||||||
osyield()
|
osyield()
|
||||||
@ -104,15 +104,6 @@ func (p *cpuProfile) add(gp *g, stk []uintptr) {
|
|||||||
// because otherwise its write barrier behavior may not
|
// because otherwise its write barrier behavior may not
|
||||||
// be correct. See the long comment there before
|
// be correct. See the long comment there before
|
||||||
// changing the argument here.
|
// changing the argument here.
|
||||||
//
|
|
||||||
// Note: it can happen on Windows, where we are calling
|
|
||||||
// p.add with a gp that is not the current g, that gp is nil,
|
|
||||||
// meaning we interrupted a system thread with no g.
|
|
||||||
// Avoid faulting in that case.
|
|
||||||
var tagPtr *unsafe.Pointer
|
|
||||||
if gp != nil {
|
|
||||||
tagPtr = &gp.labels
|
|
||||||
}
|
|
||||||
cpuprof.log.write(tagPtr, nanotime(), hdr[:], stk)
|
cpuprof.log.write(tagPtr, nanotime(), hdr[:], stk)
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -1361,6 +1361,73 @@ func TestLabelRace(t *testing.T) {
|
|||||||
})
|
})
|
||||||
}
|
}
|
||||||
|
|
||||||
|
func TestLabelSystemstack(t *testing.T) {
|
||||||
|
// See http://golang.org/cl/351751.
|
||||||
|
prof := testCPUProfile(t, stackContainsLabeled, []string{"runtime.systemstack;key=value"}, avoidFunctions(), func(dur time.Duration) {
|
||||||
|
Do(context.Background(), Labels("key", "value"), func(context.Context) {
|
||||||
|
var wg sync.WaitGroup
|
||||||
|
stop := make(chan struct{})
|
||||||
|
for i := 0; i < runtime.GOMAXPROCS(0); i++ {
|
||||||
|
wg.Add(1)
|
||||||
|
go func() {
|
||||||
|
defer wg.Done()
|
||||||
|
labelHog(stop)
|
||||||
|
}()
|
||||||
|
}
|
||||||
|
|
||||||
|
time.Sleep(dur)
|
||||||
|
close(stop)
|
||||||
|
wg.Wait()
|
||||||
|
})
|
||||||
|
})
|
||||||
|
|
||||||
|
var withLabel, withoutLabel int64
|
||||||
|
for _, s := range prof.Sample {
|
||||||
|
var systemstack, labelHog bool
|
||||||
|
for _, loc := range s.Location {
|
||||||
|
for _, l := range loc.Line {
|
||||||
|
switch l.Function.Name {
|
||||||
|
case "runtime.systemstack":
|
||||||
|
systemstack = true
|
||||||
|
case "runtime/pprof.labelHog":
|
||||||
|
labelHog = true
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
if systemstack && labelHog {
|
||||||
|
if s.Label != nil && contains(s.Label["key"], "value") {
|
||||||
|
withLabel += s.Value[0]
|
||||||
|
} else {
|
||||||
|
withoutLabel += s.Value[0]
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// ratio on 2019 Intel MBP before/after CL 351751 for n=30 runs:
|
||||||
|
// before: mean=0.013 stddev=0.013 min=0.000 max=0.039
|
||||||
|
// after : mean=0.996 stddev=0.007 min=0.967 max=1.000
|
||||||
|
//
|
||||||
|
// TODO: Figure out why some samples still contain labelHog without labels.
|
||||||
|
// Once fixed this test case can be simplified to just check that all samples
|
||||||
|
// containing labelHog() have the label, and no other samples do.
|
||||||
|
ratio := float64(withLabel) / float64((withLabel + withoutLabel))
|
||||||
|
if ratio < 0.9 {
|
||||||
|
t.Fatalf("only %.1f%% of labelHog(systemstack()) samples have label", ratio*100)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
func labelHog(stop chan struct{}) {
|
||||||
|
for i := 0; ; i++ {
|
||||||
|
select {
|
||||||
|
case <-stop:
|
||||||
|
return
|
||||||
|
default:
|
||||||
|
fmt.Fprintf(io.Discard, "%d", i)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
// Check that there is no deadlock when the program receives SIGPROF while in
|
// Check that there is no deadlock when the program receives SIGPROF while in
|
||||||
// 64bit atomics' critical section. Used to happen on mips{,le}. See #20146.
|
// 64bit atomics' critical section. Used to happen on mips{,le}. See #20146.
|
||||||
func TestAtomicLoadStore64(t *testing.T) {
|
func TestAtomicLoadStore64(t *testing.T) {
|
||||||
|
@ -4711,7 +4711,14 @@ func sigprof(pc, sp, lr uintptr, gp *g, mp *m) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
if prof.hz != 0 {
|
if prof.hz != 0 {
|
||||||
cpuprof.add(gp, stk[:n])
|
// Note: it can happen on Windows that we interrupted a system thread
|
||||||
|
// with no g, so gp could nil. The other nil checks are done out of
|
||||||
|
// caution, but not expected to be nil in practice.
|
||||||
|
var tagPtr *unsafe.Pointer
|
||||||
|
if gp != nil && gp.m != nil && gp.m.curg != nil {
|
||||||
|
tagPtr = &gp.m.curg.labels
|
||||||
|
}
|
||||||
|
cpuprof.add(tagPtr, stk[:n])
|
||||||
}
|
}
|
||||||
getg().m.mallocing--
|
getg().m.mallocing--
|
||||||
}
|
}
|
||||||
|
Loading…
Reference in New Issue
Block a user