mirror of
https://github.com/golang/go
synced 2024-11-12 06:30:21 -07:00
runtime: preempt a goroutine which calls a lot of short system calls
A goroutine should be preempted if it runs for 10ms without blocking. We found that this doesn't work for goroutines which call short system calls. For example, the next program can stuck for seconds without this fix: $ cat main.go package main import ( "runtime" "syscall" ) func main() { runtime.GOMAXPROCS(1) c := make(chan int) go func() { c <- 1 for { t := syscall.Timespec{ Nsec: 300, } if true { syscall.Nanosleep(&t, nil) } } }() <-c } $ time go run main.go real 0m8.796s user 0m0.367s sys 0m0.893s Updates #10958 Change-Id: Id3be54d3779cc28bfc8b33fe578f13778f1ae2a2 Reviewed-on: https://go-review.googlesource.com/c/go/+/170138 Reviewed-by: Dmitry Vyukov <dvyukov@google.com> Run-TryBot: Dmitry Vyukov <dvyukov@google.com> TryBot-Result: Gobot Gobot <gobot@golang.org>
This commit is contained in:
parent
08e1823a63
commit
4166ff42c0
@ -34,6 +34,8 @@ var Fastlog2 = fastlog2
|
||||
var Atoi = atoi
|
||||
var Atoi32 = atoi32
|
||||
|
||||
var Nanotime = nanotime
|
||||
|
||||
type LFNode struct {
|
||||
Next uint64
|
||||
Pushcnt uintptr
|
||||
|
@ -4380,10 +4380,24 @@ func retake(now int64) uint32 {
|
||||
}
|
||||
pd := &_p_.sysmontick
|
||||
s := _p_.status
|
||||
sysretake := false
|
||||
if s == _Prunning || s == _Psyscall {
|
||||
// Preempt G if it's running for too long.
|
||||
t := int64(_p_.schedtick)
|
||||
if int64(pd.schedtick) != t {
|
||||
pd.schedtick = uint32(t)
|
||||
pd.schedwhen = now
|
||||
} else if pd.schedwhen+forcePreemptNS <= now {
|
||||
preemptone(_p_)
|
||||
// In case of syscall, preemptone() doesn't
|
||||
// work, because there is no M wired to P.
|
||||
sysretake = true
|
||||
}
|
||||
}
|
||||
if s == _Psyscall {
|
||||
// Retake P from syscall if it's there for more than 1 sysmon tick (at least 20us).
|
||||
t := int64(_p_.syscalltick)
|
||||
if int64(pd.syscalltick) != t {
|
||||
if !sysretake && int64(pd.syscalltick) != t {
|
||||
pd.syscalltick = uint32(t)
|
||||
pd.syscallwhen = now
|
||||
continue
|
||||
@ -4412,18 +4426,6 @@ func retake(now int64) uint32 {
|
||||
}
|
||||
incidlelocked(1)
|
||||
lock(&allpLock)
|
||||
} else if s == _Prunning {
|
||||
// Preempt G if it's running for too long.
|
||||
t := int64(_p_.schedtick)
|
||||
if int64(pd.schedtick) != t {
|
||||
pd.schedtick = uint32(t)
|
||||
pd.schedwhen = now
|
||||
continue
|
||||
}
|
||||
if pd.schedwhen+forcePreemptNS > now {
|
||||
continue
|
||||
}
|
||||
preemptone(_p_)
|
||||
}
|
||||
}
|
||||
unlock(&allpLock)
|
||||
|
@ -5,6 +5,7 @@
|
||||
package runtime_test
|
||||
|
||||
import (
|
||||
"fmt"
|
||||
"math"
|
||||
"net"
|
||||
"runtime"
|
||||
@ -910,3 +911,69 @@ func TestLockOSThreadAvoidsStatePropagation(t *testing.T) {
|
||||
t.Errorf("want %q, got %q", want, output)
|
||||
}
|
||||
}
|
||||
|
||||
// fakeSyscall emulates a system call.
|
||||
//go:nosplit
|
||||
func fakeSyscall(duration time.Duration) {
|
||||
runtime.Entersyscall()
|
||||
for start := runtime.Nanotime(); runtime.Nanotime()-start < int64(duration); {
|
||||
}
|
||||
runtime.Exitsyscall()
|
||||
}
|
||||
|
||||
// Check that a goroutine will be preempted if it is calling short system calls.
|
||||
func testPreemptionAfterSyscall(t *testing.T, syscallDuration time.Duration) {
|
||||
if runtime.GOARCH == "wasm" {
|
||||
t.Skip("no preemption on wasm yet")
|
||||
}
|
||||
|
||||
defer runtime.GOMAXPROCS(runtime.GOMAXPROCS(2))
|
||||
|
||||
interations := 10
|
||||
if testing.Short() {
|
||||
interations = 1
|
||||
}
|
||||
const (
|
||||
maxDuration = 3 * time.Second
|
||||
nroutines = 8
|
||||
)
|
||||
|
||||
for i := 0; i < interations; i++ {
|
||||
c := make(chan bool, nroutines)
|
||||
stop := uint32(0)
|
||||
|
||||
start := time.Now()
|
||||
for g := 0; g < nroutines; g++ {
|
||||
go func(stop *uint32) {
|
||||
c <- true
|
||||
for atomic.LoadUint32(stop) == 0 {
|
||||
fakeSyscall(syscallDuration)
|
||||
}
|
||||
c <- true
|
||||
}(&stop)
|
||||
}
|
||||
// wait until all goroutines have started.
|
||||
for g := 0; g < nroutines; g++ {
|
||||
<-c
|
||||
}
|
||||
atomic.StoreUint32(&stop, 1)
|
||||
// wait until all goroutines have finished.
|
||||
for g := 0; g < nroutines; g++ {
|
||||
<-c
|
||||
}
|
||||
duration := time.Since(start)
|
||||
|
||||
if duration > maxDuration {
|
||||
t.Errorf("timeout exceeded: %v (%v)", duration, maxDuration)
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
func TestPreemptionAfterSyscall(t *testing.T) {
|
||||
for _, i := range []time.Duration{10, 100, 1000} {
|
||||
d := i * time.Microsecond
|
||||
t.Run(fmt.Sprint(d), func(t *testing.T) {
|
||||
testPreemptionAfterSyscall(t, d)
|
||||
})
|
||||
}
|
||||
}
|
||||
|
Loading…
Reference in New Issue
Block a user