Commit 4bb491b1 authored by Dmitriy Vyukov's avatar Dmitriy Vyukov

runtime: improve scheduler fairness

Currently global runqueue is starved if a group of goroutines
constantly respawn each other (local runqueue never becomes empty).
Fixes #5639.

R=golang-dev, iant
CC=golang-dev
https://golang.org/cl/10042044
parent 5caf7624
...@@ -106,7 +106,7 @@ static void gfput(P*, G*); ...@@ -106,7 +106,7 @@ static void gfput(P*, G*);
static G* gfget(P*); static G* gfget(P*);
static void gfpurge(P*); static void gfpurge(P*);
static void globrunqput(G*); static void globrunqput(G*);
static G* globrunqget(P*); static G* globrunqget(P*, int32);
static P* pidleget(void); static P* pidleget(void);
static void pidleput(P*); static void pidleput(P*);
static void injectglist(G*); static void injectglist(G*);
...@@ -1024,7 +1024,7 @@ top: ...@@ -1024,7 +1024,7 @@ top:
// global runq // global runq
if(runtime·sched.runqsize) { if(runtime·sched.runqsize) {
runtime·lock(&runtime·sched); runtime·lock(&runtime·sched);
gp = globrunqget(m->p); gp = globrunqget(m->p, 0);
runtime·unlock(&runtime·sched); runtime·unlock(&runtime·sched);
if(gp) if(gp)
return gp; return gp;
...@@ -1065,7 +1065,7 @@ stop: ...@@ -1065,7 +1065,7 @@ stop:
goto top; goto top;
} }
if(runtime·sched.runqsize) { if(runtime·sched.runqsize) {
gp = globrunqget(m->p); gp = globrunqget(m->p, 0);
runtime·unlock(&runtime·sched); runtime·unlock(&runtime·sched);
return gp; return gp;
} }
...@@ -1144,6 +1144,7 @@ static void ...@@ -1144,6 +1144,7 @@ static void
schedule(void) schedule(void)
{ {
G *gp; G *gp;
uint32 tick;
if(m->locks) if(m->locks)
runtime·throw("schedule: holding locks"); runtime·throw("schedule: holding locks");
...@@ -1154,9 +1155,23 @@ top: ...@@ -1154,9 +1155,23 @@ top:
goto top; goto top;
} }
gp = runqget(m->p); gp = nil;
if(gp && m->spinning) // Check the global runnable queue once in a while to ensure fairness.
runtime·throw("schedule: spinning with local work"); // Otherwise two goroutines can completely occupy the local runqueue
// by constantly respawning each other.
tick = m->p->tick;
// This is a fancy way to say tick%61==0,
// it uses 2 MUL instructions instead of a single DIV and so is faster on modern processors.
if(tick - (((uint64)tick*0x4325c53fu)>>36)*61 == 0 && runtime·sched.runqsize > 0) {
runtime·lock(&runtime·sched);
gp = globrunqget(m->p, 1);
runtime·unlock(&runtime·sched);
}
if(gp == nil) {
gp = runqget(m->p);
if(gp && m->spinning)
runtime·throw("schedule: spinning with local work");
}
if(gp == nil) if(gp == nil)
gp = findrunnable(); gp = findrunnable();
...@@ -2167,7 +2182,7 @@ globrunqput(G *gp) ...@@ -2167,7 +2182,7 @@ globrunqput(G *gp)
// Try get a batch of G's from the global runnable queue. // Try get a batch of G's from the global runnable queue.
// Sched must be locked. // Sched must be locked.
static G* static G*
globrunqget(P *p) globrunqget(P *p, int32 max)
{ {
G *gp, *gp1; G *gp, *gp1;
int32 n; int32 n;
...@@ -2177,6 +2192,8 @@ globrunqget(P *p) ...@@ -2177,6 +2192,8 @@ globrunqget(P *p)
n = runtime·sched.runqsize/runtime·gomaxprocs+1; n = runtime·sched.runqsize/runtime·gomaxprocs+1;
if(n > runtime·sched.runqsize) if(n > runtime·sched.runqsize)
n = runtime·sched.runqsize; n = runtime·sched.runqsize;
if(max > 0 && n > max)
n = max;
runtime·sched.runqsize -= n; runtime·sched.runqsize -= n;
if(runtime·sched.runqsize == 0) if(runtime·sched.runqsize == 0)
runtime·sched.runqtail = nil; runtime·sched.runqtail = nil;
......
...@@ -8,6 +8,7 @@ import ( ...@@ -8,6 +8,7 @@ import (
"math" "math"
"runtime" "runtime"
"sync/atomic" "sync/atomic"
"syscall"
"testing" "testing"
"time" "time"
) )
...@@ -107,6 +108,55 @@ func TestBlockLocked(t *testing.T) { ...@@ -107,6 +108,55 @@ func TestBlockLocked(t *testing.T) {
} }
} }
func TestTimerFairness(t *testing.T) {
done := make(chan bool)
c := make(chan bool)
for i := 0; i < 2; i++ {
go func() {
for {
select {
case c <- true:
case <-done:
return
}
}
}()
}
timer := time.After(20 * time.Millisecond)
for {
select {
case <-c:
case <-timer:
close(done)
return
}
}
}
func TestTimerFairness2(t *testing.T) {
done := make(chan bool)
c := make(chan bool)
for i := 0; i < 2; i++ {
go func() {
timer := time.After(20 * time.Millisecond)
var buf [1]byte
for {
syscall.Read(0, buf[0:0])
select {
case c <- true:
case <-c:
case <-timer:
done <- true
return
}
}
}()
}
<-done
<-done
}
func stackGrowthRecursive(i int) { func stackGrowthRecursive(i int) {
var pad [128]uint64 var pad [128]uint64
if i != 0 && pad[0] == 0 { if i != 0 && pad[0] == 0 {
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment