Commit 4f2e382c authored by Dmitriy Vyukov's avatar Dmitriy Vyukov

runtime: dump scheduler state if GODEBUG=schedtrace is set

The schedtrace value sets dump period in milliseconds.
In default mode the trace looks as follows:
SCHED 0ms: gomaxprocs=4 idleprocs=0 threads=3 idlethreads=0 runqueue=0 [1 0 0 0]
SCHED 1001ms: gomaxprocs=4 idleprocs=3 threads=6 idlethreads=3 runqueue=0 [0 0 0 0]
SCHED 2008ms: gomaxprocs=4 idleprocs=1 threads=6 idlethreads=1 runqueue=0 [0 1 0 0]
If GODEBUG=scheddetail=1 is set as well, then the detailed trace is printed:
SCHED 0ms: gomaxprocs=4 idleprocs=0 threads=3 idlethreads=0 runqueue=0 singleproc=0 gcwaiting=1 mlocked=0 nmspinning=0 stopwait=0 sysmonwait=0
  P0: status=3 tick=1 m=0 runqsize=1/128 gfreecnt=0
  P1: status=3 tick=0 m=-1 runqsize=0/128 gfreecnt=0
  P2: status=3 tick=0 m=-1 runqsize=0/128 gfreecnt=0
  P3: status=3 tick=0 m=-1 runqsize=0/128 gfreecnt=0
  M2: p=-1 curg=-1 mallocing=0 throwing=0 gcing=0 locks=1 dying=0 helpgc=0 spinning=0 lockedg=-1
  M1: p=-1 curg=-1 mallocing=0 throwing=0 gcing=0 locks=1 dying=0 helpgc=0 spinning=0 lockedg=-1
  M0: p=0 curg=1 mallocing=0 throwing=0 gcing=0 locks=1 dying=0 helpgc=0 spinning=0 lockedg=1
  G1: status=2() m=0 lockedm=0
  G2: status=1() m=-1 lockedm=-1

R=golang-dev, raggi, rsc
CC=golang-dev
https://golang.org/cl/11435044
parent 2642c6e2
...@@ -23,10 +23,18 @@ percentage at run time. See http://golang.org/pkg/runtime/debug/#SetGCPercent. ...@@ -23,10 +23,18 @@ percentage at run time. See http://golang.org/pkg/runtime/debug/#SetGCPercent.
The GODEBUG variable controls debug output from the runtime. GODEBUG value is The GODEBUG variable controls debug output from the runtime. GODEBUG value is
a comma-separated list of name=val pairs. Supported names are: a comma-separated list of name=val pairs. Supported names are:
gctrace: setting gctrace=1 causes the garbage collector to emit a single line to standard
error at each collection, summarizing the amount of memory collected and the gctrace: setting gctrace=1 causes the garbage collector to emit a single line to standard
length of the pause. Setting gctrace=2 emits the same summary but also error at each collection, summarizing the amount of memory collected and the
repeats each collection. length of the pause. Setting gctrace=2 emits the same summary but also
repeats each collection.
schedtrace: setting schedtrace=X causes the scheduler to emit a single line to standard
error every X milliseconds, summarizing the scheduler state.
scheddetail: setting schedtrace=X and scheddetail=1 causes the scheduler to emit
detailed multiline info every X milliseconds, describing state of the scheduler,
processors, threads and goroutines.
The GOMAXPROCS variable limits the number of operating system threads that The GOMAXPROCS variable limits the number of operating system threads that
can execute user-level Go code simultaneously. There is no limit to the number of threads can execute user-level Go code simultaneously. There is no limit to the number of threads
......
...@@ -420,6 +420,8 @@ runtime·startpanic(void) ...@@ -420,6 +420,8 @@ runtime·startpanic(void)
g->writebuf = nil; g->writebuf = nil;
runtime·xadd(&runtime·panicking, 1); runtime·xadd(&runtime·panicking, 1);
runtime·lock(&paniclk); runtime·lock(&paniclk);
if(runtime·debug.schedtrace > 0 || runtime·debug.scheddetail > 0)
runtime·schedtrace(true);
runtime·freezetheworld(); runtime·freezetheworld();
} }
......
...@@ -2092,6 +2092,7 @@ procresize(int32 new) ...@@ -2092,6 +2092,7 @@ procresize(int32 new)
p = runtime·allp[i]; p = runtime·allp[i];
if(p == nil) { if(p == nil) {
p = (P*)runtime·mallocgc(sizeof(*p), 0, FlagNoInvokeGC); p = (P*)runtime·mallocgc(sizeof(*p), 0, FlagNoInvokeGC);
p->id = i;
p->status = Pgcstop; p->status = Pgcstop;
runtime·atomicstorep(&runtime·allp[i], p); runtime·atomicstorep(&runtime·allp[i], p);
} }
...@@ -2235,9 +2236,10 @@ static void ...@@ -2235,9 +2236,10 @@ static void
sysmon(void) sysmon(void)
{ {
uint32 idle, delay; uint32 idle, delay;
int64 now, lastpoll; int64 now, lastpoll, lasttrace;
G *gp; G *gp;
lasttrace = 0;
idle = 0; // how many cycles in succession we had not wokeup somebody idle = 0; // how many cycles in succession we had not wokeup somebody
delay = 0; delay = 0;
for(;;) { for(;;) {
...@@ -2248,7 +2250,8 @@ sysmon(void) ...@@ -2248,7 +2250,8 @@ sysmon(void)
if(delay > 10*1000) // up to 10ms if(delay > 10*1000) // up to 10ms
delay = 10*1000; delay = 10*1000;
runtime·usleep(delay); runtime·usleep(delay);
if(runtime·gcwaiting || runtime·atomicload(&runtime·sched.npidle) == runtime·gomaxprocs) { // TODO: fast atomic if(runtime·debug.schedtrace <= 0 &&
(runtime·gcwaiting || runtime·atomicload(&runtime·sched.npidle) == runtime·gomaxprocs)) { // TODO: fast atomic
runtime·lock(&runtime·sched); runtime·lock(&runtime·sched);
if(runtime·atomicload(&runtime·gcwaiting) || runtime·atomicload(&runtime·sched.npidle) == runtime·gomaxprocs) { if(runtime·atomicload(&runtime·gcwaiting) || runtime·atomicload(&runtime·sched.npidle) == runtime·gomaxprocs) {
runtime·atomicstore(&runtime·sched.sysmonwait, 1); runtime·atomicstore(&runtime·sched.sysmonwait, 1);
...@@ -2285,6 +2288,11 @@ sysmon(void) ...@@ -2285,6 +2288,11 @@ sysmon(void)
idle = 0; idle = 0;
else else
idle++; idle++;
if(runtime·debug.schedtrace > 0 && lasttrace + runtime·debug.schedtrace*1000000ll <= now) {
lasttrace = now;
runtime·schedtrace(runtime·debug.scheddetail);
}
} }
} }
...@@ -2397,6 +2405,84 @@ preemptone(P *p) ...@@ -2397,6 +2405,84 @@ preemptone(P *p)
return true; return true;
} }
void
runtime·schedtrace(bool detailed)
{
static int64 starttime;
int64 now;
int32 i, q, t, h, s;
int8 *fmt;
M *mp, *lockedm;
G *gp, *lockedg;
P *p;
now = runtime·nanotime();
if(starttime == 0)
starttime = now;
runtime·lock(&runtime·sched);
runtime·printf("SCHED %Dms: gomaxprocs=%d idleprocs=%d threads=%d idlethreads=%d runqueue=%d",
(now-starttime)/1000000, runtime·gomaxprocs, runtime·sched.npidle, runtime·sched.mcount,
runtime·sched.nmidle, runtime·sched.runqsize);
if(detailed) {
runtime·printf(" gcwaiting=%d nmidlelocked=%d nmspinning=%d stopwait=%d sysmonwait=%d\n",
runtime·gcwaiting, runtime·sched.nmidlelocked, runtime·sched.nmspinning,
runtime·sched.stopwait, runtime·sched.sysmonwait);
}
// We must be careful while reading data from P's, M's and G's.
// Even if we hold schedlock, most data can be changed concurrently.
// E.g. (p->m ? p->m->id : -1) can crash if p->m changes from non-nil to nil.
for(i = 0; i < runtime·gomaxprocs; i++) {
p = runtime·allp[i];
if(p == nil)
continue;
mp = p->m;
t = p->runqtail;
h = p->runqhead;
s = p->runqsize;
q = t - h;
if(q < 0)
q += s;
if(detailed)
runtime·printf(" P%d: status=%d schedtick=%d syscalltick=%d m=%d runqsize=%d/%d gfreecnt=%d\n",
i, p->status, p->schedtick, p->syscalltick, mp ? mp->id : -1, q, s, p->gfreecnt);
else {
// In non-detailed mode format lengths of per-P run queues as:
// [len1 len2 len3 len4]
fmt = " %d";
if(runtime·gomaxprocs == 1)
fmt = " [%d]\n";
else if(i == 0)
fmt = " [%d";
else if(i == runtime·gomaxprocs-1)
fmt = " %d]\n";
runtime·printf(fmt, q);
}
}
if(!detailed) {
runtime·unlock(&runtime·sched);
return;
}
for(mp = runtime·allm; mp; mp = mp->alllink) {
p = mp->p;
gp = mp->curg;
lockedg = mp->lockedg;
runtime·printf(" M%d: p=%d curg=%D mallocing=%d throwing=%d gcing=%d"
" locks=%d dying=%d helpgc=%d spinning=%d lockedg=%D\n",
mp->id, p ? p->id : -1, gp ? gp->goid : (int64)-1,
mp->mallocing, mp->throwing, mp->gcing, mp->locks, mp->dying, mp->helpgc,
mp->spinning, lockedg ? lockedg->goid : (int64)-1);
}
for(gp = runtime·allg; gp; gp = gp->alllink) {
mp = gp->m;
lockedm = gp->lockedm;
runtime·printf(" G%D: status=%d(%s) m=%d lockedm=%d\n",
gp->goid, gp->status, gp->waitreason, mp ? mp->id : -1,
lockedm ? lockedm->id : -1);
}
runtime·unlock(&runtime·sched);
}
// Put mp on midle list. // Put mp on midle list.
// Sched must be locked. // Sched must be locked.
static void static void
......
...@@ -388,6 +388,8 @@ static struct { ...@@ -388,6 +388,8 @@ static struct {
int32* value; int32* value;
} dbgvar[] = { } dbgvar[] = {
{"gctrace", &runtime·debug.gctrace}, {"gctrace", &runtime·debug.gctrace},
{"schedtrace", &runtime·debug.schedtrace},
{"scheddetail", &runtime·debug.scheddetail},
}; };
void void
......
...@@ -361,6 +361,7 @@ struct P ...@@ -361,6 +361,7 @@ struct P
{ {
Lock; Lock;
int32 id;
uint32 status; // one of Pidle/Prunning/... uint32 status; // one of Pidle/Prunning/...
P* link; P* link;
uint32 schedtick; // incremented on every scheduler call uint32 schedtick; // incremented on every scheduler call
...@@ -532,6 +533,8 @@ struct CgoMal ...@@ -532,6 +533,8 @@ struct CgoMal
struct DebugVars struct DebugVars
{ {
int32 gctrace; int32 gctrace;
int32 schedtrace;
int32 scheddetail;
}; };
/* /*
...@@ -823,6 +826,7 @@ void runtime·exit(int32); ...@@ -823,6 +826,7 @@ void runtime·exit(int32);
void runtime·breakpoint(void); void runtime·breakpoint(void);
void runtime·gosched(void); void runtime·gosched(void);
void runtime·gosched0(G*); void runtime·gosched0(G*);
void runtime·schedtrace(bool);
void runtime·park(void(*)(Lock*), Lock*, int8*); void runtime·park(void(*)(Lock*), Lock*, int8*);
void runtime·tsleep(int64, int8*); void runtime·tsleep(int64, int8*);
M* runtime·newm(void); M* runtime·newm(void);
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment