runtime: add tracing of runtime events
author    Dmitry Vyukov <dvyukov@google.com>
          Fri, 12 Dec 2014 17:41:57 +0000 (18:41 +0100)
committer Dmitry Vyukov <dvyukov@google.com>
          Wed, 28 Jan 2015 16:35:24 +0000 (16:35 +0000)
Add actual tracing of interesting runtime events.
Part of the larger tracing functionality described at:
https://docs.google.com/document/u/1/d/1FP5apqzBgr7ahCCgFO-yoVhk4YZrNIDNf9RybngBc14/pub
Full change:
https://codereview.appspot.com/146920043

Change-Id: Icccf54aea54e09350bb698ba6bf11532f9fbe6d3
Reviewed-on: https://go-review.googlesource.com/1451
Reviewed-by: Russ Cox <rsc@golang.org>
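
For orientation, the events instrumented below are written into the runtime's trace buffers and drained through ReadTrace in src/runtime/trace.go (the last hunk of this diff). The sketch below shows one way a consumer might exercise the new events; StartTrace and StopTrace are assumed to come from the previously landed tracing scaffolding of the full change linked above, not from the hunks shown here, so treat it as illustrative rather than as the final public API:

package main

import (
	"os"
	"runtime"
	"time"
)

func main() {
	// StartTrace/StopTrace/ReadTrace are assumed entry points from the full
	// tracing change linked above; this is a hedged sketch, not the final API.
	if err := runtime.StartTrace(); err != nil {
		panic(err)
	}
	f, err := os.Create("trace.out")
	if err != nil {
		panic(err)
	}
	defer f.Close()

	done := make(chan struct{})
	go func() {
		// Drain the binary trace; ReadTrace blocks until data is available
		// and returns nil once tracing has stopped and all buffers are flushed.
		for {
			data := runtime.ReadTrace()
			if data == nil {
				break
			}
			f.Write(data)
		}
		close(done)
	}()

	// Generate a few of the events instrumented in this commit: goroutine
	// creation (traceGoCreate), channel blocking (traceEvGoBlockSend /
	// traceEvGoBlockRecv), and sleeping (traceEvGoSleep).
	ch := make(chan int)
	go func() {
		time.Sleep(time.Millisecond)
		ch <- 1
	}()
	<-ch

	runtime.StopTrace()
	<-done
}
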
16 files changed:
src/runtime/chan.go
src/runtime/malloc.go
src/runtime/malloc1.go
src/runtime/mfinal.go
src/runtime/mgc.go
src/runtime/mgc0.go
src/runtime/mheap.go
src/runtime/netpoll.go
src/runtime/proc.go
src/runtime/proc1.go
src/runtime/runtime2.go
src/runtime/select.go
src/runtime/sema.go
src/runtime/stack1.go
src/runtime/time.go
src/runtime/trace.go

src/runtime/chan.go
index abe73e70a034d7389da651b9c530d4f8a1db1540..56560f94f0d343e49c4526cd9047d61066578e8a 100644 (file)
@@ -96,7 +96,7 @@ func chansend(t *chantype, c *hchan, ep unsafe.Pointer, block bool, callerpc uin
                if !block {
                        return false
                }
-               gopark(nil, nil, "chan send (nil chan)")
+               gopark(nil, nil, "chan send (nil chan)", traceEvGoStop)
                throw("unreachable")
        }
 
@@ -178,7 +178,7 @@ func chansend(t *chantype, c *hchan, ep unsafe.Pointer, block bool, callerpc uin
                mysg.selectdone = nil
                gp.param = nil
                c.sendq.enqueue(mysg)
-               goparkunlock(&c.lock, "chan send")
+               goparkunlock(&c.lock, "chan send", traceEvGoBlockSend)
 
                // someone woke us up.
                if mysg != gp.waiting {
@@ -217,7 +217,7 @@ func chansend(t *chantype, c *hchan, ep unsafe.Pointer, block bool, callerpc uin
                mysg.elem = nil
                mysg.selectdone = nil
                c.sendq.enqueue(mysg)
-               goparkunlock(&c.lock, "chan send")
+               goparkunlock(&c.lock, "chan send", traceEvGoBlockSend)
 
                // someone woke us up - try again
                if mysg.releasetime > 0 {
@@ -340,7 +340,7 @@ func chanrecv(t *chantype, c *hchan, ep unsafe.Pointer, block bool) (selected, r
                if !block {
                        return
                }
-               gopark(nil, nil, "chan receive (nil chan)")
+               gopark(nil, nil, "chan receive (nil chan)", traceEvGoStop)
                throw("unreachable")
        }
 
@@ -414,7 +414,7 @@ func chanrecv(t *chantype, c *hchan, ep unsafe.Pointer, block bool) (selected, r
                mysg.selectdone = nil
                gp.param = nil
                c.recvq.enqueue(mysg)
-               goparkunlock(&c.lock, "chan receive")
+               goparkunlock(&c.lock, "chan receive", traceEvGoBlockRecv)
 
                // someone woke us up
                if mysg != gp.waiting {
@@ -471,7 +471,7 @@ func chanrecv(t *chantype, c *hchan, ep unsafe.Pointer, block bool) (selected, r
                mysg.selectdone = nil
 
                c.recvq.enqueue(mysg)
-               goparkunlock(&c.lock, "chan receive")
+               goparkunlock(&c.lock, "chan receive", traceEvGoBlockRecv)
 
                // someone woke us up - try again
                if mysg.releasetime > 0 {
src/runtime/malloc.go
index 69eb090706427842f254bf431f7b96ae389c198a..f827b9c418fb3fa82fe1d554fc05da25c128689c 100644 (file)
@@ -368,6 +368,12 @@ func gcwork(force int32) {
        if force == 0 {
                gctimer.cycle.sweepterm = nanotime()
        }
+
+       if trace.enabled {
+               traceGoSched()
+               traceGCStart()
+       }
+
        // Pick up the remaining unswept/not being swept spans before we STW
        for gosweepone() != ^uintptr(0) {
                sweep.nbgsweep++
@@ -423,6 +429,11 @@ func gcwork(force int32) {
                gccheckmark_m(startTime, eagersweep)
        })
 
+       if trace.enabled {
+               traceGCDone()
+               traceGoStart()
+       }
+
        // all done
        mp.gcing = 0
 
src/runtime/malloc1.go
index 7b5907b2565a9313a632d8c9c2bf8150e61507c3..4d0754ba9d04e97017bd2766089d4c23ca9ce347 100644 (file)
@@ -71,6 +71,9 @@ func purgecachedstats(c *mcache) {
        h := &mheap_
        memstats.heap_alloc += uint64(c.local_cachealloc)
        c.local_cachealloc = 0
+       if trace.enabled {
+               traceHeapAlloc()
+       }
        memstats.tinyallocs += uint64(c.local_tinyallocs)
        c.local_tinyallocs = 0
        memstats.nlookup += uint64(c.local_nlookup)
src/runtime/mfinal.go
index 3cc9a4e4c35a4348bc4eff55f9e7849d66bf53cb..28afa0dfab1215f168dbf39342bd78c7ab0843f5 100644 (file)
@@ -127,7 +127,7 @@ func runfinq() {
                        fing = gp
                        fingwait = true
                        gp.issystem = true
-                       goparkunlock(&finlock, "finalizer wait")
+                       goparkunlock(&finlock, "finalizer wait", traceEvGoBlock)
                        gp.issystem = false
                        continue
                }
src/runtime/mgc.go
index 6436a3f786cd179dac53bbd3bb143c7cd8adb902..8cc060c2cf57e612cbef495e76d19b9a79e0b2fc 100644 (file)
@@ -1003,6 +1003,11 @@ func mSpan_Sweep(s *mspan, preserve bool) bool {
                print("MSpan_Sweep: state=", s.state, " sweepgen=", s.sweepgen, " mheap.sweepgen=", sweepgen, "\n")
                throw("MSpan_Sweep: bad span state")
        }
+
+       if trace.enabled {
+               traceGCSweepStart()
+       }
+
        cl := s.sizeclass
        size := s.elemsize
        res := false
@@ -1132,6 +1137,10 @@ func mSpan_Sweep(s *mspan, preserve bool) bool {
                res = mCentral_FreeSpan(&mheap_.central[cl].mcentral, s, int32(nfree), head, end, preserve)
                // MCentral_FreeSpan updates sweepgen
        }
+       if trace.enabled {
+               traceGCSweepDone()
+               traceNextGC()
+       }
        return res
 }
 
@@ -1212,12 +1221,20 @@ func gchelper() {
        _g_.m.traceback = 2
        gchelperstart()
 
+       if trace.enabled {
+               traceGCScanStart()
+       }
+
        // parallel mark for over GC roots
        parfordo(work.markfor)
        if gcphase != _GCscan {
                scanblock(0, 0, nil) // blocks in getfull
        }
 
+       if trace.enabled {
+               traceGCScanDone()
+       }
+
        nproc := work.nproc // work.nproc can change right after we increment work.ndone
        if xadd(&work.ndone, +1) == nproc-1 {
                notewakeup(&work.alldone)
@@ -1540,6 +1557,10 @@ func gc(start_time int64, eagersweep bool) {
                gp.gcworkdone = false // set to true in gcphasework
        }
 
+       if trace.enabled {
+               traceGCScanStart()
+       }
+
        parforsetup(work.markfor, work.nproc, uint32(_RootCount+allglen), nil, false, markroot)
        if work.nproc > 1 {
                noteclear(&work.alldone)
@@ -1572,6 +1593,10 @@ func gc(start_time int64, eagersweep bool) {
                notesleep(&work.alldone)
        }
 
+       if trace.enabled {
+               traceGCScanDone()
+       }
+
        shrinkfinish()
 
        cachestats()
@@ -1581,6 +1606,9 @@ func gc(start_time int64, eagersweep bool) {
        // conservatively set next_gc to high value assuming that everything is live
        // concurrent/lazy sweep will reduce this number while discovering new garbage
        memstats.next_gc = memstats.heap_alloc + memstats.heap_alloc*uint64(gcpercent)/100
+       if trace.enabled {
+               traceNextGC()
+       }
 
        t4 := nanotime()
        atomicstore64(&memstats.last_gc, uint64(unixnanotime())) // must be Unix time to make sense to user
src/runtime/mgc0.go
index 5959396bed9a36926697d13a63b341af750ba1f2..bbd786d519949724f47175fa1c32b3be93392e6b 100644 (file)
@@ -67,7 +67,7 @@ func backgroundgc() {
                gcwork(0)
                lock(&bggc.lock)
                bggc.working = 0
-               goparkunlock(&bggc.lock, "Concurrent GC wait")
+               goparkunlock(&bggc.lock, "Concurrent GC wait", traceEvGoBlock)
        }
 }
 
@@ -88,6 +88,6 @@ func bgsweep() {
                        continue
                }
                sweep.parked = true
-               goparkunlock(&gclock, "GC sweep wait")
+               goparkunlock(&gclock, "GC sweep wait", traceEvGoBlock)
        }
 }
src/runtime/mheap.go
index 1ff661c9813184af8a36d33b2cea983b45e83cd4..11bc809ec1d036a12957c8494f98afb6855ad99e 100644 (file)
@@ -217,6 +217,9 @@ func mHeap_Alloc_m(h *mheap, npage uintptr, sizeclass int32, large bool) *mspan
                        }
                }
        }
+       if trace.enabled {
+               traceHeapAlloc()
+       }
        unlock(&h.lock)
        return s
 }
@@ -440,6 +443,9 @@ func mHeap_Free(h *mheap, s *mspan, acct int32) {
                        memstats.heap_objects--
                }
                mHeap_FreeSpanLocked(h, s, true, true)
+               if trace.enabled {
+                       traceHeapAlloc()
+               }
                unlock(&h.lock)
        })
 }
src/runtime/netpoll.go
index 3ef45064914c5ccd4bc0e81efeac0c513e3d2103..8ea0878ca27b161b634286855b241ecb9583b712 100644 (file)
@@ -71,7 +71,7 @@ type pollCache struct {
 
 var (
        netpollInited uint32
-       pollcache pollCache
+       pollcache     pollCache
 )
 
 //go:linkname net_runtime_pollServerInit net.runtime_pollServerInit
@@ -333,7 +333,7 @@ func netpollblock(pd *pollDesc, mode int32, waitio bool) bool {
        // this is necessary because runtime_pollUnblock/runtime_pollSetDeadline/deadlineimpl
        // do the opposite: store to closing/rd/wd, membarrier, load of rg/wg
        if waitio || netpollcheckerr(pd, mode) == 0 {
-               gopark(netpollblockcommit, unsafe.Pointer(gpp), "IO wait")
+               gopark(netpollblockcommit, unsafe.Pointer(gpp), "IO wait", traceEvGoBlockNet)
        }
        // be careful to not lose concurrent READY notification
        old := xchguintptr(gpp, 0)
src/runtime/proc.go
index 03ba00fd97ee540963e34bab36b73acdeb50dba4..3d84968b10f88f63e2ed569ac9fc2e063986759f 100644 (file)
@@ -93,7 +93,7 @@ func main() {
        // let the other goroutine finish printing the panic trace.
        // Once it does, it will exit. See issue 3934.
        if panicking != 0 {
-               gopark(nil, nil, "panicwait")
+               gopark(nil, nil, "panicwait", traceEvGoStop)
        }
 
        exit(0)
@@ -117,7 +117,7 @@ func forcegchelper() {
                        throw("forcegc: phase error")
                }
                atomicstore(&forcegc.idle, 1)
-               goparkunlock(&forcegc.lock, "force gc (idle)")
+               goparkunlock(&forcegc.lock, "force gc (idle)", traceEvGoBlock)
                // this goroutine is explicitly resumed by sysmon
                if debug.gctrace > 0 {
                        println("GC forced")
@@ -136,7 +136,7 @@ func Gosched() {
 
 // Puts the current goroutine into a waiting state and calls unlockf.
 // If unlockf returns false, the goroutine is resumed.
-func gopark(unlockf func(*g, unsafe.Pointer) bool, lock unsafe.Pointer, reason string) {
+func gopark(unlockf func(*g, unsafe.Pointer) bool, lock unsafe.Pointer, reason string, traceEv byte) {
        mp := acquirem()
        gp := mp.curg
        status := readgstatus(gp)
@@ -146,6 +146,7 @@ func gopark(unlockf func(*g, unsafe.Pointer) bool, lock unsafe.Pointer, reason s
        mp.waitlock = lock
        mp.waitunlockf = *(*unsafe.Pointer)(unsafe.Pointer(&unlockf))
        gp.waitreason = reason
+       mp.waittraceev = traceEv
        releasem(mp)
        // can't do anything that might move the G between Ms here.
        mcall(park_m)
@@ -153,8 +154,8 @@ func gopark(unlockf func(*g, unsafe.Pointer) bool, lock unsafe.Pointer, reason s
 
 // Puts the current goroutine into a waiting state and unlocks the lock.
 // The goroutine can be made runnable again by calling goready(gp).
-func goparkunlock(lock *mutex, reason string) {
-       gopark(parkunlock_c, unsafe.Pointer(lock), reason)
+func goparkunlock(lock *mutex, reason string, traceEv byte) {
+       gopark(parkunlock_c, unsafe.Pointer(lock), reason, traceEv)
 }
 
 func goready(gp *g) {
src/runtime/proc1.go
index 39e80945784860f6309c4115ec1be8ca88878281..fcff60541de33aef519bffe591bc34e8a0c6f745 100644 (file)
@@ -196,6 +196,10 @@ func mcommoninit(mp *m) {
 
 // Mark gp ready to run.
 func ready(gp *g) {
+       if trace.enabled {
+               traceGoUnpark(gp)
+       }
+
        status := readgstatus(gp)
 
        // Mark runnable.
@@ -263,6 +267,7 @@ func helpgc(nproc int32) {
                        throw("gcprocs inconsistency")
                }
                mp.helpgc = n
+               mp.p = allp[pos]
                mp.mcache = allp[pos].mcache
                pos++
                notewakeup(&mp.park)
@@ -604,6 +609,11 @@ func stoptheworld() {
                p := allp[i]
                s := p.status
                if s == _Psyscall && cas(&p.status, s, _Pgcstop) {
+                       if trace.enabled {
+                               traceGoSysBlock(p)
+                               traceProcStop(p)
+                       }
+                       p.syscalltick++
                        sched.stopwait--
                }
        }
@@ -1052,6 +1062,7 @@ retry:
                gchelper()
                _g_.m.helpgc = 0
                _g_.m.mcache = nil
+               _g_.m.p = nil
                goto retry
        }
        acquirep(_g_.m.nextp)
@@ -1234,6 +1245,10 @@ func execute(gp *g) {
                resetcpuprofiler(hz)
        }
 
+       if trace.enabled {
+               traceGoStart()
+       }
+
        gogo(&gp.sched)
 }
 
@@ -1272,6 +1287,9 @@ top:
        if gp := netpoll(false); gp != nil { // non-blocking
                injectglist(gp.schedlink)
                casgstatus(gp, _Gwaiting, _Grunnable)
+               if trace.enabled {
+                       traceGoUnpark(gp)
+               }
                return gp
        }
 
@@ -1355,6 +1373,9 @@ stop:
                                acquirep(_p_)
                                injectglist(gp.schedlink)
                                casgstatus(gp, _Gwaiting, _Grunnable)
+                               if trace.enabled {
+                                       traceGoUnpark(gp)
+                               }
                                return gp
                        }
                        injectglist(gp)
@@ -1391,6 +1412,11 @@ func injectglist(glist *g) {
        if glist == nil {
                return
        }
+       if trace.enabled {
+               for gp := glist; gp != nil; gp = gp.schedlink {
+                       traceGoUnpark(gp)
+               }
+       }
        lock(&sched.lock)
        var n int
        for n = 0; glist != nil; n++ {
@@ -1426,17 +1452,27 @@ top:
        }
 
        var gp *g
-       // Check the global runnable queue once in a while to ensure fairness.
-       // Otherwise two goroutines can completely occupy the local runqueue
-       // by constantly respawning each other.
-       if _g_.m.p.schedtick%61 == 0 && sched.runqsize > 0 {
-               lock(&sched.lock)
-               gp = globrunqget(_g_.m.p, 1)
-               unlock(&sched.lock)
+       if trace.enabled || trace.shutdown {
+               gp = traceReader()
                if gp != nil {
+                       casgstatus(gp, _Gwaiting, _Grunnable)
+                       traceGoUnpark(gp)
                        resetspinning()
                }
        }
+       if gp == nil {
+               // Check the global runnable queue once in a while to ensure fairness.
+               // Otherwise two goroutines can completely occupy the local runqueue
+               // by constantly respawning each other.
+               if _g_.m.p.schedtick%61 == 0 && sched.runqsize > 0 {
+                       lock(&sched.lock)
+                       gp = globrunqget(_g_.m.p, 1)
+                       unlock(&sched.lock)
+                       if gp != nil {
+                               resetspinning()
+                       }
+               }
+       }
        if gp == nil {
                gp = runqget(_g_.m.p)
                if gp != nil && _g_.m.spinning {
@@ -1476,11 +1512,12 @@ func dropg() {
 
 // Puts the current goroutine into a waiting state and calls unlockf.
 // If unlockf returns false, the goroutine is resumed.
-func park(unlockf func(*g, unsafe.Pointer) bool, lock unsafe.Pointer, reason string) {
+func park(unlockf func(*g, unsafe.Pointer) bool, lock unsafe.Pointer, reason string, traceev byte) {
        _g_ := getg()
 
        _g_.m.waitlock = lock
        _g_.m.waitunlockf = *(*unsafe.Pointer)(unsafe.Pointer(&unlockf))
+       _g_.m.waittraceev = traceev
        _g_.waitreason = reason
        mcall(park_m)
 }
@@ -1492,14 +1529,18 @@ func parkunlock_c(gp *g, lock unsafe.Pointer) bool {
 
 // Puts the current goroutine into a waiting state and unlocks the lock.
 // The goroutine can be made runnable again by calling ready(gp).
-func parkunlock(lock *mutex, reason string) {
-       park(parkunlock_c, unsafe.Pointer(lock), reason)
+func parkunlock(lock *mutex, reason string, traceev byte) {
+       park(parkunlock_c, unsafe.Pointer(lock), reason, traceev)
 }
 
 // park continuation on g0.
 func park_m(gp *g) {
        _g_ := getg()
 
+       if trace.enabled {
+               traceGoPark(_g_.m.waittraceev, gp)
+       }
+
        casgstatus(gp, _Grunning, _Gwaiting)
        dropg()
 
@@ -1509,6 +1550,9 @@ func park_m(gp *g) {
                _g_.m.waitunlockf = nil
                _g_.m.waitlock = nil
                if !ok {
+                       if trace.enabled {
+                               traceGoUnpark(gp)
+                       }
                        casgstatus(gp, _Gwaiting, _Grunnable)
                        execute(gp) // Schedule it back, never returns.
                }
@@ -1516,8 +1560,7 @@ func park_m(gp *g) {
        schedule()
 }
 
-// Gosched continuation on g0.
-func gosched_m(gp *g) {
+func goschedImpl(gp *g) {
        status := readgstatus(gp)
        if status&^_Gscan != _Grunning {
                dumpgstatus(gp)
@@ -1532,6 +1575,21 @@ func gosched_m(gp *g) {
        schedule()
 }
 
+// Gosched continuation on g0.
+func gosched_m(gp *g) {
+       if trace.enabled {
+               traceGoSched()
+       }
+       goschedImpl(gp)
+}
+
+func gopreempt_m(gp *g) {
+       if trace.enabled {
+               traceGoPreempt()
+       }
+       goschedImpl(gp)
+}
+
 // Finishes execution of the current goroutine.
 // Must be NOSPLIT because it is called from Go. (TODO - probably not anymore)
 //go:nosplit
@@ -1539,6 +1597,9 @@ func goexit1() {
        if raceenabled {
                racegoend()
        }
+       if trace.enabled {
+               traceGoEnd()
+       }
        mcall(goexit0)
 }
 
@@ -1603,6 +1664,20 @@ func save(pc, sp uintptr) {
 // from a function further up in the call stack than the parent, as g->syscallsp
 // must always point to a valid stack frame. entersyscall below is the normal
 // entry point for syscalls, which obtains the SP and PC from the caller.
+//
+// Syscall tracing:
+// At the start of a syscall we emit traceGoSysCall to capture the stack trace.
+// If the syscall does not block, that is it, we do not emit any other events.
+// If the syscall blocks (that is, P is retaken), retaker emits traceGoSysBlock;
+// when syscall returns we emit traceGoSysExit and when the goroutine starts running
+// (potentially instantly, if exitsyscallfast returns true) we emit traceGoStart.
+// To ensure that traceGoSysExit is emitted strictly after traceGoSysBlock,
+// we remember current value of syscalltick in m (_g_.m.syscalltick = _g_.m.p.syscalltick),
+// whoever emits traceGoSysBlock increments p.syscalltick afterwards;
+// and we wait for the increment before emitting traceGoSysExit.
+// Note that the increment is done even if tracing is not enabled,
+// because tracing can be enabled in the middle of syscall. We don't want the wait to hang.
+//
 //go:nosplit
 func reentersyscall(pc, sp uintptr) {
        _g_ := getg()
@@ -1611,6 +1686,10 @@ func reentersyscall(pc, sp uintptr) {
        // but can have inconsistent g->sched, do not let GC observe it.
        _g_.m.locks++
 
+       if trace.enabled {
+               systemstack(traceGoSysCall)
+       }
+
        // Entersyscall must not call any function that might split/grow the stack.
        // (See details in comment above.)
        // Catch calls that might, by replacing the stack guard with something that
@@ -1635,6 +1714,7 @@ func reentersyscall(pc, sp uintptr) {
                save(pc, sp)
        }
 
+       _g_.m.syscalltick = _g_.m.p.syscalltick
        _g_.m.mcache = nil
        _g_.m.p.m = nil
        atomicstore(&_g_.m.p.status, _Psyscall)
@@ -1667,9 +1747,15 @@ func entersyscall_sysmon() {
 
 func entersyscall_gcwait() {
        _g_ := getg()
+       _p_ := _g_.m.p
 
        lock(&sched.lock)
-       if sched.stopwait > 0 && cas(&_g_.m.p.status, _Psyscall, _Pgcstop) {
+       if sched.stopwait > 0 && cas(&_p_.status, _Psyscall, _Pgcstop) {
+               if trace.enabled {
+                       traceGoSysBlock(_p_)
+                       traceProcStop(_p_)
+               }
+               _p_.syscalltick++
                if sched.stopwait--; sched.stopwait == 0 {
                        notewakeup(&sched.stopnote)
                }
@@ -1685,6 +1771,8 @@ func entersyscallblock(dummy int32) {
        _g_.m.locks++ // see comment in entersyscall
        _g_.throwsplit = true
        _g_.stackguard0 = stackPreempt // see comment in entersyscall
+       _g_.m.syscalltick = _g_.m.p.syscalltick
+       _g_.m.p.syscalltick++
 
        // Leave SP around for GC and traceback.
        pc := getcallerpc(unsafe.Pointer(&dummy))
@@ -1718,6 +1806,10 @@ func entersyscallblock(dummy int32) {
 }
 
 func entersyscallblock_handoff() {
+       if trace.enabled {
+               traceGoSysCall()
+               traceGoSysBlock(getg().m.p)
+       }
        handoffp(releasep())
 }
 
@@ -1735,10 +1827,16 @@ func exitsyscall(dummy int32) {
        }
 
        _g_.waitsince = 0
+       oldp := _g_.m.p
        if exitsyscallfast() {
                if _g_.m.mcache == nil {
                        throw("lost mcache")
                }
+               if trace.enabled {
+                       if oldp != _g_.m.p || _g_.m.syscalltick != _g_.m.p.syscalltick {
+                               systemstack(traceGoStart)
+                       }
+               }
                // There's a cpu for us, so we can run.
                _g_.m.p.syscalltick++
                // We need to cas the status and scan before resuming...
@@ -1759,6 +1857,15 @@ func exitsyscall(dummy int32) {
                return
        }
 
+       if trace.enabled {
+               // Wait till traceGoSysBlock event is emitted.
+               // This ensures consistency of the trace (the goroutine is started after it is blocked).
+               for oldp != nil && oldp.syscalltick == _g_.m.syscalltick {
+                       osyield()
+               }
+               systemstack(traceGoSysExit)
+       }
+
        _g_.m.locks--
 
        // Call the scheduler.
@@ -1795,16 +1902,41 @@ func exitsyscallfast() bool {
                // There's a cpu for us, so we can run.
                _g_.m.mcache = _g_.m.p.mcache
                _g_.m.p.m = _g_.m
+               if _g_.m.syscalltick != _g_.m.p.syscalltick {
+                       if trace.enabled {
+                               // The p was retaken and then entered a syscall again (since _g_.m.syscalltick has changed).
+                               // traceGoSysBlock for this syscall was already emitted,
+                               // but here we effectively retake the p from the new syscall running on the same p.
+                               systemstack(func() {
+                                       // Denote blocking of the new syscall.
+                                       traceGoSysBlock(_g_.m.p)
+                                       // Denote completion of the current syscall.
+                                       traceGoSysExit()
+                               })
+                       }
+                       _g_.m.p.syscalltick++
+               }
                return true
        }
 
        // Try to get any other idle P.
+       oldp := _g_.m.p
        _g_.m.mcache = nil
        _g_.m.p = nil
        if sched.pidle != nil {
                var ok bool
                systemstack(func() {
                        ok = exitsyscallfast_pidle()
+                       if ok && trace.enabled {
+                               if oldp != nil {
+                                       // Wait till traceGoSysBlock event is emitted.
+                                       // This ensures consistency of the trace (the goroutine is started after it is blocked).
+                                       for oldp.syscalltick == _g_.m.syscalltick {
+                                               osyield()
+                                       }
+                               }
+                               traceGoSysExit()
+                       }
                })
                if ok {
                        return true
@@ -1984,6 +2116,7 @@ func newproc1(fn *funcval, argp *uint8, narg int32, nret int32, callerpc uintptr
        newg.sched.g = guintptr(unsafe.Pointer(newg))
        gostartcallfn(&newg.sched, fn)
        newg.gopc = callerpc
+       newg.startpc = fn.fn
        casgstatus(newg, _Gdead, _Grunnable)
 
        if _p_.goidcache == _p_.goidcacheend {
@@ -1999,6 +2132,9 @@ func newproc1(fn *funcval, argp *uint8, narg int32, nret int32, callerpc uintptr
        if raceenabled {
                newg.racectx = racegostart(callerpc)
        }
+       if trace.enabled {
+               traceGoCreate(newg, newg.startpc)
+       }
        runqput(_p_, newg)
 
        if atomicload(&sched.npidle) != 0 && atomicload(&sched.nmspinning) == 0 && unsafe.Pointer(fn.fn) != unsafe.Pointer(funcPC(main)) { // TODO: fast atomic
@@ -2380,6 +2516,9 @@ func procresize(new int32) *p {
        if old < 0 || old > _MaxGomaxprocs || new <= 0 || new > _MaxGomaxprocs {
                throw("procresize: invalid arg")
        }
+       if trace.enabled {
+               traceGomaxprocs(new)
+       }
 
        // initialize new P's
        for i := int32(0); i < new; i++ {
@@ -2405,6 +2544,14 @@ func procresize(new int32) *p {
        // free unused P's
        for i := new; i < old; i++ {
                p := allp[i]
+               if trace.enabled {
+                       if p == getg().m.p {
+                               // moving to p[0], pretend that we were descheduled
+                               // and then scheduled again to keep the trace sane.
+                               traceGoSched()
+                               traceProcStop(p)
+                       }
+               }
                // move all runable goroutines to the global queue
                for p.runqhead != p.runqtail {
                        // pop from tail of local queue
@@ -2421,6 +2568,7 @@ func procresize(new int32) *p {
                freemcache(p.mcache)
                p.mcache = nil
                gfpurge(p)
+               traceProcFree(p)
                p.status = _Pdead
                // can't free P itself because it can be referenced by an M in syscall
        }
@@ -2440,6 +2588,9 @@ func procresize(new int32) *p {
                p.m = nil
                p.status = _Pidle
                acquirep(p)
+               if trace.enabled {
+                       traceGoStart()
+               }
        }
        var runnablePs *p
        for i := new - 1; i >= 0; i-- {
@@ -2480,6 +2631,10 @@ func acquirep(_p_ *p) {
        _g_.m.p = _p_
        _p_.m = _g_.m
        _p_.status = _Prunning
+
+       if trace.enabled {
+               traceProcStart()
+       }
 }
 
 // Disassociate p and the current m.
@@ -2494,6 +2649,9 @@ func releasep() *p {
                print("releasep: m=", _g_.m, " m->p=", _g_.m.p, " p->m=", _p_.m, " m->mcache=", _g_.m.mcache, " p->mcache=", _p_.mcache, " p->status=", _p_.status, "\n")
                throw("releasep: invalid p state")
        }
+       if trace.enabled {
+               traceProcStop(_g_.m.p)
+       }
        _g_.m.p = nil
        _g_.m.mcache = nil
        _p_.m = nil
@@ -2713,7 +2871,12 @@ func retake(now int64) uint32 {
                        // increment nmidle and report deadlock.
                        incidlelocked(-1)
                        if cas(&_p_.status, s, _Pidle) {
+                               if trace.enabled {
+                                       traceGoSysBlock(_p_)
+                                       traceProcStop(_p_)
+                               }
                                n++
+                               _p_.syscalltick++
                                handoffp(_p_)
                        }
                        incidlelocked(1)
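
The syscalltick handshake described in the reentersyscall comment above (and used in stoptheworld, entersyscall_gcwait, exitsyscall, exitsyscallfast, and retake in this file) can be modeled in isolation. The sketch below is illustrative only — plain Go with assumed toy names, not runtime code — and shows why traceGoSysExit can never be observed before traceGoSysBlock: the goroutine leaving the syscall spins until it sees the tick incremented by whoever emitted traceGoSysBlock. As the comment notes, the increment happens even when tracing is disabled, so a trace enabled mid-syscall never makes this wait hang.

package main

import (
	"fmt"
	"runtime"
	"sync/atomic"
)

// toyP is a stand-in for the runtime's p, keeping only the field
// relevant to the handshake.
type toyP struct{ syscalltick uint32 }

func main() {
	p := &toyP{}

	// reentersyscall side: snapshot the tick before entering the syscall
	// (mirrors _g_.m.syscalltick = _g_.m.p.syscalltick in the diff above).
	msyscalltick := atomic.LoadUint32(&p.syscalltick)

	go func() {
		// retaker / stoptheworld side: "emit" traceGoSysBlock, then bump the tick.
		fmt.Println("traceGoSysBlock")
		atomic.AddUint32(&p.syscalltick, 1)
	}()

	// exitsyscall side: wait until the tick has moved before "emitting"
	// traceGoSysExit, so the exit event is strictly ordered after the block event.
	for atomic.LoadUint32(&p.syscalltick) == msyscalltick {
		runtime.Gosched() // stands in for osyield()
	}
	fmt.Println("traceGoSysExit")
}
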
src/runtime/runtime2.go
index f0f8c1abc3ab920ad2654dc4a726915f79802703..c71a3c31435a54758ad67eebecd31d0ea43d39cb 100644 (file)
@@ -277,6 +277,8 @@ type m struct {
        traceback     uint8
        waitunlockf   unsafe.Pointer // todo go func(*g, unsafe.pointer) bool
        waitlock      unsafe.Pointer
+       waittraceev   byte
+       syscalltick   uint32
        //#ifdef GOOS_windows
        thread uintptr // thread handle
        // these are here because they are too large to be on the stack
src/runtime/select.go
index 20dd2995b667b92a582eefd873b487bae362cfe9..34fda16ef890ddb9f475487df44f2003300978bb 100644 (file)
@@ -173,7 +173,7 @@ func selparkcommit(gp *g, sel unsafe.Pointer) bool {
 }
 
 func block() {
-       gopark(nil, nil, "select (no cases)") // forever
+       gopark(nil, nil, "select (no cases)", traceEvGoStop) // forever
 }
 
 // overwrites return pc on stack to signal which case of the select
@@ -363,7 +363,7 @@ loop:
 
        // wait for someone to wake us up
        gp.param = nil
-       gopark(selparkcommit, unsafe.Pointer(sel), "select")
+       gopark(selparkcommit, unsafe.Pointer(sel), "select", traceEvGoBlockSelect)
 
        // someone woke us up
        sellock(sel)
src/runtime/sema.go
index 35a126476272eba69de6588bb72fa78f7f09c851..34852ea8354d2581c96aa57449c20e7641a72190 100644 (file)
@@ -97,7 +97,7 @@ func semacquire(addr *uint32, profile bool) {
                // Any semrelease after the cansemacquire knows we're waiting
                // (we set nwait above), so go to sleep.
                root.queue(addr, s)
-               goparkunlock(&root.lock, "semacquire")
+               goparkunlock(&root.lock, "semacquire", traceEvGoBlockSync)
                if cansemacquire(addr) {
                        break
                }
@@ -234,7 +234,7 @@ func syncsemacquire(s *syncSema) {
                        s.tail.next = w
                }
                s.tail = w
-               goparkunlock(&s.lock, "semacquire")
+               goparkunlock(&s.lock, "semacquire", traceEvGoBlockCond)
                if t0 != 0 {
                        blockevent(int64(w.releasetime)-t0, 2)
                }
@@ -273,7 +273,7 @@ func syncsemrelease(s *syncSema, n uint32) {
                        s.tail.next = w
                }
                s.tail = w
-               goparkunlock(&s.lock, "semarelease")
+               goparkunlock(&s.lock, "semarelease", traceEvGoBlockCond)
                releaseSudog(w)
        } else {
                unlock(&s.lock)
src/runtime/stack1.go
index 513f27d143345cf401b85ff37956abe33588d2f7..dda39ce48181984522d41f90044b6061108747a2 100644 (file)
@@ -721,7 +721,7 @@ func newstack() {
 
                // Act like goroutine called runtime.Gosched.
                casgstatus(gp, _Gwaiting, _Grunning)
-               gosched_m(gp) // never return
+               gopreempt_m(gp) // never return
        }
 
        // Allocate a bigger segment and move the stack.
src/runtime/time.go
index 5917d7ce04d95f7a920670186b0e6ed68de2d04d..50895ca8ec7d7d743020fafef45732b84319ace9 100644 (file)
@@ -56,7 +56,7 @@ func timeSleep(ns int64) {
        t.arg = getg()
        lock(&timers.lock)
        addtimerLocked(t)
-       goparkunlock(&timers.lock, "sleep")
+       goparkunlock(&timers.lock, "sleep", traceEvGoSleep)
 }
 
 // startTimer adds t to the timer heap.
@@ -200,7 +200,7 @@ func timerproc() {
                if delta < 0 || faketime > 0 {
                        // No timers left - put goroutine to sleep.
                        timers.rescheduling = true
-                       goparkunlock(&timers.lock, "timer goroutine (idle)")
+                       goparkunlock(&timers.lock, "timer goroutine (idle)", traceEvGoBlock)
                        continue
                }
                // At least one timer pending.  Sleep until then.
src/runtime/trace.go
index 17d029806cb08c91c9d5e2a8a5e3461fd042b9e4..032bef4e770026994c50e209703cdc6e979c8baf 100644 (file)
@@ -292,7 +292,7 @@ func ReadTrace() []byte {
        // Wait for new data.
        if trace.fullHead == nil && !trace.shutdown {
                trace.reader = getg()
-               goparkunlock(&trace.lock, "trace reader (blocked)" /*, traceEvGoBlock*/)
+               goparkunlock(&trace.lock, "trace reader (blocked)", traceEvGoBlock)
                lock(&trace.lock)
        }
        // Write a buffer.