我可能并不会使用golang goroutine

有关goroutine的问题，大多数集中在

它跟线程有啥区别？原理是啥？
都说他好，他好在哪里？
使用上面有啥注意的？

等等,或许我们还有更多疑问，但是先从最基础的开始吧

package mainimport ("fmt")func worker(stop chan bool) {for i:=0;i<10;i++ {fmt.Println("干活....")}stop <- true}func main() {stop := make(chan bool)go worker(stop)<- stop}复制代码

我们在main中新起了一个goroutine来干活。后台实现是runtime.newproc调用,函数体如下

// 使用siz字节参数创建一个运行fn的新g。 // 将其放在g等待运行的队列中。 编译器将go语句转换为对此的调用。 // 无法拆分堆栈，因为它假定参数在＆fn;之后顺序可用。 // 如果发生堆栈拆分，则不会复制它们。//go:nosplitfunc newproc(siz int32, fn *funcval) {    // 从 fn 的地址增加一个指针的长度，从而获取第一参数地址argp := add(unsafe.Pointer(&fn), sys.PtrSize)// 获取当前的运行的ggp := getg()// getcallerpc返回其调用方的程序计数器（PC）。用于存放下一条指令所在单元的地址的地方。pc := getcallerpc()// systemstack在系统堆栈上运行// 如果从每个OS线程（g0）堆栈调用systemstack// ，或者从信号处理（gsignal）堆栈调用systemstack ，// systemstack直接调用fn并返回。// 否则，从普通goroutine的有限堆栈中调用systemstack。// 在这种情况下，系统堆栈切换到每个OS线程堆栈，调用fn，然后切回。// 通常使用func字面量作为参数，以便与调用系统堆栈周围的代码共享输入和输出systemstack(func() {    // 原型：func newproc1(fn *funcval, argp *uint8, narg int32, callergp *g, callerpc uintptr)     // 创建一个新的g，运行fn，其中narg个字节的参数从argp开始。    // callerpc是创建它的go语句的地址。新g放入g等待运行的队列中。newproc1(fn, (*uint8)(argp), siz, gp, pc)})}复制代码

newproc1是重头戏，也比较复杂，可能目前还不能看的很明白，但是，大致先了解一下：

func newproc1(fn *funcval, argp *uint8, narg int32, callergp *g, callerpc uintptr) {_g_ := getg()if fn == nil {_g_.m.throwing = -1 // do not dump full stacksthrow("go of nil func value")}_g_.m.locks++ // disable preemption because it can be holding p in a local varsiz := nargsiz = (siz + 7) &^ 7// We could allocate a larger initial stack if necessary.// Not worth it: this is almost always an error.// 4*sizeof(uintreg): extra space added below// sizeof(uintreg): caller's LR (arm) or return address (x86, in gostartcall).if siz >= _StackMin-4*sys.RegSize-sys.RegSize {throw("newproc: function arguments too large for new goroutine")}_p_ := _g_.m.p.ptr() newg := gfget(_p_) // 根据 p 获得一个新的 g// 初始化阶段，gfget 是不可能找到 g 的// 也可能运行中本来就已经耗尽了if newg == nil {newg = malg(_StackMin) // 创建一个拥有 _StackMin 大小的栈的 gcasgstatus(newg, _Gidle, _Gdead) // 将新创建的 g 从 _Gidle 更新为 _Gdead 状态allgadd(newg) // 将 Gdead 状态的 g 添加到 allg，这样 GC 不会扫描未初始化的栈}if newg.stack.hi == 0 {throw("newproc1: newg missing stack")}if readgstatus(newg) != _Gdead {throw("newproc1: new g is not Gdead")}totalSize := 4*sys.RegSize + uintptr(siz) + sys.MinFrameSize // extra space in case of reads slightly beyond frametotalSize += -totalSize & (sys.SpAlign - 1)                  // align to spAlignsp := newg.stack.hi - totalSizespArg := spif usesLR {// caller's LR*(*uintptr)(unsafe.Pointer(sp)) = 0prepGoExitFrame(sp)spArg += sys.MinFrameSize}if narg > 0 {memmove(unsafe.Pointer(spArg), unsafe.Pointer(argp), uintptr(narg))// This is a stack-to-stack copy. If write barriers// are enabled and the source stack is grey (the// destination is always black), then perform a// barrier copy. We do this *after* the memmove// because the destination stack may have garbage on// it.if writeBarrier.needed && !_g_.m.curg.gcscandone {f := findfunc(fn.fn)stkmap := (*stackmap)(funcdata(f, _FUNCDATA_ArgsPointerMaps))if stkmap.nbit > 0 {// We're in the prologue, so it's always stack map index 0.bv := stackmapdata(stkmap, 0)bulkBarrierBitmap(spArg, spArg, uintptr(bv.n)*sys.PtrSize, 0, bv.bytedata)}}}memclrNoHeapPointers(unsafe.Pointer(&newg.sched), unsafe.Sizeof(newg.sched))newg.sched.sp = spnewg.stktopsp = spnewg.sched.pc = funcPC(goexit) + sys.PCQuantum // +PCQuantum so that previous instruction is in same functionnewg.sched.g = guintptr(unsafe.Pointer(newg))gostartcallfn(&newg.sched, fn)newg.gopc = callerpcnewg.ancestors = saveAncestors(callergp)newg.startpc = fn.fnif _g_.m.curg != nil {newg.labels = _g_.m.curg.labels}if isSystemGoroutine(newg, false) {atomic.Xadd(&sched.ngsys, +1)}newg.gcscanvalid = falsecasgstatus(newg, _Gdead, _Grunnable)if _p_.goidcache == _p_.goidcacheend {// Sched.goidgen is the last allocated id,// this batch must be [sched.goidgen+1, sched.goidgen+GoidCacheBatch].// At startup sched.goidgen=0, so main goroutine receives goid=1._p_.goidcache = atomic.Xadd64(&sched.goidgen, _GoidCacheBatch)_p_.goidcache -= _GoidCacheBatch - 1_p_.goidcacheend = _p_.goidcache + _GoidCacheBatch}newg.goid = int64(_p_.goidcache)_p_.goidcache++if raceenabled {newg.racectx = racegostart(callerpc)}if trace.enabled {traceGoCreate(newg, newg.startpc)}runqput(_p_, newg, true)if atomic.Load(&sched.npidle) != 0 && atomic.Load(&sched.nmspinning) == 0 && mainStarted {wakep()}_g_.m.locks--if _g_.m.locks == 0 && _g_.preempt { // restore the preemption request in case we've cleared it in newstack_g_.stackguard0 = stackPreempt}}复制代码

也就是说，刚开始的时候，p上并没有可以使用的g,所以创建了一个具有很少栈容量的g.

// 分配一个新的g，其堆栈足以容纳stacksize字节。func malg(stacksize int32) *g {newg := new(g)if stacksize >= 0 {stacksize = round2(_StackSystem + stacksize)systemstack(func() {newg.stack = stackalloc(uint32(stacksize))})newg.stackguard0 = newg.stack.lo + _StackGuardnewg.stackguard1 = ^uintptr(0)}return newg}复制代码

分配的g是一个结构体指针,如果stacksize大于零，还将分配stack堆栈，该结构体具体内容如下：

type g struct {// Stack parameters.// stack describes the actual stack memory: [stack.lo, stack.hi).// stackguard0 is the stack pointer compared in the Go stack growth prologue.// It is stack.lo+StackGuard normally, but can be StackPreempt to trigger a preemption.// stackguard1 is the stack pointer compared in the C stack growth prologue.// It is stack.lo+StackGuard on g0 and gsignal stacks.// It is ~0 on other goroutine stacks, to trigger a call to morestackc (and crash).stack       stack   // offset known to runtime/cgostackguard0 uintptr // offset known to liblinkstackguard1 uintptr // offset known to liblink_panic         *_panic // innermost panic - offset known to liblink_defer         *_defer // innermost deferm              *m      // current m; offset known to arm liblinksched          gobufsyscallsp      uintptr        // if status==Gsyscall, syscallsp = sched.sp to use during gcsyscallpc      uintptr        // if status==Gsyscall, syscallpc = sched.pc to use during gcstktopsp       uintptr        // expected sp at top of stack, to check in tracebackparam          unsafe.Pointer // passed parameter on wakeupatomicstatus   uint32stackLock      uint32 // sigprof/scang lock; TODO: fold in to atomicstatusgoid           int64schedlink      guintptrwaitsince      int64      // approx time when the g become blockedwaitreason     waitReason // if status==Gwaitingpreempt        bool       // preemption signal, duplicates stackguard0 = stackpreemptpaniconfault   bool       // panic (instead of crash) on unexpected fault addresspreemptscan    bool       // preempted g does scan for gcgcscandone     bool       // g has scanned stack; protected by _Gscan bit in statusgcscanvalid    bool       // false at start of gc cycle, true if G has not run since last scan; TODO: remove?throwsplit     bool       // must not split stackraceignore     int8       // ignore race detection eventssysblocktraced bool       // StartTrace has emitted EvGoInSyscall about this goroutinesysexitticks   int64      // cputicks when syscall has returned (for tracing)traceseq       uint64     // trace event sequencertracelastp     puintptr   // last P emitted an event for this goroutinelockedm        muintptrsig            uint32writebuf       []bytesigcode0       uintptrsigcode1       uintptrsigpc          uintptrgopc           uintptr         // pc of go statement that created this goroutineancestors      *[]ancestorInfo // ancestor information goroutine(s) that created this goroutine (only used if debug.tracebackancestors)startpc        uintptr         // pc of goroutine functionracectx        uintptrwaiting        *sudog         // sudog structures this g is waiting on (that have a valid elem ptr); in lock ordercgoCtxt        []uintptr      // cgo traceback contextlabels         unsafe.Pointer // profiler labelstimer          *timer         // cached timer for time.SleepselectDone     uint32         // are we participating in a select and did someone win the race?// Per-G GC state// gcAssistBytes is this G's GC assist credit in terms of// bytes allocated. If this is positive, then the G has credit// to allocate gcAssistBytes bytes without assisting. If this// is negative, then the G must correct this by performing// scan work. We track this in bytes to make it fast to update// and check for debt in the malloc hot path. The assist ratio// determines how this corresponds to scan work debt.gcAssistBytes int64}复制代码

东西太多，目前能看懂的就是new过g后，分配了一个round2(_StackSystem + stacksize)个字节的stack.

newg.stackguard0 = newg.stack.lo + _StackGuardnewg.stackguard1 = ^uintptr(0)复制代码

然后将新生成的g的状态由_Gidle变成_Gdead。将 Gdead 状态的 g 添加到 allg切片中。

var (allgs    []*gallglock mutex)func allgadd(gp *g) {if readgstatus(gp) == _Gidle {throw("allgadd: bad status Gidle")}lock(&allglock)allgs = append(allgs, gp)allglen = uintptr(len(allgs))unlock(&allglock)}复制代码

之后对g相关的sched字段进行初始化赋值,该字段类型是个结构体，

type gobuf struct {// The offsets of sp, pc, and g are known to (hard-coded in) libmach.//// ctxt is unusual with respect to GC: it may be a// heap-allocated funcval, so GC needs to track it, but it// needs to be set and cleared from assembly, where it's// difficult to have write barriers. However, ctxt is really a// saved, live register, and we only ever exchange it between// the real register and the gobuf. Hence, we treat it as a// root during stack scanning, which means assembly that saves// and restores it doesn't need write barriers. It's still// typed as a pointer so that any other writes from Go get// write barriers.sp   uintptrpc   uintptrg    guintptrctxt unsafe.Pointerret  sys.Uintreglr   uintptrbp   uintptr // for GOEXPERIMENT=framepointer}复制代码

该字段的功能，目前我们不得而知，先看

memclrNoHeapPointers(unsafe.Pointer(&newg.sched), unsafe.Sizeof(newg.sched))newg.sched.sp = spnewg.stktopsp = spnewg.sched.pc = funcPC(goexit) + sys.PCQuantum // +PCQuantum so that previous instruction is in same functionnewg.sched.g = guintptr(unsafe.Pointer(newg))gostartcallfn(&newg.sched, fn)复制代码

调整Gobuf就像执行对fn的调用一样，然后立即执行gosave.

func gostartcallfn(gobuf *gobuf, fv *funcval) {var fn unsafe.Pointerif fv != nil {fn = unsafe.Pointer(fv.fn)} else {fn = unsafe.Pointer(funcPC(nilfunc))}gostartcall(gobuf, fn, unsafe.Pointer(fv))}复制代码

之后有一个将当前g的状态调整的动作

casgstatus(newg, _Gdead, _Grunnable)复制代码

可运行状态的g会被放入到本地的可运行队列中，

runqput(_p_, newg, true)复制代码

该函数体如下：

// runqput尝试将g放置在本地可运行队列中。 // 如果next为false，则runqput将g添加到可运行队列的尾部。// 如果next为true，则runqput将g放在_p_.runnext插槽中。 // 如果运行队列已满，则runnext将g放入全局队列。 // 仅由所有者P执行。func runqput(_p_ *p, gp *g, next bool) {if randomizeScheduler && next && fastrand()%2 == 0 {next = false}if next {retryNext:oldnext := _p_.runnextif !_p_.runnext.cas(oldnext, guintptr(unsafe.Pointer(gp))) {goto retryNext}if oldnext == 0 {return}// Kick the old runnext out to the regular run queue.gp = oldnext.ptr()}retry:h := atomic.LoadAcq(&_p_.runqhead) // load-acquire, synchronize with consumerst := _p_.runqtailif t-h < uint32(len(_p_.runq)) {_p_.runq[t%uint32(len(_p_.runq))].set(gp)atomic.StoreRel(&_p_.runqtail, t+1) // store-release, makes the item available for consumptionreturn}if runqputslow(_p_, gp, h, t) {return}// the queue is not full, now the put above must succeedgoto retry}复制代码

以上，关于g的内容，我们有了一个大致的了解，当我们将创建的g放到本地队列时，提到了一个结构体p,这个东西是什么呢？下面是他的结构体

type p struct {lock mutexid          int32status      uint32 // one of pidle/prunning/...link        puintptrschedtick   uint32     // incremented on every scheduler callsyscalltick uint32     // incremented on every system callsysmontick  sysmontick // last tick observed by sysmonm           muintptr   // back-link to associated m (nil if idle)mcache      *mcacheracectx     uintptrdeferpool    [5][]*_defer // pool of available defer structs of different sizes (see panic.go)deferpoolbuf [5][32]*_defer// Cache of goroutine ids, amortizes accesses to runtime·sched.goidgen.goidcache    uint64goidcacheend uint64// Queue of runnable goroutines. Accessed without lock.// 可运行goroutines的队列，访问无需锁，这个就是我们上述创建的g存放的位置runqhead uint32runqtail uint32runq     [256]guintptr// runnext（如果不是nil）是当前G准备好的可运行G，// 如果正在运行的G的时间片中还有剩余时间，则应下一个运行，而不是从runq中获取G。// 它将继承当前时间片中剩余的时间。// 如果将一组goroutine锁定为通信等待模式，// 则此调度会将其设置为一个单元，// 并消除（可能很大的）调度延迟，// 否则该延迟可能是由于将就绪的goroutine添加到运行队列的末尾而引起的。runnext guintptr// Available G's (status == Gdead)gFree struct {gListn int32}sudogcache []*sudogsudogbuf   [128]*sudogtracebuf traceBufPtr// traceSweep indicates the sweep events should be traced.// This is used to defer the sweep start event until a span// has actually been swept.traceSweep bool// traceSwept and traceReclaimed track the number of bytes// swept and reclaimed by sweeping in the current sweep loop.traceSwept, traceReclaimed uintptrpalloc persistentAlloc // per-P to avoid mutex// Per-P GC stategcAssistTime         int64 // Nanoseconds in assistAllocgcFractionalMarkTime int64 // Nanoseconds in fractional mark workergcBgMarkWorker       guintptrgcMarkWorkerMode     gcMarkWorkerMode// gcMarkWorkerStartTime is the nanotime() at which this mark// worker started.gcMarkWorkerStartTime int64// gcw is this P's GC work buffer cache. The work buffer is// filled by write barriers, drained by mutator assists, and// disposed on certain GC state transitions.gcw gcWork// wbBuf is this P's GC write barrier buffer.//// TODO: Consider caching this in the running G.wbBuf wbBufrunSafePointFn uint32 // if 1, run sched.safePointFn at next safe pointpad cpu.CacheLinePad}复制代码

在newproc函数中，从当前g获取p结构时，通过的是g的m字段，该字段是个什么呢？是个m结构体指针，m的结构体原型为：

type m struct {g0      *g     // 用于执行调度指令的 goroutinemorebuf gobuf  // gobuf arg to morestackdivmod  uint32 // div/mod denominator for arm - known to liblink// Fields not known to debuggers.procid        uint64       // for debuggers, but offset not hard-codedgsignal       *g           // 处理 signal 的 ggoSigStack    gsignalStack // Go-allocated signal handling stacksigmask       sigset       // storage for saved signal masktls           [6]uintptr   // 线程本地存储mstartfn      func()curg          *g       // 当前运行的Gcaughtsig     guintptr // goroutine running during fatal signalp             puintptr // 执行 go 代码时持有的 p (如果没有执行则为 nil)nextp         puintptroldp          puintptr // the p that was attached before executing a syscallid            int64mallocing     int32throwing      int32preemptoff    string // if != "", keep curg running on this mlocks         int32dying         int32profilehz     int32spinning      bool // m 当前没有运行 work 且正处于寻找 work 的活跃状态blocked       bool // m is blocked on a noteinwb          bool // m is executing a write barriernewSigstack   bool // minit on C thread called sigaltstackprintlock     int8incgo         bool   // m is executing a cgo callfreeWait      uint32 // if == 0, safe to free g0 and delete m (atomic)fastrand      [2]uint32needextram    booltraceback     uint8ncgocall      uint64      // number of cgo calls in totalncgo          int32       // number of cgo calls currently in progresscgoCallersUse uint32      // if non-zero, cgoCallers in use temporarilycgoCallers    *cgoCallers // cgo traceback if crashing in cgo callpark          notealllink       *m // on allmschedlink     muintptrmcache        *mcachelockedg       guintptrcreatestack   [32]uintptr    // stack that created this thread.lockedExt     uint32         // tracking for external LockOSThreadlockedInt     uint32         // tracking for internal lockOSThreadnextwaitm     muintptr       // next m waiting for lockwaitunlockf   unsafe.Pointer // todo go func(*g, unsafe.pointer) boolwaitlock      unsafe.Pointerwaittraceev   bytewaittraceskip intstartingtrace boolsyscalltick   uint32thread        uintptr // thread handlefreelink      *m      // on sched.freem// these are here because they are too large to be on the stack// of low-level NOSPLIT functions.libcall   libcalllibcallpc uintptr // for cpu profilerlibcallsp uintptrlibcallg  guintptrsyscall   libcall // stores syscall parameters on windowsvdsoSP uintptr // SP for traceback while in VDSO call (0 if not in call)vdsoPC uintptr // PC for traceback while in VDSO callmOS}复制代码

看了上面的结构体感觉很空洞，都是些什么呢？就知道newproc时，创建的G,放到了关联的P的本地可运行队列中，要明白这些东西是什么，就要从他们是如何产生的说起？

➜  goroutinetest gdb mainGNU gdb (GDB) 8.3Copyright (C) 2019 Free Software Foundation, Inc.License GPLv3+: GNU GPL version 3 or later <http://gnu.org/licenses/gpl.html>This is free software: you are free to change and redistribute it.There is NO WARRANTY, to the extent permitted by law.Type "show copying" and "show warranty" for details.This GDB was configured as "x86_64-apple-darwin16.7.0".Type "show configuration" for configuration details.For bug reporting instructions, please see:<http://www.gnu.org/software/gdb/bugs/>.Find the GDB manual and other documentation resources online at:    <http://www.gnu.org/software/gdb/documentation/>.For help, type "help".Type "apropos word" to search for commands related to "word"...Reading symbols from main...(No debugging symbols found in main)Loading Go Runtime support.(gdb) info filesSymbols from "/Users/zhaojunwei/workspace/src/just.for.test/goroutinetest/main".Local exec file:`/Users/zhaojunwei/workspace/src/just.for.test/goroutinetest/main', file type mach-o-x86-64.Entry point: 0x10527700x0000000001001000 - 0x0000000001093194 is .text0x00000000010931a0 - 0x00000000010e1ace is __TEXT.__rodata0x00000000010e1ae0 - 0x00000000010e1be2 is __TEXT.__symbol_stub10x00000000010e1c00 - 0x00000000010e2864 is __TEXT.__typelink0x00000000010e2868 - 0x00000000010e28d0 is __TEXT.__itablink0x00000000010e28d0 - 0x00000000010e28d0 is __TEXT.__gosymtab0x00000000010e28e0 - 0x000000000115c108 is __TEXT.__gopclntab0x000000000115d000 - 0x000000000115d158 is __DATA.__nl_symbol_ptr0x000000000115d160 - 0x0000000001169c9c is __DATA.__noptrdata0x0000000001169ca0 - 0x0000000001170610 is .data0x0000000001170620 - 0x000000000118be50 is .bss0x000000000118be60 - 0x000000000118e418 is __DATA.__noptrbss(gdb)(gdb) b *0x1052770Breakpoint 1 at 0x1052770(gdb) info brNum     Type           Disp Enb Address            What1       breakpoint     keep y   0x0000000001052770 <_rt0_amd64_darwin>(gdb)复制代码

查看一下_rt0_amd64_darwin是什么？

#include "textflag.h"TEXT _rt0_amd64_darwin(SB),NOSPLIT,$-8JMP_rt0_amd64(SB)// When linking with -shared, this symbol is called when the shared library// is loaded.TEXT _rt0_amd64_darwin_lib(SB),NOSPLIT,$0JMP_rt0_amd64_lib(SB)复制代码

_rt0_amd64是使用内部链接时大多数amd64系统的通用启动代码。这是内核中普通-buildmode = exe程序的程序入口点。堆栈保存参数数量和C风格的argv。

TEXT _rt0_amd64(SB),NOSPLIT,$-8MOVQ0(SP), DI// argcLEAQ8(SP), SI// argvJMPruntime·rt0_go(SB)复制代码

最终调用的是runtime.rt0_go方法

TEXT runtime·rt0_go(SB),NOSPLIT,$0// SP = stack; R0 = argc; R1 = argvSUB$32, RSPMOVWR0, 8(RSP) // argcMOVDR1, 16(RSP) // argv// create istack out of the given (operating system) stack.// _cgo_init may update stackguard.MOVD$runtime·g0(SB), gMOVDRSP, R7MOVD$(-64*1024)(R7), R0MOVDR0, g_stackguard0(g)MOVDR0, g_stackguard1(g)MOVDR0, (g_stack+stack_lo)(g)MOVDR7, (g_stack+stack_hi)(g)// if there is a _cgo_init, call it using the gcc ABI.MOVD_cgo_init(SB), R12CMP$0, R12BEQnocgoMRS_TPIDR_R0// load TLS base pointerMOVDR0, R3// arg 3: TLS base pointer#ifdef TLSG_IS_VARIABLEMOVD$runtime·tls_g(SB), R2 // arg 2: &tls_g#elseMOVD$0, R2        // arg 2: not used when using platform's TLS#endifMOVD$setg_gcc<>(SB), R1// arg 1: setgMOVDg, R0// arg 0: GSUB$16, RSP// reserve 16 bytes for sp-8 where fp may be saved.BL(R12)ADD$16, RSPnocgo:BLruntime·save_g(SB)// update stackguard after _cgo_initMOVD(g_stack+stack_lo)(g), R0ADD$const__StackGuard, R0MOVDR0, g_stackguard0(g)MOVDR0, g_stackguard1(g)// set the per-goroutine and per-mach "registers"MOVD$runtime·m0(SB), R0// save m->g0 = g0MOVDg, m_g0(R0)// save m0 to g0->mMOVDR0, g_m(g)BLruntime·check(SB)MOVW8(RSP), R0// copy argcMOVWR0, -8(RSP)MOVD16(RSP), R0// copy argvMOVDR0, 0(RSP)BLruntime·args(SB)BLruntime·osinit(SB)BLruntime·schedinit(SB)// create a new goroutine to start programMOVD$runtime·mainPC(SB), R0// entryMOVDRSP, R7MOVD.W$0, -8(R7)MOVD.WR0, -8(R7)MOVD.W$0, -8(R7)MOVD.W$0, -8(R7)MOVDR7, RSPBLruntime·newproc(SB)ADD$32, RSP// start this MBLruntime·mstart(SB)MOVD$0, R0MOVDR0, (R0)// boomUNDEF复制代码

首先进行g0和m0的初始化，之后进行本地线程存储的检测设置。之后尽心调度器的初始化，并创建一个新的goroutine运行程序，最后开启我们的M.

// The bootstrap sequence is:////call osinit//call schedinit//make & queue new G//call runtime·mstart//// The new G calls runtime·main.func schedinit() {// raceinit must be the first call to race detector.// In particular, it must be done before mallocinit below calls racemapshadow._g_ := getg()if raceenabled {_g_.racectx, raceprocctx0 = raceinit()}// 设置最多启动10000个操作系统线程，也是最多10000个Msched.maxmcount = 10000tracebackinit()moduledataverify()stackinit()mallocinit()mcommoninit(_g_.m) // 初始化m0，因为从前面的代码我们知道g0->m = &m0cpuinit()       // must run before alginitalginit()       // maps must not be used before this callmodulesinit()   // provides activeModulestypelinksinit() // uses maps, activeModulesitabsinit()     // uses activeModulesmsigsave(_g_.m)initSigmask = _g_.m.sigmaskgoargs()goenvs()parsedebugvars()gcinit()sched.lastpoll = uint64(nanotime())// 系统中有多少核，就创建和初始化多少个p结构体对象procs := ncpuif n, ok := atoi32(gogetenv("GOMAXPROCS")); ok && n > 0 {    // 如果环境变量指定了GOMAXPROCS，则创建指定数量的pprocs = n}// 创建和初始化全局变量allpif procresize(procs) != nil {throw("unknown runnable goroutine during bootstrap")}// For cgocheck > 1, we turn on the write barrier at all times// and check all pointer writes. We can't do this until after// procresize because the write barrier needs a P.if debug.cgocheck > 1 {writeBarrier.cgo = truewriteBarrier.enabled = truefor _, p := range allp {p.wbBuf.reset()}}if buildVersion == "" {// Condition should never trigger. This code just serves// to ensure runtime·buildVersion is kept in the resulting binary.buildVersion = "unknown"}}复制代码

我们来关注一下m0是如何初始化的

func mcommoninit(mp *m) {_g_ := getg()// g0 stack won't make sense for user (and is not necessary unwindable).if _g_ != _g_.m.g0 {callers(1, mp.createstack[:])}lock(&sched.lock)if sched.mnext+1 < sched.mnext {throw("runtime: thread ID overflow")}// m0分配的id,schedt结构体的mnext字段标识下一个可用的thread id.mp.id = sched.mnextsched.mnext++checkmcount()mp.fastrand[0] = 1597334677 * uint32(mp.id)mp.fastrand[1] = uint32(cputicks())if mp.fastrand[0]|mp.fastrand[1] == 0 {mp.fastrand[1] = 1}mpreinit(mp)if mp.gsignal != nil {mp.gsignal.stackguard1 = mp.gsignal.stack.lo + _StackGuard}// Add to allm so garbage collector doesn't free g->m// when it is just in a register or thread-local storage.// allm挂到这里，防止被垃圾回收mp.alllink = allm// NumCgoCall() iterates over allm w/o schedlock,// so we need to publish it safely.atomicstorep(unsafe.Pointer(&allm), unsafe.Pointer(mp))unlock(&sched.lock)// Allocate memory to hold a cgo traceback if the cgo call crashes.if iscgo || GOOS == "solaris" || GOOS == "windows" {mp.cgoCallers = new(cgoCallers)}}复制代码

调度器初始化最后一部分工作就是p的初始化

初始化调度后，开启新的goroutine运行我们的主程序，然后调用runtime.mstart开启M.

func mstart() {_g_ := getg()    // 通过检查 g 执行占的边界来确定是否为系统栈osStack := _g_.stack.lo == 0if osStack {// Initialize stack bounds from system stack.// Cgo may have left stack size in stack.hi.// minit may update the stack bounds.size := _g_.stack.hiif size == 0 {size = 8192 * sys.StackGuardMultiplier}_g_.stack.hi = uintptr(noescape(unsafe.Pointer(&size)))_g_.stack.lo = _g_.stack.hi - size + 1024}// Initialize stack guards so that we can start calling// both Go and C functions with stack growth prologues._g_.stackguard0 = _g_.stack.lo + _StackGuard_g_.stackguard1 = _g_.stackguard0// 启动mmstart1()// Exit this thread.if GOOS == "windows" || GOOS == "solaris" || GOOS == "plan9" || GOOS == "darwin" || GOOS == "aix" {// Window, Solaris, Darwin, AIX and Plan 9 always system-allocate// the stack, but put it in _g_.stack before mstart,// so the logic above hasn't set osStack yet.osStack = true}mexit(osStack)}func mstart1() {_g_ := getg()if _g_ != _g_.m.g0 {throw("bad runtime·mstart")}// Record the caller for use as the top of stack in mcall and// for terminating the thread.// We're never coming back to mstart1 after we call schedule,// so other calls can reuse the current frame.save(getcallerpc(), getcallersp())asminit()minit()// Install signal handlers; after minit so that minit can// prepare the thread to be able to handle the signals.if _g_.m == &m0 {mstartm0()}if fn := _g_.m.mstartfn; fn != nil {fn()}    // 如果当前 m 并非 m0，则要求绑定 pif _g_.m != &m0 {acquirep(_g_.m.nextp.ptr())_g_.m.nextp = 0}schedule()}复制代码

在mstart1中，调用了schedule函数：一轮调度程序：找到一个可运行的goroutine并执行它。永不return.

func schedule() {_g_ := getg()if _g_.m.locks != 0 {throw("schedule: holding locks")}if _g_.m.lockedg != 0 {stoplockedm()execute(_g_.m.lockedg.ptr(), false) // Never returns.}// We should not schedule away from a g that is executing a cgo call,// since the cgo call is using the m's g0 stack.if _g_.m.incgo {throw("schedule: in cgo")}top:if sched.gcwaiting != 0 {gcstopm()goto top}if _g_.m.p.ptr().runSafePointFn != 0 {runSafePointFn()}var gp *gvar inheritTime boolif trace.enabled || trace.shutdown {gp = traceReader()if gp != nil {casgstatus(gp, _Gwaiting, _Grunnable)traceGoUnpark(gp, 0)}}if gp == nil && gcBlackenEnabled != 0 {gp = gcController.findRunnableGCWorker(_g_.m.p.ptr())}if gp == nil {// // 说明不在 GC//// 每调度 61 次，就检查一次全局队列，保证公平性// 否则两个 goroutine 可以通过互相 respawn 一直占领本地的 runqueueif _g_.m.p.ptr().schedtick%61 == 0 && sched.runqsize > 0 {lock(&sched.lock)// 从全局队列中偷 ggp = globrunqget(_g_.m.p.ptr(), 1)unlock(&sched.lock)}}if gp == nil {gp, inheritTime = runqget(_g_.m.p.ptr())if gp != nil && _g_.m.spinning {throw("schedule: spinning with local work")}}if gp == nil {gp, inheritTime = findrunnable() // 如果偷都偷不到，则休眠，在此阻塞}// 该线程将运行goroutine，并且不再自旋，// 因此，如果将其标记为正在自旋，则需要立即将其重置并可能启动新自旋的M。if _g_.m.spinning {resetspinning()}if sched.disable.user && !schedEnabled(gp) {// Scheduling of this goroutine is disabled. Put it on// the list of pending runnable goroutines for when we// re-enable user scheduling and look again.lock(&sched.lock)if schedEnabled(gp) {// Something re-enabled scheduling while we// were acquiring the lock.unlock(&sched.lock)} else {sched.disable.runnable.pushBack(gp)sched.disable.n++unlock(&sched.lock)goto top}}if gp.lockedm != 0 {// Hands off own p to the locked m,// then blocks waiting for a new p.startlockedm(gp)goto top}    // 开始执行execute(gp, inheritTime)}复制代码

如果m处在自旋的状态，那么将调用resetspinning方法，

func resetspinning() {_g_ := getg()if !_g_.m.spinning {throw("resetspinning: not a spinning m")}_g_.m.spinning = falsenmspinning := atomic.Xadd(&sched.nmspinning, -1)if int32(nmspinning) < 0 {throw("findrunnable: negative nmspinning")}// M的唤醒策略故意有些保守，因此请检查是否需要在此处唤醒另一个P。// 有关详细信息，请参见文件顶部的“工作线程park/unpark”注释。if nmspinning == 0 && atomic.Load(&sched.npidle) > 0 {wakep()}}复制代码

wakep()尝试再添加一个P以执行G。当G变为可运行时调用（newproc，就绪）.该函数会调用startm(nil, true).startm函数调度一些M以运行p（必要时创建M）。如果p == nil，则尝试获取一个空闲P，如果没有空闲P则不执行任何操作。可以与m.p == nil一起运行，因此不允许写障碍。如果设置了旋转，则调用者已增加nmspinning，并且startm将减少nmspinning或在新启动的M中设置m.spinning。

本系列文章：

有任何问题，欢迎留言

参考文献：

智云一二三科技

我可能并不会使用golang goroutine

关于作者: 智云科技

给这篇文章的作者打赏

关于作者: 智云科技

相关文章

Linux性能及调优指南之Linux进程管理

详解SpringIOC容器的基本配置

Goland配置GOROOT无法识别已安装的go

热门文章

1分享新浪图床上传接口源码

2PHP简单实现路由Route功能

3Tideways、xhprof 和 xhgui 打造 PHP 非侵入式监控平台

4centos系统如何查看是否安装了mysql

5curl 工具简述