// Copyright 2013 The Go Authors. All rights reserved.// Use of this source code is governed by a BSD-style// license that can be found in the LICENSE file.// +build aix darwin dragonfly freebsd js,wasm linux netbsd openbsd solaris windowspackage runtimeimport ()// Integrated network poller (platform-independent part).// A particular implementation (epoll/kqueue/port/AIX/Windows)// must define the following functions://// func netpollinit()// Initialize the poller. Only called once.//// func netpollopen(fd uintptr, pd *pollDesc) int32// Arm edge-triggered notifications for fd. The pd argument is to pass// back to netpollready when fd is ready. Return an errno value.//// func netpoll(delta int64) gList// Poll the network. If delta < 0, block indefinitely. If delta == 0,// poll without blocking. If delta > 0, block for up to delta nanoseconds.// Return a list of goroutines built by calling netpollready.//// func netpollBreak()// Wake up the network poller, assumed to be blocked in netpoll.//// func netpollIsPollDescriptor(fd uintptr) bool// Reports whether fd is a file descriptor used by the poller.// Error codes returned by runtime_pollReset and runtime_pollWait.// These must match the values in internal/poll/fd_poll_runtime.go.const (pollNoError = 0// no errorpollErrClosing = 1// descriptor is closedpollErrTimeout = 2// I/O timeoutpollErrNotPollable = 3// general error polling descriptor)// pollDesc contains 2 binary semaphores, rg and wg, to park reader and writer// goroutines respectively. The semaphore can be in the following states:// pdReady - io readiness notification is pending;// a goroutine consumes the notification by changing the state to nil.// pdWait - a goroutine prepares to park on the semaphore, but not yet parked;// the goroutine commits to park by changing the state to G pointer,// or, alternatively, concurrent io notification changes the state to pdReady,// or, alternatively, concurrent timeout/close changes the state to nil.// G pointer - the goroutine is blocked on the semaphore;// io notification or timeout/close changes the state to pdReady or nil respectively// and unparks the goroutine.// nil - none of the above.const (pdReadyuintptr = 1pdWaituintptr = 2)constpollBlockSize = 4 * 1024// Network poller descriptor.//// No heap pointers.////go:notinheaptypepollDescstruct { link *pollDesc// in pollcache, protected by pollcache.lock// The lock protects pollOpen, pollSetDeadline, pollUnblock and deadlineimpl operations. // This fully covers seq, rt and wt variables. fd is constant throughout the PollDesc lifetime. // pollReset, pollWait, pollWaitCanceled and runtime·netpollready (IO readiness notification) // proceed w/o taking the lock. So closing, everr, rg, rd, wg and wd are manipulated // in a lock-free way by all operations. // NOTE(dvyukov): the following code uses uintptr to store *g (rg/wg), // that will blow up when GC starts moving objects. lock mutex// protects the following fields fd uintptr closing bool everr bool// marks event scanning error happened user uint32// user settable cookie rseq uintptr// protects from stale read timers rg uintptr// pdReady, pdWait, G waiting for read or nil rt timer// read deadline timer (set if rt.f != nil) rd int64// read deadline wseq uintptr// protects from stale write timers wg uintptr// pdReady, pdWait, G waiting for write or nil wt timer// write deadline timer wd int64// write deadline self *pollDesc// storage for indirect interface. See (*pollDesc).makeArg.}typepollCachestruct { lock mutex first *pollDesc// PollDesc objects must be type-stable, // because we can get ready notification from epoll/kqueue // after the descriptor is closed/reused. // Stale notifications are detected using seq variable, // seq is incremented when deadlines are changed or descriptor is reused.}var (netpollInitLockmutexnetpollIniteduint32pollcachepollCachenetpollWaitersuint32)//go:linkname poll_runtime_pollServerInit internal/poll.runtime_pollServerInitfunc () {netpollGenericInit()}func () {ifatomic.Load(&netpollInited) == 0 {lockInit(&netpollInitLock, lockRankNetpollInit)lock(&netpollInitLock)ifnetpollInited == 0 {netpollinit()atomic.Store(&netpollInited, 1) }unlock(&netpollInitLock) }}func () bool {returnatomic.Load(&netpollInited) != 0}//go:linkname poll_runtime_isPollServerDescriptor internal/poll.runtime_isPollServerDescriptor// poll_runtime_isPollServerDescriptor reports whether fd is a// descriptor being used by netpoll.func ( uintptr) bool {returnnetpollIsPollDescriptor()}//go:linkname poll_runtime_pollOpen internal/poll.runtime_pollOpenfunc ( uintptr) (*pollDesc, int) { := pollcache.alloc()lock(&.lock)if .wg != 0 && .wg != pdReady {throw("runtime: blocked write on free polldesc") }if .rg != 0 && .rg != pdReady {throw("runtime: blocked read on free polldesc") } .fd = .closing = false .everr = false .rseq++ .rg = 0 .rd = 0 .wseq++ .wg = 0 .wd = 0 .self = unlock(&.lock)varint32 = netpollopen(, )return , int()}//go:linkname poll_runtime_pollClose internal/poll.runtime_pollClosefunc ( *pollDesc) {if !.closing {throw("runtime: close polldesc w/o unblock") }if .wg != 0 && .wg != pdReady {throw("runtime: blocked write on closing polldesc") }if .rg != 0 && .rg != pdReady {throw("runtime: blocked read on closing polldesc") }netpollclose(.fd)pollcache.free()}func ( *pollCache) ( *pollDesc) {lock(&.lock) .link = .first .first = unlock(&.lock)}// poll_runtime_pollReset, which is internal/poll.runtime_pollReset,// prepares a descriptor for polling in mode, which is 'r' or 'w'.// This returns an error code; the codes are defined above.//go:linkname poll_runtime_pollReset internal/poll.runtime_pollResetfunc ( *pollDesc, int) int { := netpollcheckerr(, int32())if != pollNoError {return }if == 'r' { .rg = 0 } elseif == 'w' { .wg = 0 }returnpollNoError}// poll_runtime_pollWait, which is internal/poll.runtime_pollWait,// waits for a descriptor to be ready for reading or writing,// according to mode, which is 'r' or 'w'.// This returns an error code; the codes are defined above.//go:linkname poll_runtime_pollWait internal/poll.runtime_pollWaitfunc ( *pollDesc, int) int { := netpollcheckerr(, int32())if != pollNoError {return }// As for now only Solaris, illumos, and AIX use level-triggered IO.ifGOOS == "solaris" || GOOS == "illumos" || GOOS == "aix" {netpollarm(, ) }for !netpollblock(, int32(), false) { = netpollcheckerr(, int32())if != pollNoError {return }// Can happen if timeout has fired and unblocked us, // but before we had a chance to run, timeout has been reset. // Pretend it has not happened and retry. }returnpollNoError}//go:linkname poll_runtime_pollWaitCanceled internal/poll.runtime_pollWaitCanceledfunc ( *pollDesc, int) {// This function is used only on windows after a failed attempt to cancel // a pending async IO operation. Wait for ioready, ignore closing or timeouts.for !netpollblock(, int32(), true) { }}//go:linkname poll_runtime_pollSetDeadline internal/poll.runtime_pollSetDeadlinefunc ( *pollDesc, int64, int) {lock(&.lock)if .closing {unlock(&.lock)return } , := .rd, .wd := > 0 && == if > 0 { += nanotime()if <= 0 {// If the user has a deadline in the future, but the delay calculation // overflows, then set the deadline to the maximum possible value. = 1<<63 - 1 } }if == 'r' || == 'r'+'w' { .rd = }if == 'w' || == 'r'+'w' { .wd = } := .rd > 0 && .rd == .wd := netpollReadDeadlineif { = netpollDeadline }if .rt.f == nil {if .rd > 0 { .rt.f = // Copy current seq into the timer arg. // Timer func will check the seq against current descriptor seq, // if they differ the descriptor was reused or timers were reset. .rt.arg = .makeArg() .rt.seq = .rseqresettimer(&.rt, .rd) } } elseif .rd != || != { .rseq++ // invalidate current timersif .rd > 0 {modtimer(&.rt, .rd, 0, , .makeArg(), .rseq) } else {deltimer(&.rt) .rt.f = nil } }if .wt.f == nil {if .wd > 0 && ! { .wt.f = netpollWriteDeadline .wt.arg = .makeArg() .wt.seq = .wseqresettimer(&.wt, .wd) } } elseif .wd != || != { .wseq++ // invalidate current timersif .wd > 0 && ! {modtimer(&.wt, .wd, 0, netpollWriteDeadline, .makeArg(), .wseq) } else {deltimer(&.wt) .wt.f = nil } }// If we set the new deadline in the past, unblock currently pending IO if any.var , *gif .rd < 0 || .wd < 0 {atomic.StorepNoWB(noescape(unsafe.Pointer(&)), nil) // full memory barrier between stores to rd/wd and load of rg/wg in netpollunblockif .rd < 0 { = netpollunblock(, 'r', false) }if .wd < 0 { = netpollunblock(, 'w', false) } }unlock(&.lock)if != nil {netpollgoready(, 3) }if != nil {netpollgoready(, 3) }}//go:linkname poll_runtime_pollUnblock internal/poll.runtime_pollUnblockfunc ( *pollDesc) {lock(&.lock)if .closing {throw("runtime: unblock on closing polldesc") } .closing = true .rseq++ .wseq++var , *gatomic.StorepNoWB(noescape(unsafe.Pointer(&)), nil) // full memory barrier between store to closing and read of rg/wg in netpollunblock = netpollunblock(, 'r', false) = netpollunblock(, 'w', false)if .rt.f != nil {deltimer(&.rt) .rt.f = nil }if .wt.f != nil {deltimer(&.wt) .wt.f = nil }unlock(&.lock)if != nil {netpollgoready(, 3) }if != nil {netpollgoready(, 3) }}// netpollready is called by the platform-specific netpoll function.// It declares that the fd associated with pd is ready for I/O.// The toRun argument is used to build a list of goroutines to return// from netpoll. The mode argument is 'r', 'w', or 'r'+'w' to indicate// whether the fd is ready for reading or writing or both.//// This may run while the world is stopped, so write barriers are not allowed.//go:nowritebarrierfunc ( *gList, *pollDesc, int32) {var , *gif == 'r' || == 'r'+'w' { = netpollunblock(, 'r', true) }if == 'w' || == 'r'+'w' { = netpollunblock(, 'w', true) }if != nil { .push() }if != nil { .push() }}func ( *pollDesc, int32) int {if .closing {returnpollErrClosing }if ( == 'r' && .rd < 0) || ( == 'w' && .wd < 0) {returnpollErrTimeout }// Report an event scanning error only on a read event. // An error on a write event will be captured in a subsequent // write call that is able to report a more specific error.if == 'r' && .everr {returnpollErrNotPollable }returnpollNoError}func ( *g, unsafe.Pointer) bool { := atomic.Casuintptr((*uintptr)(), pdWait, uintptr(unsafe.Pointer()))if {// Bump the count of goroutines waiting for the poller. // The scheduler uses this to decide whether to block // waiting for the poller if there is nothing else to do.atomic.Xadd(&netpollWaiters, 1) }return}func ( *g, int) {atomic.Xadd(&netpollWaiters, -1)goready(, +1)}// returns true if IO is ready, or false if timedout or closed// waitio - wait only for completed IO, ignore errorsfunc ( *pollDesc, int32, bool) bool { := &.rgif == 'w' { = &.wg }// set the gpp semaphore to pdWaitfor { := *if == pdReady { * = 0returntrue }if != 0 {throw("runtime: double wait") }ifatomic.Casuintptr(, 0, pdWait) {break } }// need to recheck error states after setting gpp to pdWait // this is necessary because runtime_pollUnblock/runtime_pollSetDeadline/deadlineimpl // do the opposite: store to closing/rd/wd, membarrier, load of rg/wgif || netpollcheckerr(, ) == 0 {gopark(netpollblockcommit, unsafe.Pointer(), waitReasonIOWait, traceEvGoBlockNet, 5) }// be careful to not lose concurrent pdReady notification := atomic.Xchguintptr(, 0)if > pdWait {throw("runtime: corrupted polldesc") }return == pdReady}func ( *pollDesc, int32, bool) *g { := &.rgif == 'w' { = &.wg }for { := *if == pdReady {returnnil }if == 0 && ! {// Only set pdReady for ioready. runtime_pollWait // will check for timeout/cancel before waiting.returnnil }varuintptrif { = pdReady }ifatomic.Casuintptr(, , ) {if == pdWait { = 0 }return (*g)(unsafe.Pointer()) } }}func ( *pollDesc, uintptr, , bool) {lock(&.lock)// Seq arg is seq when the timer was set. // If it's stale, ignore the timer event. := .rseqif ! { = .wseq }if != {// The descriptor was reused or timers were reset.unlock(&.lock)return }var *gif {if .rd <= 0 || .rt.f == nil {throw("runtime: inconsistent read deadline") } .rd = -1atomic.StorepNoWB(unsafe.Pointer(&.rt.f), nil) // full memory barrier between store to rd and load of rg in netpollunblock = netpollunblock(, 'r', false) }var *gif {if .wd <= 0 || .wt.f == nil && ! {throw("runtime: inconsistent write deadline") } .wd = -1atomic.StorepNoWB(unsafe.Pointer(&.wt.f), nil) // full memory barrier between store to wd and load of wg in netpollunblock = netpollunblock(, 'w', false) }unlock(&.lock)if != nil {netpollgoready(, 0) }if != nil {netpollgoready(, 0) }}func ( interface{}, uintptr) {netpolldeadlineimpl(.(*pollDesc), , true, true)}func ( interface{}, uintptr) {netpolldeadlineimpl(.(*pollDesc), , true, false)}func ( interface{}, uintptr) {netpolldeadlineimpl(.(*pollDesc), , false, true)}func ( *pollCache) () *pollDesc {lock(&.lock)if .first == nil {const = unsafe.Sizeof(pollDesc{}) := pollBlockSize / if == 0 { = 1 }// Must be in non-GC memory because can be referenced // only from epoll/kqueue internals. := persistentalloc(*, 0, &memstats.other_sys)for := uintptr(0); < ; ++ { := (*pollDesc)(add(, *)) .link = .first .first = } } := .first .first = .linklockInit(&.lock, lockRankPollDesc)unlock(&.lock)return}// makeArg converts pd to an interface{}.// makeArg does not do any allocation. Normally, such// a conversion requires an allocation because pointers to// go:notinheap types (which pollDesc is) must be stored// in interfaces indirectly. See issue 42076.func ( *pollDesc) () ( interface{}) { := (*eface)(unsafe.Pointer(&)) ._type = pdType .data = unsafe.Pointer(&.self)return}var (pdEfaceinterface{} = (*pollDesc)(nil)pdType *_type = efaceOf(&pdEface)._type)