// Copyright 2013 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.

//go:build unix || (js && wasm) || wasip1 || windows

package runtime

import (
	
	
	
)

// Integrated network poller (platform-independent part).
// A particular implementation (epoll/kqueue/port/AIX/Windows)
// must define the following functions:
//
// func netpollinit()
//     Initialize the poller. Only called once.
//
// func netpollopen(fd uintptr, pd *pollDesc) int32
//     Arm edge-triggered notifications for fd. The pd argument is to pass
//     back to netpollready when fd is ready. Return an errno value.
//
// func netpollclose(fd uintptr) int32
//     Disable notifications for fd. Return an errno value.
//
// func netpoll(delta int64) (gList, int32)
//     Poll the network. If delta < 0, block indefinitely. If delta == 0,
//     poll without blocking. If delta > 0, block for up to delta nanoseconds.
//     Return a list of goroutines built by calling netpollready,
//     and a delta to add to netpollWaiters when all goroutines are ready.
//     This will never return an empty list with a non-zero delta.
//
// func netpollBreak()
//     Wake up the network poller, assumed to be blocked in netpoll.
//
// func netpollIsPollDescriptor(fd uintptr) bool
//     Reports whether fd is a file descriptor used by the poller.

// Error codes returned by runtime_pollReset and runtime_pollWait.
// These must match the values in internal/poll/fd_poll_runtime.go.
const (
	pollNoError        = 0 // no error
	pollErrClosing     = 1 // descriptor is closed
	pollErrTimeout     = 2 // I/O timeout
	pollErrNotPollable = 3 // general error polling descriptor
)

// pollDesc contains 2 binary semaphores, rg and wg, to park reader and writer
// goroutines respectively. The semaphore can be in the following states:
//
//	pdReady - io readiness notification is pending;
//	          a goroutine consumes the notification by changing the state to pdNil.
//	pdWait - a goroutine prepares to park on the semaphore, but not yet parked;
//	         the goroutine commits to park by changing the state to G pointer,
//	         or, alternatively, concurrent io notification changes the state to pdReady,
//	         or, alternatively, concurrent timeout/close changes the state to pdNil.
//	G pointer - the goroutine is blocked on the semaphore;
//	            io notification or timeout/close changes the state to pdReady or pdNil respectively
//	            and unparks the goroutine.
//	pdNil - none of the above.
const (
	pdNil   uintptr = 0
	pdReady uintptr = 1
	pdWait  uintptr = 2
)

const pollBlockSize = 4 * 1024

// Network poller descriptor.
//
// No heap pointers.
type pollDesc struct {
	_     sys.NotInHeap
	link  *pollDesc      // in pollcache, protected by pollcache.lock
	fd    uintptr        // constant for pollDesc usage lifetime
	fdseq atomic.Uintptr // protects against stale pollDesc

	// atomicInfo holds bits from closing, rd, and wd,
	// which are only ever written while holding the lock,
	// summarized for use by netpollcheckerr,
	// which cannot acquire the lock.
	// After writing these fields under lock in a way that
	// might change the summary, code must call publishInfo
	// before releasing the lock.
	// Code that changes fields and then calls netpollunblock
	// (while still holding the lock) must call publishInfo
	// before calling netpollunblock, because publishInfo is what
	// stops netpollblock from blocking anew
	// (by changing the result of netpollcheckerr).
	// atomicInfo also holds the eventErr bit,
	// recording whether a poll event on the fd got an error;
	// atomicInfo is the only source of truth for that bit.
	atomicInfo atomic.Uint32 // atomic pollInfo

	// rg, wg are accessed atomically and hold g pointers.
	// (Using atomic.Uintptr here is similar to using guintptr elsewhere.)
	rg atomic.Uintptr // pdReady, pdWait, G waiting for read or pdNil
	wg atomic.Uintptr // pdReady, pdWait, G waiting for write or pdNil

	lock    mutex // protects the following fields
	closing bool
	rrun    bool      // whether rt is running
	wrun    bool      // whether wt is running
	user    uint32    // user settable cookie
	rseq    uintptr   // protects from stale read timers
	rt      timer     // read deadline timer
	rd      int64     // read deadline (a nanotime in the future, -1 when expired)
	wseq    uintptr   // protects from stale write timers
	wt      timer     // write deadline timer
	wd      int64     // write deadline (a nanotime in the future, -1 when expired)
	self    *pollDesc // storage for indirect interface. See (*pollDesc).makeArg.
}

// pollInfo is the bits needed by netpollcheckerr, stored atomically,
// mostly duplicating state that is manipulated under lock in pollDesc.
// The one exception is the pollEventErr bit, which is maintained only
// in the pollInfo.
type pollInfo uint32

const (
	pollClosing = 1 << iota
	pollEventErr
	pollExpiredReadDeadline
	pollExpiredWriteDeadline
	pollFDSeq // 20 bit field, low 20 bits of fdseq field
)

const (
	pollFDSeqBits = 20                   // number of bits in pollFDSeq
	pollFDSeqMask = 1<<pollFDSeqBits - 1 // mask for pollFDSeq
)

func ( pollInfo) () bool              { return &pollClosing != 0 }
func ( pollInfo) () bool             { return &pollEventErr != 0 }
func ( pollInfo) () bool  { return &pollExpiredReadDeadline != 0 }
func ( pollInfo) () bool { return &pollExpiredWriteDeadline != 0 }

// info returns the pollInfo corresponding to pd.
func ( *pollDesc) () pollInfo {
	return pollInfo(.atomicInfo.Load())
}

// publishInfo updates pd.atomicInfo (returned by pd.info)
// using the other values in pd.
// It must be called while holding pd.lock,
// and it must be called after changing anything
// that might affect the info bits.
// In practice this means after changing closing
// or changing rd or wd from < 0 to >= 0.
func ( *pollDesc) () {
	var  uint32
	if .closing {
		 |= pollClosing
	}
	if .rd < 0 {
		 |= pollExpiredReadDeadline
	}
	if .wd < 0 {
		 |= pollExpiredWriteDeadline
	}
	 |= uint32(.fdseq.Load()&pollFDSeqMask) << pollFDSeq

	// Set all of x except the pollEventErr bit.
	 := .atomicInfo.Load()
	for !.atomicInfo.CompareAndSwap(, (&pollEventErr)|) {
		 = .atomicInfo.Load()
	}
}

// setEventErr sets the result of pd.info().eventErr() to b.
// We only change the error bit if seq == 0 or if seq matches pollFDSeq
// (issue #59545).
func ( *pollDesc) ( bool,  uintptr) {
	 := uint32( & pollFDSeqMask)
	 := .atomicInfo.Load()
	 := ( >> pollFDSeq) & pollFDSeqMask
	if  != 0 &&  !=  {
		return
	}
	for (&pollEventErr != 0) !=  && !.atomicInfo.CompareAndSwap(, ^pollEventErr) {
		 = .atomicInfo.Load()
		 := ( >> pollFDSeq) & pollFDSeqMask
		if  != 0 &&  !=  {
			return
		}
	}
}

type pollCache struct {
	lock  mutex
	first *pollDesc
	// PollDesc objects must be type-stable,
	// because we can get ready notification from epoll/kqueue
	// after the descriptor is closed/reused.
	// Stale notifications are detected using seq variable,
	// seq is incremented when deadlines are changed or descriptor is reused.
}

var (
	netpollInitLock mutex
	netpollInited   atomic.Uint32

	pollcache      pollCache
	netpollWaiters atomic.Uint32
)

// netpollWaiters is accessed in tests
//go:linkname netpollWaiters

//go:linkname poll_runtime_pollServerInit internal/poll.runtime_pollServerInit
func poll_runtime_pollServerInit() {
	netpollGenericInit()
}

func netpollGenericInit() {
	if netpollInited.Load() == 0 {
		lockInit(&netpollInitLock, lockRankNetpollInit)
		lockInit(&pollcache.lock, lockRankPollCache)
		lock(&netpollInitLock)
		if netpollInited.Load() == 0 {
			netpollinit()
			netpollInited.Store(1)
		}
		unlock(&netpollInitLock)
	}
}

func netpollinited() bool {
	return netpollInited.Load() != 0
}

//go:linkname poll_runtime_isPollServerDescriptor internal/poll.runtime_isPollServerDescriptor

// poll_runtime_isPollServerDescriptor reports whether fd is a
// descriptor being used by netpoll.
func poll_runtime_isPollServerDescriptor( uintptr) bool {
	return netpollIsPollDescriptor()
}

//go:linkname poll_runtime_pollOpen internal/poll.runtime_pollOpen
func poll_runtime_pollOpen( uintptr) (*pollDesc, int) {
	 := pollcache.alloc()
	lock(&.lock)
	 := .wg.Load()
	if  != pdNil &&  != pdReady {
		throw("runtime: blocked write on free polldesc")
	}
	 := .rg.Load()
	if  != pdNil &&  != pdReady {
		throw("runtime: blocked read on free polldesc")
	}
	.fd = 
	if .fdseq.Load() == 0 {
		// The value 0 is special in setEventErr, so don't use it.
		.fdseq.Store(1)
	}
	.closing = false
	.setEventErr(false, 0)
	.rseq++
	.rg.Store(pdNil)
	.rd = 0
	.wseq++
	.wg.Store(pdNil)
	.wd = 0
	.self = 
	.publishInfo()
	unlock(&.lock)

	 := netpollopen(, )
	if  != 0 {
		pollcache.free()
		return nil, int()
	}
	return , 0
}

//go:linkname poll_runtime_pollClose internal/poll.runtime_pollClose
func poll_runtime_pollClose( *pollDesc) {
	if !.closing {
		throw("runtime: close polldesc w/o unblock")
	}
	 := .wg.Load()
	if  != pdNil &&  != pdReady {
		throw("runtime: blocked write on closing polldesc")
	}
	 := .rg.Load()
	if  != pdNil &&  != pdReady {
		throw("runtime: blocked read on closing polldesc")
	}
	netpollclose(.fd)
	pollcache.free()
}

func ( *pollCache) ( *pollDesc) {
	// pd can't be shared here, but lock anyhow because
	// that's what publishInfo documents.
	lock(&.lock)

	// Increment the fdseq field, so that any currently
	// running netpoll calls will not mark pd as ready.
	 := .fdseq.Load()
	 = ( + 1) & (1<<taggedPointerBits - 1)
	.fdseq.Store()

	.publishInfo()

	unlock(&.lock)

	lock(&.lock)
	.link = .first
	.first = 
	unlock(&.lock)
}

// poll_runtime_pollReset, which is internal/poll.runtime_pollReset,
// prepares a descriptor for polling in mode, which is 'r' or 'w'.
// This returns an error code; the codes are defined above.
//
//go:linkname poll_runtime_pollReset internal/poll.runtime_pollReset
func poll_runtime_pollReset( *pollDesc,  int) int {
	 := netpollcheckerr(, int32())
	if  != pollNoError {
		return 
	}
	if  == 'r' {
		.rg.Store(pdNil)
	} else if  == 'w' {
		.wg.Store(pdNil)
	}
	return pollNoError
}

// poll_runtime_pollWait, which is internal/poll.runtime_pollWait,
// waits for a descriptor to be ready for reading or writing,
// according to mode, which is 'r' or 'w'.
// This returns an error code; the codes are defined above.
//
//go:linkname poll_runtime_pollWait internal/poll.runtime_pollWait
func poll_runtime_pollWait( *pollDesc,  int) int {
	 := netpollcheckerr(, int32())
	if  != pollNoError {
		return 
	}
	// As for now only Solaris, illumos, AIX and wasip1 use level-triggered IO.
	if GOOS == "solaris" || GOOS == "illumos" || GOOS == "aix" || GOOS == "wasip1" {
		netpollarm(, )
	}
	for !netpollblock(, int32(), false) {
		 = netpollcheckerr(, int32())
		if  != pollNoError {
			return 
		}
		// Can happen if timeout has fired and unblocked us,
		// but before we had a chance to run, timeout has been reset.
		// Pretend it has not happened and retry.
	}
	return pollNoError
}

//go:linkname poll_runtime_pollWaitCanceled internal/poll.runtime_pollWaitCanceled
func poll_runtime_pollWaitCanceled( *pollDesc,  int) {
	// This function is used only on windows after a failed attempt to cancel
	// a pending async IO operation. Wait for ioready, ignore closing or timeouts.
	for !netpollblock(, int32(), true) {
	}
}

//go:linkname poll_runtime_pollSetDeadline internal/poll.runtime_pollSetDeadline
func poll_runtime_pollSetDeadline( *pollDesc,  int64,  int) {
	lock(&.lock)
	if .closing {
		unlock(&.lock)
		return
	}
	,  := .rd, .wd
	 :=  > 0 &&  == 
	if  > 0 {
		 += nanotime()
		if  <= 0 {
			// If the user has a deadline in the future, but the delay calculation
			// overflows, then set the deadline to the maximum possible value.
			 = 1<<63 - 1
		}
	}
	if  == 'r' ||  == 'r'+'w' {
		.rd = 
	}
	if  == 'w' ||  == 'r'+'w' {
		.wd = 
	}
	.publishInfo()
	 := .rd > 0 && .rd == .wd
	 := netpollReadDeadline
	if  {
		 = netpollDeadline
	}
	if !.rrun {
		if .rd > 0 {
			// Copy current seq into the timer arg.
			// Timer func will check the seq against current descriptor seq,
			// if they differ the descriptor was reused or timers were reset.
			.rt.modify(.rd, 0, , .makeArg(), .rseq)
			.rrun = true
		}
	} else if .rd !=  ||  !=  {
		.rseq++ // invalidate current timers
		if .rd > 0 {
			.rt.modify(.rd, 0, , .makeArg(), .rseq)
		} else {
			.rt.stop()
			.rrun = false
		}
	}
	if !.wrun {
		if .wd > 0 && ! {
			.wt.modify(.wd, 0, netpollWriteDeadline, .makeArg(), .wseq)
			.wrun = true
		}
	} else if .wd !=  ||  !=  {
		.wseq++ // invalidate current timers
		if .wd > 0 && ! {
			.wt.modify(.wd, 0, netpollWriteDeadline, .makeArg(), .wseq)
		} else {
			.wt.stop()
			.wrun = false
		}
	}
	// If we set the new deadline in the past, unblock currently pending IO if any.
	// Note that pd.publishInfo has already been called, above, immediately after modifying rd and wd.
	 := int32(0)
	var ,  *g
	if .rd < 0 {
		 = netpollunblock(, 'r', false, &)
	}
	if .wd < 0 {
		 = netpollunblock(, 'w', false, &)
	}
	unlock(&.lock)
	if  != nil {
		netpollgoready(, 3)
	}
	if  != nil {
		netpollgoready(, 3)
	}
	netpollAdjustWaiters()
}

//go:linkname poll_runtime_pollUnblock internal/poll.runtime_pollUnblock
func poll_runtime_pollUnblock( *pollDesc) {
	lock(&.lock)
	if .closing {
		throw("runtime: unblock on closing polldesc")
	}
	.closing = true
	.rseq++
	.wseq++
	var ,  *g
	.publishInfo()
	 := int32(0)
	 = netpollunblock(, 'r', false, &)
	 = netpollunblock(, 'w', false, &)
	if .rrun {
		.rt.stop()
		.rrun = false
	}
	if .wrun {
		.wt.stop()
		.wrun = false
	}
	unlock(&.lock)
	if  != nil {
		netpollgoready(, 3)
	}
	if  != nil {
		netpollgoready(, 3)
	}
	netpollAdjustWaiters()
}

// netpollready is called by the platform-specific netpoll function.
// It declares that the fd associated with pd is ready for I/O.
// The toRun argument is used to build a list of goroutines to return
// from netpoll. The mode argument is 'r', 'w', or 'r'+'w' to indicate
// whether the fd is ready for reading or writing or both.
//
// This returns a delta to apply to netpollWaiters.
//
// This may run while the world is stopped, so write barriers are not allowed.
//
//go:nowritebarrier
func netpollready( *gList,  *pollDesc,  int32) int32 {
	 := int32(0)
	var ,  *g
	if  == 'r' ||  == 'r'+'w' {
		 = netpollunblock(, 'r', true, &)
	}
	if  == 'w' ||  == 'r'+'w' {
		 = netpollunblock(, 'w', true, &)
	}
	if  != nil {
		.push()
	}
	if  != nil {
		.push()
	}
	return 
}

func netpollcheckerr( *pollDesc,  int32) int {
	 := .info()
	if .closing() {
		return pollErrClosing
	}
	if ( == 'r' && .expiredReadDeadline()) || ( == 'w' && .expiredWriteDeadline()) {
		return pollErrTimeout
	}
	// Report an event scanning error only on a read event.
	// An error on a write event will be captured in a subsequent
	// write call that is able to report a more specific error.
	if  == 'r' && .eventErr() {
		return pollErrNotPollable
	}
	return pollNoError
}

func netpollblockcommit( *g,  unsafe.Pointer) bool {
	 := atomic.Casuintptr((*uintptr)(), pdWait, uintptr(unsafe.Pointer()))
	if  {
		// Bump the count of goroutines waiting for the poller.
		// The scheduler uses this to decide whether to block
		// waiting for the poller if there is nothing else to do.
		netpollAdjustWaiters(1)
	}
	return 
}

func netpollgoready( *g,  int) {
	goready(, +1)
}

// returns true if IO is ready, or false if timed out or closed
// waitio - wait only for completed IO, ignore errors
// Concurrent calls to netpollblock in the same mode are forbidden, as pollDesc
// can hold only a single waiting goroutine for each mode.
func netpollblock( *pollDesc,  int32,  bool) bool {
	 := &.rg
	if  == 'w' {
		 = &.wg
	}

	// set the gpp semaphore to pdWait
	for {
		// Consume notification if already ready.
		if .CompareAndSwap(pdReady, pdNil) {
			return true
		}
		if .CompareAndSwap(pdNil, pdWait) {
			break
		}

		// Double check that this isn't corrupt; otherwise we'd loop
		// forever.
		if  := .Load();  != pdReady &&  != pdNil {
			throw("runtime: double wait")
		}
	}

	// need to recheck error states after setting gpp to pdWait
	// this is necessary because runtime_pollUnblock/runtime_pollSetDeadline/deadlineimpl
	// do the opposite: store to closing/rd/wd, publishInfo, load of rg/wg
	if  || netpollcheckerr(, ) == pollNoError {
		gopark(netpollblockcommit, unsafe.Pointer(), waitReasonIOWait, traceBlockNet, 5)
	}
	// be careful to not lose concurrent pdReady notification
	 := .Swap(pdNil)
	if  > pdWait {
		throw("runtime: corrupted polldesc")
	}
	return  == pdReady
}

// netpollunblock moves either pd.rg (if mode == 'r') or
// pd.wg (if mode == 'w') into the pdReady state.
// This returns any goroutine blocked on pd.{rg,wg}.
// It adds any adjustment to netpollWaiters to *delta;
// this adjustment should be applied after the goroutine has
// been marked ready.
func netpollunblock( *pollDesc,  int32,  bool,  *int32) *g {
	 := &.rg
	if  == 'w' {
		 = &.wg
	}

	for {
		 := .Load()
		if  == pdReady {
			return nil
		}
		if  == pdNil && ! {
			// Only set pdReady for ioready. runtime_pollWait
			// will check for timeout/cancel before waiting.
			return nil
		}
		 := pdNil
		if  {
			 = pdReady
		}
		if .CompareAndSwap(, ) {
			if  == pdWait {
				 = pdNil
			} else if  != pdNil {
				* -= 1
			}
			return (*g)(unsafe.Pointer())
		}
	}
}

func netpolldeadlineimpl( *pollDesc,  uintptr, ,  bool) {
	lock(&.lock)
	// Seq arg is seq when the timer was set.
	// If it's stale, ignore the timer event.
	 := .rseq
	if ! {
		 = .wseq
	}
	if  !=  {
		// The descriptor was reused or timers were reset.
		unlock(&.lock)
		return
	}
	 := int32(0)
	var  *g
	if  {
		if .rd <= 0 || !.rrun {
			throw("runtime: inconsistent read deadline")
		}
		.rd = -1
		.publishInfo()
		 = netpollunblock(, 'r', false, &)
	}
	var  *g
	if  {
		if .wd <= 0 || !.wrun && ! {
			throw("runtime: inconsistent write deadline")
		}
		.wd = -1
		.publishInfo()
		 = netpollunblock(, 'w', false, &)
	}
	unlock(&.lock)
	if  != nil {
		netpollgoready(, 0)
	}
	if  != nil {
		netpollgoready(, 0)
	}
	netpollAdjustWaiters()
}

func netpollDeadline( any,  uintptr,  int64) {
	netpolldeadlineimpl(.(*pollDesc), , true, true)
}

func netpollReadDeadline( any,  uintptr,  int64) {
	netpolldeadlineimpl(.(*pollDesc), , true, false)
}

func netpollWriteDeadline( any,  uintptr,  int64) {
	netpolldeadlineimpl(.(*pollDesc), , false, true)
}

// netpollAnyWaiters reports whether any goroutines are waiting for I/O.
func netpollAnyWaiters() bool {
	return netpollWaiters.Load() > 0
}

// netpollAdjustWaiters adds delta to netpollWaiters.
func netpollAdjustWaiters( int32) {
	if  != 0 {
		netpollWaiters.Add()
	}
}

func ( *pollCache) () *pollDesc {
	lock(&.lock)
	if .first == nil {
		const  = unsafe.Sizeof(pollDesc{})
		 := pollBlockSize / 
		if  == 0 {
			 = 1
		}
		// Must be in non-GC memory because can be referenced
		// only from epoll/kqueue internals.
		 := persistentalloc(*, 0, &memstats.other_sys)
		for  := uintptr(0);  < ; ++ {
			 := (*pollDesc)(add(, *))
			lockInit(&.lock, lockRankPollDesc)
			.rt.init(nil, nil)
			.wt.init(nil, nil)
			.link = .first
			.first = 
		}
	}
	 := .first
	.first = .link
	unlock(&.lock)
	return 
}

// makeArg converts pd to an interface{}.
// makeArg does not do any allocation. Normally, such
// a conversion requires an allocation because pointers to
// types which embed runtime/internal/sys.NotInHeap (which pollDesc is)
// must be stored in interfaces indirectly. See issue 42076.
func ( *pollDesc) () ( any) {
	 := (*eface)(unsafe.Pointer(&))
	._type = pdType
	.data = unsafe.Pointer(&.self)
	return
}

var (
	pdEface any    = (*pollDesc)(nil)
	pdType  *_type = efaceOf(&pdEface)._type
)