mirror of
https://github.com/cwinfo/yggdrasil-go.git
synced 2024-11-10 09:50:27 +00:00
Add deadline timers, keep searches alive until they complete (or the conn is closed) to keep Write from blocking forever
This commit is contained in:
parent
0059baf36c
commit
15051b0a3c
@ -11,19 +11,35 @@ import (
|
|||||||
"github.com/yggdrasil-network/yggdrasil-go/src/util"
|
"github.com/yggdrasil-network/yggdrasil-go/src/util"
|
||||||
)
|
)
|
||||||
|
|
||||||
|
// ConnError is the error value returned by Conn operations. It wraps an
// underlying error and carries the two flags required by the net.Error
// interface, so callers can type-assert a returned error to net.Error and
// ask whether it was a timeout.
type ConnError struct {
	error
	timeout   bool
	temporary bool
}

// Timeout returns the timeout flag the error was constructed with. Read and
// Write set this flag when their deadline timer fires.
//
// The receiver is a value rather than a pointer on purpose: Read and Write
// return ConnError by value, and with a pointer receiver only *ConnError
// would satisfy net.Error, so a returned ConnError value would fail a
// net.Error type assertion. With a value receiver both ConnError and
// *ConnError satisfy the interface.
func (e ConnError) Timeout() bool {
	return e.timeout
}

// Temporary returns the temporary flag the error was constructed with.
//
// It uses a value receiver for the same reason as Timeout.
func (e ConnError) Temporary() bool {
	return e.temporary
}
|
||||||
|
|
||||||
type Conn struct {
|
type Conn struct {
|
||||||
core *Core
|
core *Core
|
||||||
nodeID *crypto.NodeID
|
nodeID *crypto.NodeID
|
||||||
nodeMask *crypto.NodeID
|
nodeMask *crypto.NodeID
|
||||||
mutex sync.RWMutex
|
mutex sync.RWMutex
|
||||||
|
closed bool
|
||||||
session *sessionInfo
|
session *sessionInfo
|
||||||
readDeadline atomic.Value // time.Time // TODO timer
|
readDeadline atomic.Value // time.Time // TODO timer
|
||||||
writeDeadline atomic.Value // time.Time // TODO timer
|
writeDeadline atomic.Value // time.Time // TODO timer
|
||||||
searching atomic.Value // bool
|
searching atomic.Value // bool
|
||||||
searchwait chan struct{}
|
searchwait chan struct{} // Never reset this, it's only used for the initial search
|
||||||
}
|
}
|
||||||
|
|
||||||
// TODO func NewConn() that initializes atomic and channel fields so things don't crash or block indefinitely
|
// TODO func NewConn() that initializes additional fields as needed
|
||||||
func newConn(core *Core, nodeID *crypto.NodeID, nodeMask *crypto.NodeID, session *sessionInfo) *Conn {
|
func newConn(core *Core, nodeID *crypto.NodeID, nodeMask *crypto.NodeID, session *sessionInfo) *Conn {
|
||||||
conn := Conn{
|
conn := Conn{
|
||||||
core: core,
|
core: core,
|
||||||
@ -32,7 +48,6 @@ func newConn(core *Core, nodeID *crypto.NodeID, nodeMask *crypto.NodeID, session
|
|||||||
session: session,
|
session: session,
|
||||||
searchwait: make(chan struct{}),
|
searchwait: make(chan struct{}),
|
||||||
}
|
}
|
||||||
conn.SetDeadline(time.Time{})
|
|
||||||
conn.searching.Store(false)
|
conn.searching.Store(false)
|
||||||
return &conn
|
return &conn
|
||||||
}
|
}
|
||||||
@ -45,22 +60,27 @@ func (c *Conn) String() string {
|
|||||||
func (c *Conn) startSearch() {
|
func (c *Conn) startSearch() {
|
||||||
// The searchCompleted callback is given to the search
|
// The searchCompleted callback is given to the search
|
||||||
searchCompleted := func(sinfo *sessionInfo, err error) {
|
searchCompleted := func(sinfo *sessionInfo, err error) {
|
||||||
// Make sure that any blocks on read/write operations are lifted
|
defer c.searching.Store(false)
|
||||||
defer func() {
|
|
||||||
defer func() { recover() }() // In case searchwait was closed by another goroutine
|
|
||||||
c.searching.Store(false)
|
|
||||||
close(c.searchwait) // Never reset this to an open channel
|
|
||||||
}()
|
|
||||||
// If the search failed for some reason, e.g. it hit a dead end or timed
|
// If the search failed for some reason, e.g. it hit a dead end or timed
|
||||||
// out, then do nothing
|
// out, then do nothing
|
||||||
if err != nil {
|
if err != nil {
|
||||||
c.core.log.Debugln(c.String(), "DHT search failed:", err)
|
c.core.log.Debugln(c.String(), "DHT search failed:", err)
|
||||||
|
go func() {
|
||||||
|
time.Sleep(time.Second)
|
||||||
|
c.mutex.RLock()
|
||||||
|
closed := c.closed
|
||||||
|
c.mutex.RUnlock()
|
||||||
|
if !closed {
|
||||||
|
// Restart the search, or else Write can stay blocked forever
|
||||||
|
c.core.router.admin <- c.startSearch
|
||||||
|
}
|
||||||
|
}()
|
||||||
return
|
return
|
||||||
}
|
}
|
||||||
// Take the connection mutex
|
// Take the connection mutex
|
||||||
c.mutex.Lock()
|
c.mutex.Lock()
|
||||||
defer c.mutex.Unlock()
|
defer c.mutex.Unlock()
|
||||||
// Were we successfully given a sessionInfo pointeR?
|
// Were we successfully given a sessionInfo pointer?
|
||||||
if sinfo != nil {
|
if sinfo != nil {
|
||||||
// Store it, and update the nodeID and nodeMask (which may have been
|
// Store it, and update the nodeID and nodeMask (which may have been
|
||||||
// wildcarded before now) with their complete counterparts
|
// wildcarded before now) with their complete counterparts
|
||||||
@ -70,11 +90,19 @@ func (c *Conn) startSearch() {
|
|||||||
for i := range c.nodeMask {
|
for i := range c.nodeMask {
|
||||||
c.nodeMask[i] = 0xFF
|
c.nodeMask[i] = 0xFF
|
||||||
}
|
}
|
||||||
|
// Make sure that any blocks on read/write operations are lifted
|
||||||
|
defer func() { recover() }() // So duplicate searches don't panic
|
||||||
|
close(c.searchwait)
|
||||||
} else {
|
} else {
|
||||||
// No session was returned - this shouldn't really happen because we
|
// No session was returned - this shouldn't really happen because we
|
||||||
// should always return an error reason if we don't return a session
|
// should always return an error reason if we don't return a session
|
||||||
panic("DHT search didn't return an error or a sessionInfo")
|
panic("DHT search didn't return an error or a sessionInfo")
|
||||||
}
|
}
|
||||||
|
if c.closed {
|
||||||
|
// Things were closed before the search returned
|
||||||
|
// Go ahead and close it again to make sure the session is cleaned up
|
||||||
|
go c.Close()
|
||||||
|
}
|
||||||
}
|
}
|
||||||
// doSearch will be called below in response to one or more conditions
|
// doSearch will be called below in response to one or more conditions
|
||||||
doSearch := func() {
|
doSearch := func() {
|
||||||
@ -115,17 +143,30 @@ func (c *Conn) startSearch() {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// getDeadlineTimer returns a timer that fires when the deadline stored in
// value is reached.
//
// value is expected to hold a time.Time. If nothing has been stored yet, or
// the stored time is the zero time.Time (the net.Conn convention for "no
// deadline"), the returned timer is stopped and never fires, so a select on
// its channel blocks indefinitely. A deadline that is already in the past
// yields a timer that fires immediately.
//
// The caller owns the returned timer and should stop it when done.
func getDeadlineTimer(value *atomic.Value) *time.Timer {
	// Build a stopped timer with an empty channel. Using a long duration and
	// stopping it straight away guarantees the timer has not fired, so there
	// is no stale value to drain from timer.C.
	timer := time.NewTimer(time.Hour)
	timer.Stop()
	// Only arm the timer for a real deadline. Without the IsZero check a
	// cleared deadline would produce a hugely negative duration and the timer
	// would fire at once, making every operation time out.
	if deadline, ok := value.Load().(time.Time); ok && !deadline.IsZero() {
		timer.Reset(time.Until(deadline))
	}
	return timer
}
|
||||||
|
|
||||||
func (c *Conn) Read(b []byte) (int, error) {
|
func (c *Conn) Read(b []byte) (int, error) {
|
||||||
// Take a copy of the session object
|
// Take a copy of the session object
|
||||||
c.mutex.RLock()
|
c.mutex.RLock()
|
||||||
sinfo := c.session
|
sinfo := c.session
|
||||||
c.mutex.RUnlock()
|
c.mutex.RUnlock()
|
||||||
timer := time.NewTimer(0)
|
timer := getDeadlineTimer(&c.readDeadline)
|
||||||
util.TimerStop(timer)
|
defer util.TimerStop(timer)
|
||||||
// If there is a search in progress then wait for the result
|
// If there is a search in progress then wait for the result
|
||||||
if sinfo == nil {
|
if sinfo == nil {
|
||||||
// Wait for the search to complete
|
// Wait for the search to complete
|
||||||
<-c.searchwait
|
select {
|
||||||
|
case <-c.searchwait:
|
||||||
|
case <-timer.C:
|
||||||
|
return 0, ConnError{errors.New("Timeout"), true, false}
|
||||||
|
}
|
||||||
// Retrieve our session info again
|
// Retrieve our session info again
|
||||||
c.mutex.RLock()
|
c.mutex.RLock()
|
||||||
sinfo = c.session
|
sinfo = c.session
|
||||||
@ -146,8 +187,9 @@ func (c *Conn) Read(b []byte) (int, error) {
|
|||||||
}
|
}
|
||||||
defer util.PutBytes(p.Payload)
|
defer util.PutBytes(p.Payload)
|
||||||
var err error
|
var err error
|
||||||
// Hand over to the session worker
|
done := make(chan struct{})
|
||||||
sinfo.doWorker(func() {
|
workerFunc := func() {
|
||||||
|
defer close(done)
|
||||||
// If the nonce is bad then drop the packet and return an error
|
// If the nonce is bad then drop the packet and return an error
|
||||||
if !sinfo.nonceIsOK(&p.Nonce) {
|
if !sinfo.nonceIsOK(&p.Nonce) {
|
||||||
err = errors.New("packet dropped due to invalid nonce")
|
err = errors.New("packet dropped due to invalid nonce")
|
||||||
@ -172,7 +214,18 @@ func (c *Conn) Read(b []byte) (int, error) {
|
|||||||
sinfo.updateNonce(&p.Nonce)
|
sinfo.updateNonce(&p.Nonce)
|
||||||
sinfo.time = time.Now()
|
sinfo.time = time.Now()
|
||||||
sinfo.bytesRecvd += uint64(len(b))
|
sinfo.bytesRecvd += uint64(len(b))
|
||||||
})
|
}
|
||||||
|
// Hand over to the session worker
|
||||||
|
select { // Send to worker
|
||||||
|
case sinfo.worker <- workerFunc:
|
||||||
|
case <-timer.C:
|
||||||
|
return 0, ConnError{errors.New("Timeout"), true, false}
|
||||||
|
}
|
||||||
|
select { // Wait for worker to return
|
||||||
|
case <-done:
|
||||||
|
case <-timer.C:
|
||||||
|
return 0, ConnError{errors.New("Timeout"), true, false}
|
||||||
|
}
|
||||||
// Something went wrong in the session worker so abort
|
// Something went wrong in the session worker so abort
|
||||||
if err != nil {
|
if err != nil {
|
||||||
return 0, err
|
return 0, err
|
||||||
@ -187,6 +240,8 @@ func (c *Conn) Write(b []byte) (bytesWritten int, err error) {
|
|||||||
c.mutex.RLock()
|
c.mutex.RLock()
|
||||||
sinfo := c.session
|
sinfo := c.session
|
||||||
c.mutex.RUnlock()
|
c.mutex.RUnlock()
|
||||||
|
timer := getDeadlineTimer(&c.writeDeadline)
|
||||||
|
defer util.TimerStop(timer)
|
||||||
// If the session doesn't exist, or isn't initialised (which probably means
|
// If the session doesn't exist, or isn't initialised (which probably means
|
||||||
// that the search didn't complete successfully) then we may need to wait for
|
// that the search didn't complete successfully) then we may need to wait for
|
||||||
// the search to complete or start the search again
|
// the search to complete or start the search again
|
||||||
@ -199,7 +254,11 @@ func (c *Conn) Write(b []byte) (bytesWritten int, err error) {
|
|||||||
})
|
})
|
||||||
}
|
}
|
||||||
// Wait for the search to complete
|
// Wait for the search to complete
|
||||||
<-c.searchwait
|
select {
|
||||||
|
case <-c.searchwait:
|
||||||
|
case <-timer.C:
|
||||||
|
return 0, ConnError{errors.New("Timeout"), true, false}
|
||||||
|
}
|
||||||
// Retrieve our session info again
|
// Retrieve our session info again
|
||||||
c.mutex.RLock()
|
c.mutex.RLock()
|
||||||
sinfo = c.session
|
sinfo = c.session
|
||||||
@ -213,8 +272,9 @@ func (c *Conn) Write(b []byte) (bytesWritten int, err error) {
|
|||||||
}
|
}
|
||||||
// defer util.PutBytes(b)
|
// defer util.PutBytes(b)
|
||||||
var packet []byte
|
var packet []byte
|
||||||
// Hand over to the session worker
|
done := make(chan struct{})
|
||||||
sinfo.doWorker(func() {
|
workerFunc := func() {
|
||||||
|
defer close(done)
|
||||||
// Encrypt the packet
|
// Encrypt the packet
|
||||||
payload, nonce := crypto.BoxSeal(&sinfo.sharedSesKey, b, &sinfo.myNonce)
|
payload, nonce := crypto.BoxSeal(&sinfo.sharedSesKey, b, &sinfo.myNonce)
|
||||||
defer util.PutBytes(payload)
|
defer util.PutBytes(payload)
|
||||||
@ -227,7 +287,18 @@ func (c *Conn) Write(b []byte) (bytesWritten int, err error) {
|
|||||||
}
|
}
|
||||||
packet = p.encode()
|
packet = p.encode()
|
||||||
sinfo.bytesSent += uint64(len(b))
|
sinfo.bytesSent += uint64(len(b))
|
||||||
})
|
}
|
||||||
|
// Hand over to the session worker
|
||||||
|
select { // Send to worker
|
||||||
|
case sinfo.worker <- workerFunc:
|
||||||
|
case <-timer.C:
|
||||||
|
return 0, ConnError{errors.New("Timeout"), true, false}
|
||||||
|
}
|
||||||
|
select { // Wait for worker to return
|
||||||
|
case <-done:
|
||||||
|
case <-timer.C:
|
||||||
|
return 0, ConnError{errors.New("Timeout"), true, false}
|
||||||
|
}
|
||||||
// Give the packet to the router
|
// Give the packet to the router
|
||||||
sinfo.core.router.out(packet)
|
sinfo.core.router.out(packet)
|
||||||
// Finally return the number of bytes we wrote
|
// Finally return the number of bytes we wrote
|
||||||
@ -235,10 +306,15 @@ func (c *Conn) Write(b []byte) (bytesWritten int, err error) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
func (c *Conn) Close() error {
|
func (c *Conn) Close() error {
|
||||||
|
c.mutex.Lock()
|
||||||
|
defer c.mutex.Unlock()
|
||||||
|
if c.session != nil {
|
||||||
// Close the session, if it hasn't been closed already
|
// Close the session, if it hasn't been closed already
|
||||||
c.session.close()
|
c.session.close()
|
||||||
c.session = nil
|
c.session = nil
|
||||||
|
}
|
||||||
// This can't fail yet - TODO?
|
// This can't fail yet - TODO?
|
||||||
|
c.closed = true
|
||||||
return nil
|
return nil
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user