mirror of
https://github.com/codex-storage/nim-libp2p.git
synced 2025-01-15 21:44:19 +00:00
980764774e
* add finegrained timeouts to pubsub * use 10 millis timeout in tests * finalization * revert timeouts * use `atEof` for reads * adjust timeouts and use atEof for reads * use atEof for reads * set isEof flag * no backoff for pubsub streams * temp timer increase, make macos finalize * don't call `subscribePeer` in libp2p anymore * more traces * leak tests * lower timeouts * handle exceptions in control message * don't use `cancelAndWait` * handle exceptions in helpers * wip * don't send empty messages * check for leaks properly * don't use cancelAndWait * don't await subscribption sends * remove subscrivePeer calls from switch * trying without the hooks again
346 lines
9.0 KiB
Nim
346 lines
9.0 KiB
Nim
## Nim-LibP2P
|
|
## Copyright (c) 2019 Status Research & Development GmbH
|
|
## Licensed under either of
|
|
## * Apache License, version 2.0, ([LICENSE-APACHE](LICENSE-APACHE))
|
|
## * MIT license ([LICENSE-MIT](LICENSE-MIT))
|
|
## at your option.
|
|
## This file may not be copied, modified, or distributed except according to
|
|
## those terms.
|
|
|
|
import oids, deques
|
|
import chronos, chronicles, metrics
|
|
import types,
|
|
coder,
|
|
../muxer,
|
|
nimcrypto/utils,
|
|
../../stream/connection,
|
|
../../stream/bufferstream,
|
|
../../peerinfo
|
|
|
|
export connection
|
|
|
|
logScope:
|
|
topics = "mplexchannel"
|
|
|
|
## Channel half-closed states
|
|
##
|
|
## | State | Closed local | Closed remote
|
|
## |=============================================
|
|
## | Read | Yes (until EOF) | No
|
|
## | Write | No | Yes
|
|
##
|
|
|
|
# TODO: this is one place where we need to use
|
|
# a proper state machine, but I've opted out of
|
|
# it for now for two reasons:
|
|
#
|
|
# 1) we don't have that many states to manage
|
|
# 2) I'm not sure if adding the state machine
|
|
# would have simplified or complicated the code
|
|
#
|
|
# But now that this is in place, we should perhaps
|
|
# reconsider reworking it again, this time with a
|
|
# more formal approach.
|
|
#
|
|
|
|
type
|
|
LPChannel* = ref object of BufferStream
|
|
id*: uint64 # channel id
|
|
timeout: Duration # channel timeout if no activity
|
|
activity: bool # reset every time data is sent or received
|
|
name*: string # name of the channel (for debugging)
|
|
conn*: Connection # wrapped connection used to for writing
|
|
initiator*: bool # initiated remotely or locally flag
|
|
isLazy*: bool # is channel lazy
|
|
isOpen*: bool # has channel been opened (only used with isLazy)
|
|
closedLocal*: bool # has channel been closed locally
|
|
msgCode*: MessageType # cached in/out message code
|
|
closeCode*: MessageType # cached in/out close code
|
|
resetCode*: MessageType # cached in/out reset code
|
|
timerTaskFut: Future[void] # the current timer instanse
|
|
|
|
proc open*(s: LPChannel) {.async, gcsafe.}
|
|
|
|
template withWriteLock(lock: AsyncLock, body: untyped): untyped =
|
|
try:
|
|
await lock.acquire()
|
|
body
|
|
finally:
|
|
if not(isNil(lock)) and lock.locked:
|
|
lock.release()
|
|
|
|
template withEOFExceptions(body: untyped): untyped =
|
|
try:
|
|
body
|
|
except LPStreamEOFError as exc:
|
|
trace "muxed connection EOF", exc = exc.msg
|
|
except LPStreamClosedError as exc:
|
|
trace "muxed connection closed", exc = exc.msg
|
|
except LPStreamIncompleteError as exc:
|
|
trace "incomplete message", exc = exc.msg
|
|
|
|
proc cleanupTimer(s: LPChannel) {.async.} =
|
|
## cleanup timers
|
|
if not isNil(s.timerTaskFut) and not s.timerTaskFut.finished:
|
|
s.timerTaskFut.cancel()
|
|
|
|
proc closeMessage(s: LPChannel) {.async.} =
|
|
logScope:
|
|
id = s.id
|
|
initiator = s.initiator
|
|
name = s.name
|
|
oid = $s.oid
|
|
peer = $s.conn.peerInfo
|
|
# stack = getStackTrace()
|
|
|
|
## send close message - this will not raise
|
|
## on EOF or Closed
|
|
withWriteLock(s.writeLock):
|
|
trace "sending close message"
|
|
|
|
await s.conn.writeMsg(s.id, s.closeCode) # write close
|
|
|
|
proc resetMessage(s: LPChannel) {.async.} =
|
|
logScope:
|
|
id = s.id
|
|
initiator = s.initiator
|
|
name = s.name
|
|
oid = $s.oid
|
|
peer = $s.conn.peerInfo
|
|
# stack = getStackTrace()
|
|
|
|
## send reset message - this will not raise
|
|
withEOFExceptions:
|
|
withWriteLock(s.writeLock):
|
|
trace "sending reset message"
|
|
|
|
await s.conn.writeMsg(s.id, s.resetCode) # write reset
|
|
|
|
proc open*(s: LPChannel) {.async, gcsafe.} =
|
|
logScope:
|
|
id = s.id
|
|
initiator = s.initiator
|
|
name = s.name
|
|
oid = $s.oid
|
|
peer = $s.conn.peerInfo
|
|
# stack = getStackTrace()
|
|
|
|
## NOTE: Don't call withExcAndLock or withWriteLock,
|
|
## because this already gets called from writeHandler
|
|
## which is locked
|
|
await s.conn.writeMsg(s.id, MessageType.New, s.name)
|
|
trace "opened channel"
|
|
s.isOpen = true
|
|
|
|
proc closeRemote*(s: LPChannel) {.async.} =
|
|
logScope:
|
|
id = s.id
|
|
initiator = s.initiator
|
|
name = s.name
|
|
oid = $s.oid
|
|
peer = $s.conn.peerInfo
|
|
# stack = getStackTrace()
|
|
|
|
trace "got EOF, closing channel"
|
|
try:
|
|
await s.drainBuffer()
|
|
|
|
s.isEof = true # set EOF immediately to prevent further reads
|
|
await s.close() # close local end
|
|
|
|
# call to avoid leaks
|
|
await procCall BufferStream(s).close() # close parent bufferstream
|
|
await s.cleanupTimer()
|
|
|
|
trace "channel closed on EOF"
|
|
except CancelledError as exc:
|
|
raise exc
|
|
except CatchableError as exc:
|
|
trace "exception closing remote channel", exc = exc.msg
|
|
|
|
method closed*(s: LPChannel): bool =
|
|
## this emulates half-closed behavior
|
|
## when closed locally writing is
|
|
## disabled - see the table in the
|
|
## header of the file
|
|
s.closedLocal
|
|
|
|
method reset*(s: LPChannel) {.base, async, gcsafe.} =
|
|
logScope:
|
|
id = s.id
|
|
initiator = s.initiator
|
|
name = s.name
|
|
oid = $s.oid
|
|
peer = $s.conn.peerInfo
|
|
# stack = getStackTrace()
|
|
|
|
if s.closedLocal and s.isEof:
|
|
trace "channel already closed or reset"
|
|
return
|
|
|
|
trace "resetting channel"
|
|
|
|
# we asyncCheck here because the other end
|
|
# might be dead already - reset is always
|
|
# optimistic
|
|
asyncCheck s.resetMessage()
|
|
|
|
try:
|
|
# drain the buffer before closing
|
|
await s.drainBuffer()
|
|
await procCall BufferStream(s).close()
|
|
|
|
s.isEof = true
|
|
s.closedLocal = true
|
|
|
|
await s.cleanupTimer()
|
|
|
|
except CancelledError as exc:
|
|
raise exc
|
|
except CatchableError as exc:
|
|
trace "exception in reset", exc = exc.msg
|
|
|
|
trace "channel reset"
|
|
|
|
method close*(s: LPChannel) {.async, gcsafe.} =
|
|
logScope:
|
|
id = s.id
|
|
initiator = s.initiator
|
|
name = s.name
|
|
oid = $s.oid
|
|
peer = $s.conn.peerInfo
|
|
# stack = getStackTrace()
|
|
|
|
if s.closedLocal:
|
|
trace "channel already closed"
|
|
return
|
|
|
|
trace "closing local lpchannel"
|
|
|
|
proc closeInternal() {.async.} =
|
|
try:
|
|
await s.closeMessage().wait(2.minutes)
|
|
if s.atEof: # already closed by remote close parent buffer immediately
|
|
await procCall BufferStream(s).close()
|
|
await s.cleanupTimer()
|
|
except CancelledError as exc:
|
|
await s.reset()
|
|
raise exc
|
|
except CatchableError as exc:
|
|
trace "exception closing channel", exc = exc.msg
|
|
await s.reset()
|
|
|
|
trace "lpchannel closed local"
|
|
|
|
s.closedLocal = true
|
|
asyncCheck closeInternal()
|
|
|
|
proc timeoutMonitor(s: LPChannel) {.async.} =
|
|
## monitor the channel for innactivity
|
|
##
|
|
## if the timeout was hit, it means that
|
|
## neither incoming nor outgoing activity
|
|
## has been detected and the channel will
|
|
## be reset
|
|
##
|
|
|
|
logScope:
|
|
id = s.id
|
|
initiator = s.initiator
|
|
name = s.name
|
|
oid = $s.oid
|
|
peer = $s.conn.peerInfo
|
|
|
|
try:
|
|
while true:
|
|
await sleepAsync(s.timeout)
|
|
|
|
if s.closed or s.atEof:
|
|
return
|
|
|
|
if s.activity:
|
|
s.activity = false
|
|
continue
|
|
|
|
break
|
|
|
|
# reset channel on innactivity timeout
|
|
trace "channel timed out, resetting"
|
|
await s.reset()
|
|
except CancelledError as exc:
|
|
raise exc
|
|
except CatchableError as exc:
|
|
trace "exception in timeout", exc = exc.msg
|
|
|
|
method initStream*(s: LPChannel) =
|
|
if s.objName.len == 0:
|
|
s.objName = "LPChannel"
|
|
|
|
procCall BufferStream(s).initStream()
|
|
|
|
method readOnce*(s: LPChannel,
|
|
pbytes: pointer,
|
|
nbytes: int):
|
|
Future[int] =
|
|
s.activity = true
|
|
procCall BufferStream(s).readOnce(pbytes, nbytes)
|
|
|
|
method write*(s: LPChannel, msg: seq[byte]): Future[void] =
|
|
s.activity = true
|
|
procCall BufferStream(s).write(msg)
|
|
|
|
proc init*(
|
|
L: type LPChannel,
|
|
id: uint64,
|
|
conn: Connection,
|
|
initiator: bool,
|
|
name: string = "",
|
|
size: int = DefaultBufferSize,
|
|
lazy: bool = false,
|
|
timeout: Duration = DefaultChanTimeout): LPChannel =
|
|
|
|
let chann = L(
|
|
id: id,
|
|
name: name,
|
|
conn: conn,
|
|
initiator: initiator,
|
|
isLazy: lazy,
|
|
timeout: timeout,
|
|
msgCode: if initiator: MessageType.MsgOut else: MessageType.MsgIn,
|
|
closeCode: if initiator: MessageType.CloseOut else: MessageType.CloseIn,
|
|
resetCode: if initiator: MessageType.ResetOut else: MessageType.ResetIn,
|
|
dir: if initiator: Direction.Out else: Direction.In)
|
|
|
|
logScope:
|
|
id = chann.id
|
|
initiator = chann.initiator
|
|
name = chann.name
|
|
oid = $chann.oid
|
|
peer = $chann.conn.peerInfo
|
|
# stack = getStackTrace()
|
|
|
|
proc writeHandler(data: seq[byte]) {.async, gcsafe.} =
|
|
try:
|
|
if chann.isLazy and not(chann.isOpen):
|
|
await chann.open()
|
|
|
|
# writes should happen in sequence
|
|
trace "sending data"
|
|
|
|
await conn.writeMsg(chann.id,
|
|
chann.msgCode,
|
|
data)
|
|
except CatchableError as exc:
|
|
trace "exception in lpchannel write handler", exc = exc.msg
|
|
await chann.reset()
|
|
raise exc
|
|
|
|
chann.initBufferStream(writeHandler, size)
|
|
when chronicles.enabledLogLevel == LogLevel.TRACE:
|
|
chann.name = if chann.name.len > 0: chann.name else: $chann.oid
|
|
|
|
chann.timerTaskFut = chann.timeoutMonitor()
|
|
trace "created new lpchannel"
|
|
|
|
return chann
|