
712 lines
21 KiB
Raw Normal View History

2019-08-27 15:46:12 -06:00
## Nim-LibP2P
2019-09-24 11:48:23 -06:00
## Copyright (c) 2019 Status Research & Development GmbH
2019-08-27 15:46:12 -06:00
## Licensed under either of
## * Apache License, version 2.0, ([LICENSE-APACHE](LICENSE-APACHE))
## at your option.
## This file may not be copied, modified, or distributed except according to
## those terms.
import tables,
import chronos,
import stream/connection,
2019-09-11 13:03:30 -06:00
2020-06-16 22:14:02 -06:00
2019-09-06 01:13:47 -06:00
2019-09-14 07:55:52 -06:00
2019-09-11 13:03:30 -06:00
2019-09-06 01:13:47 -06:00
2019-09-11 20:10:38 -06:00
topics = "switch"
2019-09-11 20:10:38 -06:00
# TODO: General note - use a finite state machine to manage the different
# steps of establishing and upgrading connections. This makes everything
# more robust and less prone to ordering attacks - i.e. muxing can happen if
# and only if the channel has been secured (i.e. if a secure manager has been
# previously provided)
declareGauge(libp2p_peers, "total connected peers")
declareCounter(libp2p_dialed_peers, "dialed peers")
declareCounter(libp2p_failed_dials, "failed dials")
declareCounter(libp2p_failed_upgrade, "peers failed upgrade")
const MaxConnectionsPerPeer = 5
NoPubSubException* = object of CatchableError
TooManyConnections* = object of CatchableError
Direction {.pure.} = enum
In, Out
ConnectionHolder = object
dir: Direction
conn: Connection
MuxerHolder = object
dir: Direction
muxer: Muxer
handle: Future[void]
2019-09-11 13:03:30 -06:00
Switch* = ref object of RootObj
2019-08-29 23:17:07 -06:00
peerInfo*: PeerInfo
connections*: Table[string, seq[ConnectionHolder]]
muxed*: Table[string, seq[MuxerHolder]]
2019-08-29 23:17:07 -06:00
transports*: seq[Transport]
protocols*: seq[LPProtocol]
2019-09-04 16:00:39 -06:00
muxers*: Table[string, MuxerProvider]
2020-02-04 17:16:21 +01:00
ms*: MultistreamSelect
2019-09-03 19:50:17 -06:00
identity*: Identify
2019-09-06 01:13:47 -06:00
streamHandler*: StreamHandler
secureManagers*: seq[Secure]
2019-09-11 13:03:30 -06:00
pubSub*: Option[PubSub]
dialLock: Table[string, AsyncLock]
cleanUpLock: Table[string, AsyncLock]
2019-09-11 13:03:30 -06:00
proc newNoPubSubException(): ref NoPubSubException {.inline.} =
  ## Build the error used when a pubsub operation is requested on a switch
  ## that has no pubsub instance.
  newException(NoPubSubException, "no pubsub provided!")
2019-08-27 15:46:12 -06:00
proc newTooManyConnections(): ref TooManyConnections {.inline.} =
  ## Build the error raised when a peer exceeds the allowed number of
  ## connections.
  newException(TooManyConnections, "too many connections for peer")
proc disconnect*(s: Switch, peer: PeerInfo) {.async, gcsafe.}
proc subscribePeer*(s: Switch, peerInfo: PeerInfo) {.async, gcsafe.}
proc selectConn(s: Switch, peerInfo: PeerInfo): Connection =
## Select the "best" connection for `peerInfo` according to some criteria.
## Ideally, once connection stats are available, we'd select the fastest;
## for now the candidates are ordered by direction in descending order
## (`Direction` declares `In` before `Out`), so an outgoing connection is
## preferred and an incoming one is only picked when no outgoing exists.
## The first entry after ordering is returned when any connection exists.
if isNil(peerInfo):
let conns = s.connections
# it should be OK to sort on each
# access as there should only be
# up to MaxConnectionsPerPeer entries
proc(a, b: ConnectionHolder): int =
# three-way comparison on the holder's direction only
if a.dir < b.dir: -1
elif a.dir == b.dir: 0
else: 1
, SortOrder.Descending)
if conns.len > 0:
return conns[0].conn
proc selectMuxer(s: Switch, conn: Connection): Muxer =
## select the muxer for the supplied connection
if isNil(conn):
if not(isNil(conn.peerInfo)) and in s.muxed:
if s.muxed[].len > 0:
let muxers = s.muxed[]
.filterIt( it.muxer.connection == conn )
if muxers.len > 0:
return muxers[0].muxer
proc storeConn(s: Switch,
muxer: Muxer,
dir: Direction,
handle: Future[void] = nil) {.async.} =
## store the connection and muxer
if isNil(muxer):
let conn = muxer.connection
if isNil(conn):
let id =
if s.connections.getOrDefault(id).len > MaxConnectionsPerPeer:
warn "disconnecting peer, too many connections", peer = $conn.peerInfo,
conns = s.connections
await s.disconnect(conn.peerInfo)
raise newTooManyConnections()
.add(ConnectionHolder(conn: conn, dir: dir))
.add(MuxerHolder(muxer: muxer, handle: handle, dir: dir))
trace "storred connection", connections = s.connections.len
proc secure(s: Switch, conn: Connection): Future[Connection] {.async, gcsafe.} =
if s.secureManagers.len <= 0:
2019-09-09 17:17:45 -06:00
raise newException(CatchableError, "No secure managers registered!")
let manager = await, s.secureManagers.mapIt(it.codec))
if manager.len == 0:
2019-09-06 01:13:47 -06:00
raise newException(CatchableError, "Unable to negotiate a secure channel!")
2019-09-09 17:17:45 -06:00
trace "securing connection", codec = manager
let secureProtocol = s.secureManagers.filterIt(it.codec == manager)
# should deal with the correctness of this
# let's avoid duplicating checks but detect if it fails to do it properly
2020-06-21 11:14:19 +02:00
doAssert(secureProtocol.len > 0)
result = await secureProtocol[0].secure(conn, true)
2019-08-31 11:58:49 -06:00
proc identify(s: Switch, conn: Connection) {.async, gcsafe.} =
2019-09-03 19:50:17 -06:00
## Identify the remote peer on `conn` and record what it reports on
## `conn.peerInfo`.
##
## When `conn.peerInfo` is nil, a new `PeerInfo` is created from the
## reported public key. Addresses, agent version, protocol version and
## protocol list are copied over only when the remote supplied them.
##
## Raises `CatchableError` when the guard below finds neither a public key
## nor an existing identity.
2019-09-28 13:54:32 -06:00
if (await, s.identity.codec)):
let info = await s.identity.identify(conn, conn.peerInfo)
# NOTE(review): `conn` has already been dereferenced on the line above, so
# `isNil(conn)` cannot hold here; `isNil(conn.peerInfo)` looks like the
# intended check - confirm. As written, a missing public key combined with
# a nil `conn.peerInfo` falls through to `info.pubKey.get()` below.
if info.pubKey.isNone and isNil(conn):
raise newException(CatchableError,
"no public key provided and no existing peer identity found")
# no identity yet: derive one from the public key the remote reported
if isNil(conn.peerInfo):
conn.peerInfo = PeerInfo.init(info.pubKey.get())
# only overwrite fields the remote actually provided
if info.addrs.len > 0:
conn.peerInfo.addrs = info.addrs
if info.agentVersion.isSome:
conn.peerInfo.agentVersion = info.agentVersion.get()
2020-06-09 20:42:52 +02:00
if info.protoVersion.isSome:
conn.peerInfo.protoVersion = info.protoVersion.get()
2020-06-09 20:42:52 +02:00
if info.protos.len > 0:
conn.peerInfo.protocols = info.protos
trace "identify: identified remote peer", peer = $conn.peerInfo
2019-09-06 01:13:47 -06:00
proc mux(s: Switch, conn: Connection) {.async, gcsafe.} =
2019-09-03 19:50:17 -06:00
## mux incoming connection
2019-09-28 13:54:32 -06:00
2020-06-21 11:14:19 +02:00
trace "muxing connection", peer = $conn
2019-09-04 16:00:39 -06:00
let muxers = toSeq(s.muxers.keys)
2019-09-13 14:04:46 -06:00
if muxers.len == 0:
warn "no muxers registered, skipping upgrade flow"
2019-09-13 14:04:46 -06:00
2019-09-04 16:00:39 -06:00
let muxerName = await, muxers)
2019-09-06 01:13:47 -06:00
if muxerName.len == 0 or muxerName == "na":
2020-06-21 11:14:19 +02:00
debug "no muxer available, early exit", peer = $conn
2019-09-04 16:00:39 -06:00
2019-09-14 09:55:58 -06:00
# create new muxer for connection
2019-09-04 16:00:39 -06:00
let muxer = s.muxers[muxerName].newMuxer(conn)
trace "found a muxer", name = muxerName, peer = $conn
2019-09-04 16:00:39 -06:00
# install stream handler
2019-09-06 01:13:47 -06:00
muxer.streamHandler = s.streamHandler
2019-09-04 16:00:39 -06:00
2019-09-14 09:55:58 -06:00
# new stream for identify
var stream = await muxer.newStream()
var handlerFut: Future[void]
if not(isNil(stream)):
await stream.close() # close identify stream
# call muxer handler, this should
# not end until muxer ends
handlerFut = muxer.handle()
2019-09-08 01:43:33 -06:00
# do identify first, so that we have a
# PeerInfo in case we didn't before
await s.identify(stream)
if isNil(conn.peerInfo):
await muxer.close()
raise newException(CatchableError,
"unable to identify peer, aborting upgrade")
2019-09-05 09:19:39 -06:00
# store it in muxed connections if we have a peer for it
trace "adding muxer for peer", peer =
await s.storeConn(muxer, Direction.Out, handlerFut)
2019-09-04 16:00:39 -06:00
2019-09-28 13:54:32 -06:00
proc cleanupConn(s: Switch, conn: Connection) {.async, gcsafe.} =
if isNil(conn):
if isNil(conn.peerInfo):
let id =
let lock = s.cleanUpLock.mgetOrPut(id, newAsyncLock())
await lock.acquire()
trace "cleaning up connection for peer", peerId = id
if id in s.muxed:
let muxerHolder = s.muxed[id]
it.muxer.connection == conn
if muxerHolder.len > 0:
await muxerHolder[0].muxer.close()
if not(isNil(muxerHolder[0].handle)):
await muxerHolder[0].handle
if id in s.muxed:
it.muxer.connection != conn
if s.muxed[id].len == 0:
if s.pubSub.isSome:
await s.pubSub.get()
if id in s.connections:
it.conn != conn
if s.connections[id].len == 0:
# TODO: Investigate cleanupConn() always called twice for one peer.
if not(conn.peerInfo.isClosed()):
await conn.close()
if lock.locked():
proc disconnect*(s: Switch, peer: PeerInfo) {.async, gcsafe.} =
let connections = s.connections.getOrDefault(
for connHolder in connections:
if not isNil(connHolder.conn):
await s.cleanupConn(connHolder.conn)
proc getMuxedStream(s: Switch, peerInfo: PeerInfo): Future[Connection] {.async, gcsafe.} =
  ## Open a new muxed stream to `peerInfo`.
  ##
  ## The connection is chosen with `selectConn` and its muxer with
  ## `selectMuxer`. When no muxer is found the result is left at its
  ## default (nil).
  let
    chosenConn = s.selectConn(peerInfo)
    chosenMuxer = s.selectMuxer(chosenConn) # always the first muxer found

  if not chosenMuxer.isNil:
    result = await chosenMuxer.newStream()
2019-09-28 13:54:32 -06:00
proc upgradeOutgoing(s: Switch, conn: Connection): Future[Connection] {.async, gcsafe.} =
conn = $conn
oid = $conn.oid
let sconn = await # secure the connection
if isNil(sconn):
raise newException(CatchableError,
"unable to secure connection, stopping upgrade")
trace "upgrading connection"
await s.mux(sconn) # mux it if possible
if isNil(sconn.peerInfo):
await sconn.close()
raise newException(CatchableError,
"unable to mux connection, stopping upgrade")
trace "succesfully upgraded outgoing connection", uoid = sconn.oid
return sconn
2019-09-04 16:00:39 -06:00
proc upgradeIncoming(s: Switch, conn: Connection) {.async, gcsafe.} =
trace "upgrading incoming connection", conn = $conn, oid = conn.oid
2019-09-28 13:54:32 -06:00
let ms = newMultistream()
2019-09-03 19:50:17 -06:00
2019-09-28 13:54:32 -06:00
# secure incoming connections
proc securedHandler (conn: Connection,
proto: string)
{.async, gcsafe, closure.} =
var sconn: Connection
trace "Securing connection", oid = conn.oid
let secure = s.secureManagers.filterIt(it.codec == proto)[0]
sconn = await, false)
if isNil(sconn):
await sconn.close()
2019-09-28 13:54:32 -06:00
# add the muxer
for muxer in s.muxers.values:
ms.addHandler(muxer.codec, muxer)
# handle subsequent requests
await ms.handle(sconn)
except CancelledError as exc:
raise exc
except CatchableError as exc:
debug "ending secured handler", err = exc.msg
2019-09-28 13:54:32 -06:00
if (await # just handshake
# add the secure handlers
for k in s.secureManagers:
ms.addHandler(k.codec, securedHandler)
2019-09-11 13:03:30 -06:00
# handle secured connections
await ms.handle(conn)
2020-02-20 19:14:39 -06:00
proc internalConnect(s: Switch,
peer: PeerInfo): Future[Connection] {.async.} =
if s.peerInfo.peerId == peer.peerId:
raise newException(CatchableError, "can't dial self!")
let id =
var conn: Connection
let lock = s.dialLock.mgetOrPut(id, newAsyncLock())
if lock.locked():
await lock.acquire()
trace "about to dial peer", peer = id
conn = s.selectConn(peer)
if conn.isNil or conn.closed:
trace "Dialing peer", peer = id
for t in s.transports: # for each transport
for a in peer.addrs: # for each address
if t.handles(a): # check if it can dial it
trace "Dialing address", address = $a
conn = await t.dial(a)
except CancelledError as exc:
trace "dialing canceled", exc = exc.msg
except CatchableError as exc:
trace "dialing failed", exc = exc.msg
# make sure to assign the peer to the connection
conn.peerInfo = peer
conn = await s.upgradeOutgoing(conn)
except CatchableError as exc:
if not(isNil(conn)):
await conn.close()
trace "Unable to establish outgoing link", exc = exc.msg
raise exc
if isNil(conn):
.addCallback do(udata: pointer):
asyncCheck s.cleanupConn(conn)
trace "Reusing existing connection", oid = conn.oid
if isNil(conn):
raise newException(CatchableError,
"Unable to establish outgoing link")
if conn.closed or conn.atEof:
await conn.close()
raise newException(CatchableError,
"Connection dead on arrival")
doAssert( in s.connections,
"connection not tracked!")
trace "dial succesfull", oid = $conn.oid,
peer = $conn.peerInfo
await s.subscribePeer(peer)
return conn
proc connect*(s: Switch, peer: PeerInfo) {.async.} =
  ## Connect to `peer` through `internalConnect`; the connection it returns
  ## is intentionally ignored.
  let established = await s.internalConnect(peer)
  discard established
proc dial*(s: Switch,
peer: PeerInfo,
proto: string):
Future[Connection] {.async.} =
let conn = await s.internalConnect(peer)
let stream = await s.getMuxedStream(peer)
proc cleanup() {.async.} =
if not(isNil(stream)):
await stream.close()
if not(isNil(conn)):
await conn.close()
if isNil(stream):
await conn.close()
raise newException(CatchableError, "Couldn't get muxed stream")
2020-02-20 19:14:39 -06:00
trace "Attempting to select remote", proto = proto, oid = conn.oid
if not await, proto):
await stream.close()
raise newException(CatchableError, "Unable to select sub-protocol " & proto)
return stream
except CancelledError as exc:
trace "dial canceled"
await cleanup()
raise exc
except CatchableError as exc:
trace "error dialing"
await cleanup()
raise exc
proc mount*[T: LPProtocol](s: Switch, proto: T) {.gcsafe.} =
2019-08-31 11:58:49 -06:00
if isNil(proto.handler):
raise newException(CatchableError,
"Protocol has to define a handle method or proc")
2019-08-27 15:46:12 -06:00
2019-09-06 01:13:47 -06:00
if proto.codec.len == 0:
raise newException(CatchableError,
"Protocol has to define a codec string")
2019-08-31 12:52:56 -06:00
2019-08-31 11:58:49 -06:00, proto)
2019-08-27 20:30:53 -06:00
2020-05-05 17:55:02 +02:00
proc start*(s: Switch): Future[seq[Future[void]]] {.async, gcsafe.} =
2020-06-09 20:42:52 +02:00
trace "starting switch for peer", peerInfo = shortLog(s.peerInfo)
2019-08-31 12:52:56 -06:00
proc handle(conn: Connection): Future[void] {.async, closure, gcsafe.} =
2019-09-04 16:00:39 -06:00
await s.cleanupConn(conn)
await s.upgradeIncoming(conn) # perform upgrade on incoming connection
except CancelledError as exc:
raise exc
except CatchableError as exc:
trace "Exception occurred in Switch.start", exc = exc.msg
2019-09-11 18:15:04 -06:00
var startFuts: seq[Future[void]]
2019-08-27 20:30:53 -06:00
for t in s.transports: # for each transport
2019-09-28 13:54:32 -06:00
for i, a in s.peerInfo.addrs:
2019-08-27 20:30:53 -06:00
if t.handles(a): # check if it handles the multiaddr
2020-05-05 17:55:02 +02:00
var server = await t.listen(a, handle)
2019-09-28 13:54:32 -06:00
s.peerInfo.addrs[i] = # update peer's address
2019-09-11 18:15:04 -06:00
PubSub (Gossip & Flood) Implementation (#36) This adds gossipsub and floodsub, as well as basic interop testing with the go libp2p daemon. * add close event * wip: gossipsub * splitting rpc message * making message handling more consistent * initial gossipsub implementation * feat: nim 1.0 cleanup * wip: gossipsub protobuf * adding encoding/decoding of gossipsub messages * add disconnect handler * add proper gossipsub msg handling * misc: cleanup for nim 1.0 * splitting floodsub and gossipsub tests * feat: add mesh rebalansing * test pubsub * add mesh rebalansing tests * testing mesh maintenance * finishing mcache implementatin * wip: commenting out broken tests * wip: don't run heartbeat for now * switchout debug for trace logging * testing gossip peer selection algorithm * test stream piping * more work around message amplification * get the peerid from message * use timed cache as backing store * allow setting timeout in constructor * several changes to improve performance * more through testing of msg amplification * prevent gc issues * allow piping to self and prevent deadlocks * improove floodsub * allow running hook on cache eviction * prevent race conditions * prevent race conditions and improove tests * use hashes as cache keys * removing useless file * don't create a new seq * re-enable pubsub tests * fix imports * reduce number of runs to speed up tests * break out control message processing * normalize sleeps between steps * implement proper transport filtering * initial interop testing * clean up floodsub publish logic * allow dialing without a protocol * adding multiple reads/writes * use protobuf varint in mplex * don't loose conn's peerInfo * initial interop pubsub tests * don't duplicate connections/peers * bring back interop tests * wip: interop * re-enable interop and daemon tests * add multiple read write tests from handlers * don't cleanup channel prematurely * use correct channel to send/receive msgs * adjust tests with latest changes * 
include interop tests * remove temp logging output * fix ci * use correct public key serialization * additional tests for pubsub interop
2019-12-05 20:16:18 -06:00
if s.pubSub.isSome:
await s.pubSub.get().start()
info "started libp2p node", peer = $s.peerInfo, addrs = s.peerInfo.addrs
2019-09-11 18:15:04 -06:00
result = startFuts # listen for incoming connections
2019-08-27 15:46:12 -06:00
proc stop*(s: Switch) {.async.} =
  ## Shut the switch down: stop pubsub (when present), clean up every
  ## tracked connection and close every transport.
  ##
  ## Shutdown is best effort: a `CatchableError` from any single step is
  ## logged together with its message and the remaining steps still run.
  ## `CancelledError` is always re-raised.
  trace "stopping switch"

  # we want to report errors but we do not want to fail
  # or crash here, cos we need to clean possibly MANY items
  # and any following conn/transport won't be cleaned up
  if s.pubSub.isSome:
    try:
      await s.pubSub.get().stop()
    except CancelledError as exc:
      raise exc
    except CatchableError as exc:
      warn "error stopping pubsub", exc = exc.msg

  # `toSeq` snapshots the table's values before the first await
  for holders in toSeq(s.connections.values):
    for holder in holders:
      try:
        await s.cleanupConn(holder.conn)
      except CancelledError as exc:
        raise exc
      except CatchableError as exc:
        warn "error cleaning up connections", exc = exc.msg

  for t in s.transports:
    try:
      await t.close()
    except CancelledError as exc:
      raise exc
    except CatchableError as exc:
      warn "error cleaning up transports", exc = exc.msg

  trace "switch stopped"
proc subscribePeer*(s: Switch, peerInfo: PeerInfo) {.async, gcsafe.} =
2019-09-11 20:10:38 -06:00
## Subscribe to pub sub peer
if s.pubSub.isSome and not(s.pubSub.get().connected(peerInfo)):
trace "about to subscribe to pubsub peer", peer = peerInfo.shortLog()
var stream: Connection
stream = await s.getMuxedStream(peerInfo)
except CancelledError as exc:
if not(isNil(stream)):
await stream.close()
raise exc
except CatchableError as exc:
trace "exception in subscribe to peer", peer = peerInfo.shortLog,
exc = exc.msg
if not(isNil(stream)):
await stream.close()
if isNil(stream):
trace "unable to subscribe to peer", peer = peerInfo.shortLog
if not await, s.pubSub.get().codec):
if not(isNil(stream)):
await stream.close()
2019-09-11 13:03:30 -06:00
proc subscribe*(s: Switch, topic: string,
                handler: TopicHandler): Future[void] =
  ## Subscribe `handler` to the pubsub `topic`.
  ##
  ## Returns the future produced by the pubsub instance's `subscribe`.
  ## When the switch has no pubsub, the returned future is already failed
  ## with `NoPubSubException`, so awaiting it raises instead of hanging on
  ## a future that nothing ever completes.
  if s.pubSub.isNone:
    let retFuture = newFuture[void]("Switch.subscribe")
    retFuture.fail(newNoPubSubException())
    return retFuture

  return s.pubSub.get().subscribe(topic, handler)
2019-09-11 13:03:30 -06:00
proc unsubscribe*(s: Switch, topics: seq[TopicPair]): Future[void] =
  ## Unsubscribe from the given `topics`.
  ##
  ## Returns the future produced by the pubsub instance's `unsubscribe`.
  ## When the switch has no pubsub, the returned future is already failed
  ## with `NoPubSubException`, so awaiting it raises instead of hanging on
  ## a future that nothing ever completes.
  if s.pubSub.isNone:
    let retFuture = newFuture[void]("Switch.unsubscribe")
    retFuture.fail(newNoPubSubException())
    return retFuture

  return s.pubSub.get().unsubscribe(topics)
2019-09-11 13:03:30 -06:00
proc publish*(s: Switch, topic: string, data: seq[byte]): Future[int] =
  ## Publish `data` to the pubsub `topic`.
  ##
  ## Returns the future produced by the pubsub instance's `publish`.
  ## When the switch has no pubsub, the returned future is already failed
  ## with `NoPubSubException`, so awaiting it raises instead of hanging on
  ## a future that nothing ever completes.
  if s.pubSub.isNone:
    let retFuture = newFuture[int]("Switch.publish")
    retFuture.fail(newNoPubSubException())
    return retFuture

  return s.pubSub.get().publish(topic, data)
2019-09-11 13:03:30 -06:00
proc addValidator*(s: Switch,
                   topics: varargs[string],
                   hook: ValidatorHandler) =
  ## Register `hook` as a validator for `topics` on the switch's pubsub
  ## instance.
  ##
  ## Raises `NoPubSubException` when the switch has no pubsub.
  if s.pubSub.isSome:
    s.pubSub.get().addValidator(topics, hook)
  else:
    raise newNoPubSubException()
proc removeValidator*(s: Switch,
                      topics: varargs[string],
                      hook: ValidatorHandler) =
  ## Remove `hook` as a validator for `topics` from the switch's pubsub
  ## instance.
  ##
  ## Raises `NoPubSubException` when the switch has no pubsub.
  if s.pubSub.isSome:
    s.pubSub.get().removeValidator(topics, hook)
  else:
    raise newNoPubSubException()
proc muxerHandler(s: Switch, muxer: Muxer) {.async, gcsafe.} =
var stream = await muxer.newStream()
if not(isNil(stream)):
await stream.close()
# once we got a muxed connection, attempt to
# identify it
await s.identify(stream)
if isNil(stream.peerInfo):
await muxer.close()
muxer.connection.peerInfo = stream.peerInfo
# store muxer and muxed connection
await s.storeConn(muxer, Direction.In)
.addCallback do(udata: pointer):
asyncCheck s.cleanupConn(muxer.connection)
trace "got new muxer", peer = $muxer.connection.peerInfo
# try establishing a pubsub connection
await s.subscribePeer(muxer.connection.peerInfo)
except CancelledError as exc:
await muxer.close()
raise exc
except CatchableError as exc:
await muxer.close()
trace "exception in muxer handler", exc = exc.msg
2019-09-06 01:13:47 -06:00
proc newSwitch*(peerInfo: PeerInfo,
transports: seq[Transport],
identity: Identify,
2019-09-09 11:33:32 -06:00
muxers: Table[string, MuxerProvider],
secureManagers: openarray[Secure] = [],
2019-09-11 13:03:30 -06:00
pubSub: Option[PubSub] = none(PubSub)): Switch =
if secureManagers.len == 0:
raise (ref CatchableError)(msg: "Provide at least one secure manager")
result = Switch(
peerInfo: peerInfo,
ms: newMultistream(),
transports: transports,
connections: initTable[string, seq[ConnectionHolder]](),
muxed: initTable[string, seq[MuxerHolder]](),
identity: identity,
muxers: muxers,
secureManagers: @secureManagers,
2019-09-06 01:13:47 -06:00
let s = result # can't capture result
result.streamHandler = proc(stream: Connection) {.async, gcsafe.} =
2020-05-23 13:25:53 -06:00
2020-06-09 20:42:52 +02:00
trace "handling connection for", peerInfo = $stream
if not(isNil(stream)):
2020-05-23 13:25:53 -06:00
await stream.close()
await # handle incoming connection
except CancelledError as exc:
raise exc
2020-05-23 13:25:53 -06:00
except CatchableError as exc:
trace "exception in stream handler", exc = exc.msg
2019-09-06 01:13:47 -06:00
for key, val in muxers:
val.streamHandler = result.streamHandler
val.muxerHandler = proc(muxer: Muxer): Future[void] =
2019-09-11 13:03:30 -06:00
if pubSub.isSome:
result.pubSub = pubSub