## Waku Store protocol for historical messaging support. ## See spec for more details: ## https://github.com/vacp2p/specs/blob/master/specs/waku/v2/waku-store.md {.push raises: [Defect].} import std/[tables, times, sequtils, options, math], stew/results, chronicles, chronos, bearssl, libp2p/crypto/crypto, libp2p/protocols/protocol, libp2p/protobuf/minprotobuf, libp2p/stream/connection, metrics import ../../node/storage/message/message_store, ../../node/storage/message/waku_store_queue, ../../node/peer_manager/peer_manager, ../../utils/time, ../../utils/pagination, ../../utils/requests, ../waku_message, ../waku_swap/waku_swap, ./rpc, ./rpc_codec declarePublicGauge waku_store_messages, "number of historical messages", ["type"] declarePublicGauge waku_store_peers, "number of store peers" declarePublicGauge waku_store_errors, "number of store protocol errors", ["type"] declarePublicGauge waku_store_queries, "number of store queries received" logScope: topics = "wakustore" const WakuStoreCodec* = "/vac/waku/store/2.0.0-beta4" DefaultTopic* = "/waku/2/default-waku/proto" # Constants required for pagination ------------------------------------------- MaxPageSize* = StoreMaxPageSize # TODO the DefaultPageSize can be changed, it's current value is random DefaultPageSize* = uint64(20) # A recommended default number of waku messages per page MaxTimeVariance* = StoreMaxTimeVariance const MaxRpcSize = StoreMaxPageSize * MaxWakuMessageSize + 64*1024 # We add a 64kB safety buffer for protocol overhead # Error types (metric label values) const storeFailure = "store_failure" dialFailure = "dial_failure" decodeRpcFailure = "decode_rpc_failure" peerNotFoundFailure = "peer_not_found_failure" type WakuStoreResult*[T] = Result[T, string] WakuStore* = ref object of LPProtocol peerManager*: PeerManager rng*: ref BrHmacDrbgContext messages*: StoreQueueRef # in-memory message store store*: MessageStore # sqlite DB handle wakuSwap*: WakuSwap persistMessages*: bool #TODO: WakuMessageStore currenly also holds isSqliteOnly; put it in single place. isSqliteOnly: bool # if true, don't use in memory-store and answer history queries from the sqlite DB proc findMessages(w: WakuStore, query: HistoryQuery): HistoryResponse {.gcsafe.} = ## Query history to return a single page of messages matching the query # Extract query criteria. All query criteria are optional let qContentTopics = if (query.contentFilters.len != 0): some(query.contentFilters.mapIt(it.contentTopic)) else: none(seq[ContentTopic]) qPubSubTopic = if (query.pubsubTopic != ""): some(query.pubsubTopic) else: none(string) qCursor = if query.pagingInfo.cursor != Index(): some(query.pagingInfo.cursor) else: none(Index) qStartTime = if query.startTime != Timestamp(0): some(query.startTime) else: none(Timestamp) qEndTime = if query.endTime != Timestamp(0): some(query.endTime) else: none(Timestamp) qMaxPageSize = query.pagingInfo.pageSize qAscendingOrder = query.pagingInfo.direction == PagingDirection.FORWARD let queryRes = block: if w.isSqliteOnly: w.store.getMessagesByHistoryQuery( contentTopic = qContentTopics, pubsubTopic = qPubSubTopic, cursor = qCursor, startTime = qStartTime, endTime = qEndTime, maxPageSize = qMaxPageSize, ascendingOrder = qAscendingOrder ) else: w.messages.getMessagesByHistoryQuery( contentTopic = qContentTopics, pubsubTopic = qPubSubTopic, cursor = qCursor, startTime = qStartTime, endTime = qEndTime, maxPageSize = qMaxPageSize, ascendingOrder = qAscendingOrder ) # Build response # TODO: Improve error reporting if queryRes.isErr(): return HistoryResponse(messages: @[], pagingInfo: PagingInfo(), error: HistoryResponseError.INVALID_CURSOR) let (messages, updatedPagingInfo) = queryRes.get() HistoryResponse( messages: messages, pagingInfo: updatedPagingInfo.get(PagingInfo()), error: HistoryResponseError.NONE ) proc init*(ws: WakuStore, capacity = StoreDefaultCapacity) = proc handler(conn: Connection, proto: string) {.async.} = let buf = await conn.readLp(MaxRpcSize.int) let resReq = HistoryRPC.init(buf) if resReq.isErr(): error "failed to decode rpc", peerId=conn.peerId waku_store_errors.inc(labelValues = [decodeRpcFailure]) return let req = resReq.value info "received history query", peerId=conn.peerId, requestId=req.requestId, query=req.query waku_store_queries.inc() let resp = ws.findMessages(req.query) if not ws.wakuSwap.isNil: info "handle store swap", peerId=conn.peerId, requestId=req.requestId, text=ws.wakuSwap.text # Perform accounting operation # TODO: Do accounting here, response is HistoryResponse. How do we get node or swap context? let peerId = conn.peerId let messages = resp.messages ws.wakuSwap.credit(peerId, messages.len) info "sending history response", peerId=conn.peerId, requestId=req.requestId, messages=resp.messages.len let rpc = HistoryRPC(requestId: req.requestId, response: resp) await conn.writeLp(rpc.encode().buffer) ws.handler = handler ws.codec = WakuStoreCodec ws.messages = StoreQueueRef.new(capacity) if ws.store.isNil: return if ws.isSqliteOnly: info "SQLite-only store initialized. Messages are *not* loaded into memory." return # Load all messages from sqliteStore into queueStore info "attempting to load messages from persistent storage" let res = ws.store.getAllMessages() if res.isOk(): for (receiverTime, msg, pubsubTopic) in res.value: let index = Index.compute(msg, receiverTime, pubsubTopic) discard ws.messages.put(index, msg, pubsubTopic) info "successfully loaded messages from the persistent store" else: warn "failed to load messages from the persistent store", err = res.error() debug "the number of messages in the memory", messageNum=ws.messages.len waku_store_messages.set(ws.messages.len.int64, labelValues = ["stored"]) proc init*(T: type WakuStore, peerManager: PeerManager, rng: ref BrHmacDrbgContext, store: MessageStore = nil, wakuSwap: WakuSwap = nil, persistMessages = true, capacity = StoreDefaultCapacity, isSqliteOnly = false): T = let ws = WakuStore(rng: rng, peerManager: peerManager, store: store, wakuSwap: wakuSwap, persistMessages: persistMessages, isSqliteOnly: isSqliteOnly) ws.init(capacity) return ws # TODO: This should probably be an add function and append the peer to an array proc setPeer*(ws: WakuStore, peer: RemotePeerInfo) = ws.peerManager.addPeer(peer, WakuStoreCodec) waku_store_peers.inc() proc handleMessage*(w: WakuStore, topic: string, msg: WakuMessage) {.async.} = if not w.persistMessages: # Store is mounted but new messages should not be stored return let index = Index.compute( msg, receivedTime = getNanosecondTime(getTime().toUnixFloat()), pubsubTopic = topic ) # Add message to in-memory store if not w.isSqliteOnly: # Handle WakuMessage according to store protocol trace "handle message in WakuStore", topic=topic, msg=msg let addRes = w.messages.add(IndexedWakuMessage(msg: msg, index: index, pubsubTopic: topic)) if addRes.isErr(): trace "Attempt to add message to store failed", msg=msg, index=index, err=addRes.error() waku_store_errors.inc(labelValues = [$(addRes.error())]) return waku_store_messages.set(w.messages.len.int64, labelValues = ["stored"]) if w.store.isNil: return let res = w.store.put(index, msg, topic) if res.isErr(): trace "failed to store messages", err=res.error() waku_store_errors.inc(labelValues = [storeFailure]) # TODO: Remove after converting the query method into a non-callback method type QueryHandlerFunc* = proc(response: HistoryResponse) {.gcsafe, closure.} proc query(w: WakuStore, req: HistoryQuery, peer: RemotePeerInfo): Future[WakuStoreResult[HistoryResponse]] {.async, gcsafe.} = let connOpt = await w.peerManager.dialPeer(peer, WakuStoreCodec) if connOpt.isNone(): waku_store_errors.inc(labelValues = [dialFailure]) return err(dialFailure) let connection = connOpt.get() let rpc = HistoryRPC(requestId: generateRequestId(w.rng), query: req) await connection.writeLP(rpc.encode().buffer) var message = await connOpt.get().readLp(MaxRpcSize.int) let response = HistoryRPC.init(message) if response.isErr(): error "failed to decode response" waku_store_errors.inc(labelValues = [decodeRpcFailure]) return err(decodeRpcFailure) waku_store_messages.set(response.value.response.messages.len.int64, labelValues = ["retrieved"]) return ok(response.value.response) proc query*(w: WakuStore, req: HistoryQuery): Future[WakuStoreResult[HistoryResponse]] {.async, gcsafe.} = # TODO: We need to be more stratigic about which peers we dial. Right now we just set one on the service. # Ideally depending on the query and our set of peers we take a subset of ideal peers. # This will require us to check for various factors such as: # - which topics they track # - latency? # - default store peer? let peerOpt = w.peerManager.selectPeer(WakuStoreCodec) if peerOpt.isNone(): error "no suitable remote peers" waku_store_errors.inc(labelValues = [peerNotFoundFailure]) return err(peerNotFoundFailure) return await w.query(req, peerOpt.get()) proc query*(w: WakuStore, req: HistoryQuery, handler: QueryHandlerFunc) {.async, gcsafe, deprecated: "Use the no-callback version of this method".} = let response = await w.query(req) if response.isErr(): error "history query failed", error=response.error() return handler(response.get()) ## 21/WAKU2-FAULT-TOLERANT-STORE proc queryFrom*(w: WakuStore, req: HistoryQuery, handler: QueryHandlerFunc, peer: RemotePeerInfo): Future[WakuStoreResult[uint64]] {.async, gcsafe, deprecated: "Use the query() no-callback procedure instead".} = ## Sends the query to the given peer. Returns the number of retrieved messages if no error occurs, otherwise returns the error string # TODO: dialPeer add it to the list of known peers, while it does not cause any issue but might be unnecessary let res = await w.query(req, peer) if res.isErr(): return err(res.error()) let response = res.get() handler(response) return ok(response.messages.len.uint64) proc queryFromWithPaging*(w: WakuStore, query: HistoryQuery, peer: RemotePeerInfo): Future[WakuStoreResult[seq[WakuMessage]]] {.async, gcsafe.} = ## A thin wrapper for query. Sends the query to the given peer. when the query has a valid pagingInfo, ## it retrieves the historical messages in pages. ## Returns all the fetched messages, if error occurs, returns an error string # Make a copy of the query var req = query var messageList: seq[WakuMessage] = @[] # Fetch the history in pages while true: let res = await w.query(req, peer) if res.isErr(): return err(res.error()) let response = res.get() messageList.add(response.messages) # Check whether it is the last page if response.pagingInfo.pageSize == 0: break # Update paging cursor req.pagingInfo.cursor = response.pagingInfo.cursor return ok(messageList) proc queryLoop(w: WakuStore, req: HistoryQuery, candidateList: seq[RemotePeerInfo]): Future[WakuStoreResult[seq[WakuMessage]]] {.async, gcsafe.} = ## Loops through the peers candidate list in order and sends the query to each ## ## Once all responses have been received, the retrieved messages are consolidated into one deduplicated list. ## if no messages have been retrieved, the returned future will resolve into a result holding an empty seq. let queriesList = candidateList.mapIt(w.queryFromWithPaging(req, it)) await allFutures(queriesList) let messagesList = queriesList .map(proc (fut: Future[WakuStoreResult[seq[WakuMessage]]]): seq[WakuMessage] = # These futures have been awaited before using allFutures(). Call completed() just as a sanity check. if not fut.completed() or fut.read().isErr(): return @[] fut.read().value ) .concat() .deduplicate() if messagesList.len == 0: return err("failed to resolve the query") return ok(messagesList) proc resume*(w: WakuStore, peerList: Option[seq[RemotePeerInfo]] = none(seq[RemotePeerInfo]), pageSize: uint64 = DefaultPageSize, pubsubTopic = DefaultTopic): Future[WakuStoreResult[uint64]] {.async, gcsafe.} = ## resume proc retrieves the history of waku messages published on the default waku pubsub topic since the last time the waku store node has been online ## messages are stored in the store node's messages field and in the message db ## the offline time window is measured as the difference between the current time and the timestamp of the most recent persisted waku message ## an offset of 20 second is added to the time window to count for nodes asynchrony ## peerList indicates the list of peers to query from. ## The history is fetched from all available peers in this list and then consolidated into one deduplicated list. ## Such candidates should be found through a discovery method (to be developed). ## if no peerList is passed, one of the peers in the underlying peer manager unit of the store protocol is picked randomly to fetch the history from. ## The history gets fetched successfully if the dialed peer has been online during the queried time window. ## the resume proc returns the number of retrieved messages if no error occurs, otherwise returns the error string var lastSeenTime = Timestamp(0) var currentTime = getNanosecondTime(epochTime()) let lastSeenItem = w.messages.last() if lastSeenItem.isOk(): lastSeenTime = lastSeenItem.get().msg.timestamp # adjust the time window with an offset of 20 seconds let offset: Timestamp = getNanosecondTime(20) currentTime = currentTime + offset lastSeenTime = max(lastSeenTime - offset, 0) debug "the offline time window is", lastSeenTime=lastSeenTime, currentTime=currentTime let req = HistoryQuery( pubsubTopic: pubsubTopic, startTime: lastSeenTime, endTime: currentTime, pagingInfo: PagingInfo( direction:PagingDirection.FORWARD, pageSize: pageSize ) ) var res: WakuStoreResult[seq[WakuMessage]] if peerList.isSome(): debug "trying the candidate list to fetch the history" res = await w.queryLoop(req, peerList.get()) else: debug "no candidate list is provided, selecting a random peer" # if no peerList is set then query from one of the peers stored in the peer manager let peerOpt = w.peerManager.selectPeer(WakuStoreCodec) if peerOpt.isNone(): warn "no suitable remote peers" waku_store_errors.inc(labelValues = [peerNotFoundFailure]) return err("no suitable remote peers") debug "a peer is selected from peer manager" res = await w.queryFromWithPaging(req, peerOpt.get()) if res.isErr(): debug "failed to resume the history" return err("failed to resume the history") # Save the retrieved messages in the store var dismissed: uint = 0 var added: uint = 0 for msg in res.get(): let index = Index.compute( msg, receivedTime = getNanosecondTime(getTime().toUnixFloat()), pubsubTopic = pubsubTopic ) # check for duplicate messages # TODO: Should take pubsub topic into account if we are going to support topics rather than the DefaultTopic if w.messages.contains(index): dismissed.inc() continue # store the new message let resPut = w.messages.put(index, msg, pubsubTopic) if resPut.isErr(): trace "failed to store messages", err = resPut.error() waku_store_errors.inc(labelValues = [storeFailure]) continue # store in db if exists if not w.store.isNil(): let resPut = w.store.put(index, msg, pubsubTopic) if resPut.isErr(): trace "failed to store messages", err = resPut.error() waku_store_errors.inc(labelValues = [storeFailure]) continue added.inc() waku_store_messages.set(w.messages.len.int64, labelValues = ["stored"]) debug "resume finished successfully", addedMessages=added, dimissedMessages=dismissed return ok(added) ## EXPERIMENTAL # NOTE: Experimental, maybe incorporate as part of query call proc queryWithAccounting*(ws: WakuStore, req: HistoryQuery): Future[WakuStoreResult[HistoryResponse]] {.async, gcsafe.} = let peerOpt = ws.peerManager.selectPeer(WakuStoreCodec) if peerOpt.isNone(): error "no suitable remote peers" waku_store_errors.inc(labelValues = [peerNotFoundFailure]) return err(peerNotFoundFailure) let res = await ws.query(req, peerOpt.get()) if res.isErr(): return err(res.error()) let response = res.get() # Perform accounting operation. Assumes wakuSwap protocol is mounted ws.wakuSwap.debit(peerOpt.get().peerId, response.messages.len) return ok(response) proc queryWithAccounting*(ws: WakuStore, req: HistoryQuery, handler: QueryHandlerFunc) {.async, gcsafe, deprecated: "Use the no-callback procedure instead".} = # TODO: We need to be more stratigic about which peers we dial. Right now we just set one on the service. # Ideally depending on the query and our set of peers we take a subset of ideal peers. # This will require us to check for various factors such as: # - which topics they track # - latency? # - default store peer? let response = await ws.queryWithAccounting(req) if response.isErr(): error "history query failed", error=response.error() return handler(response.get())