2022-11-22 19:40:24 +01:00
|
|
|
when (NimMajor, NimMinor) < (1, 4):
|
|
|
|
{.push raises: [Defect].}
|
|
|
|
else:
|
|
|
|
{.push raises: [].}
|
|
|
|
|
|
|
|
import
|
2024-03-12 07:51:03 -04:00
|
|
|
std/[times, options, sequtils, strutils, algorithm],
|
2024-01-25 16:03:48 +01:00
|
|
|
stew/[results, byteutils],
|
2022-11-22 19:40:24 +01:00
|
|
|
chronicles,
|
|
|
|
chronos,
|
|
|
|
metrics
|
|
|
|
import
|
2024-03-12 07:51:03 -04:00
|
|
|
../common/paging,
|
2023-06-27 13:24:31 +02:00
|
|
|
./driver,
|
|
|
|
./retention_policy,
|
2023-04-19 13:29:23 +02:00
|
|
|
../waku_core,
|
2023-11-22 17:32:56 +01:00
|
|
|
../waku_core/message/digest,
|
2022-11-22 19:40:24 +01:00
|
|
|
./common,
|
2023-06-27 13:24:31 +02:00
|
|
|
./archive_metrics
|
2022-11-22 19:40:24 +01:00
|
|
|
|
|
|
|
logScope:
|
|
|
|
topics = "waku archive"
|
|
|
|
|
|
|
|
const
|
|
|
|
DefaultPageSize*: uint = 20
|
|
|
|
MaxPageSize*: uint = 100
|
|
|
|
|
2024-03-16 00:08:47 +01:00
|
|
|
# Retention policy
|
2024-03-12 07:51:03 -04:00
|
|
|
WakuArchiveDefaultRetentionPolicyInterval* = chronos.minutes(30)
|
|
|
|
|
2024-03-16 00:08:47 +01:00
|
|
|
# Metrics reporting
|
2024-03-12 07:51:03 -04:00
|
|
|
WakuArchiveDefaultMetricsReportInterval* = chronos.minutes(1)
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-16 00:08:47 +01:00
|
|
|
# Message validation
|
|
|
|
# 20 seconds maximum allowable sender timestamp "drift"
|
|
|
|
MaxMessageTimestampVariance* = getNanoSecondTime(20)
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-16 00:08:47 +01:00
|
|
|
type MessageValidator* =
|
|
|
|
proc(msg: WakuMessage): Result[void, string] {.closure, gcsafe, raises: [].}
|
2024-03-12 07:51:03 -04:00
|
|
|
|
|
|
|
## Archive
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
type WakuArchive* = ref object
|
|
|
|
driver: ArchiveDriver
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
validator: MessageValidator
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
retentionPolicy: Option[RetentionPolicy]
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
retentionPolicyHandle: Future[void]
|
|
|
|
metricsHandle: Future[void]
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
proc validate*(msg: WakuMessage): Result[void, string] =
|
|
|
|
if msg.ephemeral:
|
|
|
|
# Ephemeral message, do not store
|
|
|
|
return
|
2024-03-16 00:08:47 +01:00
|
|
|
|
2022-11-22 19:40:24 +01:00
|
|
|
if msg.timestamp == 0:
|
|
|
|
return ok()
|
|
|
|
|
|
|
|
let
|
|
|
|
now = getNanosecondTime(getTime().toUnixFloat())
|
|
|
|
lowerBound = now - MaxMessageTimestampVariance
|
|
|
|
upperBound = now + MaxMessageTimestampVariance
|
|
|
|
|
|
|
|
if msg.timestamp < lowerBound:
|
|
|
|
return err(invalidMessageOld)
|
|
|
|
|
|
|
|
if upperBound < msg.timestamp:
|
|
|
|
return err(invalidMessageFuture)
|
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
return ok()
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-16 00:08:47 +01:00
|
|
|
proc new*(
|
|
|
|
T: type WakuArchive,
|
|
|
|
driver: ArchiveDriver,
|
|
|
|
validator: MessageValidator = validate,
|
|
|
|
retentionPolicy = none(RetentionPolicy),
|
|
|
|
): Result[T, string] =
|
2024-03-12 07:51:03 -04:00
|
|
|
if driver.isNil():
|
|
|
|
return err("archive driver is Nil")
|
|
|
|
|
|
|
|
let archive =
|
2024-03-16 00:08:47 +01:00
|
|
|
WakuArchive(driver: driver, validator: validator, retentionPolicy: retentionPolicy)
|
2023-06-27 13:24:31 +02:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
return ok(archive)
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-16 00:08:47 +01:00
|
|
|
proc handleMessage*(
|
|
|
|
self: WakuArchive, pubsubTopic: PubsubTopic, msg: WakuMessage
|
|
|
|
) {.async.} =
|
2024-03-12 07:51:03 -04:00
|
|
|
self.validator(msg).isOkOr:
|
|
|
|
waku_archive_errors.inc(labelValues = [error])
|
2022-11-22 19:40:24 +01:00
|
|
|
return
|
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
let
|
|
|
|
msgDigest = computeDigest(msg)
|
|
|
|
msgHash = computeMessageHash(pubsubTopic, msg)
|
2024-03-16 00:08:47 +01:00
|
|
|
msgTimestamp =
|
|
|
|
if msg.timestamp > 0:
|
|
|
|
msg.timestamp
|
|
|
|
else:
|
|
|
|
getNanosecondTime(getTime().toUnixFloat())
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
trace "handling message",
|
2024-03-16 00:08:47 +01:00
|
|
|
pubsubTopic = pubsubTopic,
|
|
|
|
contentTopic = msg.contentTopic,
|
|
|
|
msgTimestamp = msg.timestamp,
|
|
|
|
usedTimestamp = msgTimestamp,
|
|
|
|
digest = toHex(msgDigest.data),
|
|
|
|
messageHash = toHex(msgHash)
|
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
let insertStartTime = getTime().toUnixFloat()
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
(await self.driver.put(pubsubTopic, msg, msgDigest, msgHash, msgTimestamp)).isOkOr:
|
|
|
|
waku_archive_errors.inc(labelValues = [insertFailure])
|
2024-03-18 15:59:45 +01:00
|
|
|
debug "failed to insert message", err = error
|
2022-11-25 23:20:24 +01:00
|
|
|
let insertDuration = getTime().toUnixFloat() - insertStartTime
|
|
|
|
waku_archive_insert_duration_seconds.observe(insertDuration)
|
|
|
|
|
2024-03-16 00:08:47 +01:00
|
|
|
proc findMessages*(
|
|
|
|
self: WakuArchive, query: ArchiveQuery
|
|
|
|
): Future[ArchiveResult] {.async, gcsafe.} =
|
2022-11-22 19:40:24 +01:00
|
|
|
## Search the archive to return a single page of messages matching the query criteria
|
2024-03-16 00:08:47 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
let maxPageSize =
|
|
|
|
if query.pageSize <= 0:
|
|
|
|
DefaultPageSize
|
|
|
|
else:
|
|
|
|
min(query.pageSize, MaxPageSize)
|
2024-03-16 00:08:47 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
let isAscendingOrder = query.direction.into()
|
|
|
|
|
|
|
|
if query.contentTopics.len > 10:
|
2023-01-11 12:19:59 +01:00
|
|
|
return err(ArchiveError.invalidQuery("too many content topics"))
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2022-11-25 23:20:24 +01:00
|
|
|
let queryStartTime = getTime().toUnixFloat()
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-16 00:08:47 +01:00
|
|
|
let rows = (
|
|
|
|
await self.driver.getMessages(
|
|
|
|
contentTopic = query.contentTopics,
|
|
|
|
pubsubTopic = query.pubsubTopic,
|
|
|
|
cursor = query.cursor,
|
|
|
|
startTime = query.startTime,
|
|
|
|
endTime = query.endTime,
|
|
|
|
hashes = query.hashes,
|
|
|
|
maxPageSize = maxPageSize + 1,
|
|
|
|
ascendingOrder = isAscendingOrder,
|
|
|
|
)
|
|
|
|
).valueOr:
|
2024-03-12 07:51:03 -04:00
|
|
|
return err(ArchiveError(kind: ArchiveErrorKind.DRIVER_ERROR, cause: error))
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2022-11-25 23:20:24 +01:00
|
|
|
let queryDuration = getTime().toUnixFloat() - queryStartTime
|
|
|
|
waku_archive_query_duration_seconds.observe(queryDuration)
|
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
var hashes = newSeq[WakuMessageHash]()
|
2023-01-26 10:19:58 +01:00
|
|
|
var messages = newSeq[WakuMessage]()
|
|
|
|
var cursor = none(ArchiveCursor)
|
2024-03-16 00:08:47 +01:00
|
|
|
|
2023-01-26 10:19:58 +01:00
|
|
|
if rows.len == 0:
|
2024-03-12 07:51:03 -04:00
|
|
|
return ok(ArchiveResponse(hashes: hashes, messages: messages, cursor: cursor))
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2023-01-26 10:19:58 +01:00
|
|
|
## Messages
|
2024-03-12 07:51:03 -04:00
|
|
|
let pageSize = min(rows.len, int(maxPageSize))
|
2024-03-16 00:08:47 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
#TODO once store v2 is removed, unzip instead of 2x map
|
2024-03-16 00:08:47 +01:00
|
|
|
messages = rows[0 ..< pageSize].mapIt(it[1])
|
|
|
|
hashes = rows[0 ..< pageSize].mapIt(it[4])
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2023-01-26 10:19:58 +01:00
|
|
|
## Cursor
|
2024-03-12 07:51:03 -04:00
|
|
|
if rows.len > int(maxPageSize):
|
2022-11-22 19:40:24 +01:00
|
|
|
## Build last message cursor
|
|
|
|
## The cursor is built from the last message INCLUDED in the response
|
|
|
|
## (i.e. the second last message in the rows list)
|
2024-03-16 00:08:47 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
#TODO Once Store v2 is removed keep only message and hash
|
|
|
|
let (pubsubTopic, message, digest, storeTimestamp, hash) = rows[^2]
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
#TODO Once Store v2 is removed, the cursor becomes the hash of the last message
|
2024-03-16 00:08:47 +01:00
|
|
|
cursor = some(
|
|
|
|
ArchiveCursor(
|
|
|
|
digest: MessageDigest.fromBytes(digest),
|
|
|
|
storeTime: storeTimestamp,
|
|
|
|
sendertime: message.timestamp,
|
|
|
|
pubsubTopic: pubsubTopic,
|
|
|
|
hash: hash,
|
|
|
|
)
|
|
|
|
)
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2023-01-26 10:19:58 +01:00
|
|
|
# All messages MUST be returned in chronological order
|
2023-12-19 15:10:27 +01:00
|
|
|
if not isAscendingOrder:
|
2023-01-26 10:19:58 +01:00
|
|
|
reverse(messages)
|
2024-03-12 07:51:03 -04:00
|
|
|
reverse(hashes)
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
return ok(ArchiveResponse(hashes: hashes, messages: messages, cursor: cursor))
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-04-25 09:09:52 -04:00
|
|
|
proc findMessagesV2*(
|
|
|
|
self: WakuArchive, query: ArchiveQuery
|
|
|
|
): Future[ArchiveResult] {.async, gcsafe.} =
|
|
|
|
## Search the archive to return a single page of messages matching the query criteria
|
|
|
|
|
|
|
|
let maxPageSize =
|
|
|
|
if query.pageSize <= 0:
|
|
|
|
DefaultPageSize
|
|
|
|
else:
|
|
|
|
min(query.pageSize, MaxPageSize)
|
|
|
|
|
|
|
|
let isAscendingOrder = query.direction.into()
|
|
|
|
|
|
|
|
if query.contentTopics.len > 10:
|
|
|
|
return err(ArchiveError.invalidQuery("too many content topics"))
|
|
|
|
|
|
|
|
let queryStartTime = getTime().toUnixFloat()
|
|
|
|
|
|
|
|
let rows = (
|
|
|
|
await self.driver.getMessagesV2(
|
|
|
|
contentTopic = query.contentTopics,
|
|
|
|
pubsubTopic = query.pubsubTopic,
|
|
|
|
cursor = query.cursor,
|
|
|
|
startTime = query.startTime,
|
|
|
|
endTime = query.endTime,
|
|
|
|
maxPageSize = maxPageSize + 1,
|
|
|
|
ascendingOrder = isAscendingOrder,
|
|
|
|
)
|
|
|
|
).valueOr:
|
|
|
|
return err(ArchiveError(kind: ArchiveErrorKind.DRIVER_ERROR, cause: error))
|
|
|
|
|
|
|
|
let queryDuration = getTime().toUnixFloat() - queryStartTime
|
|
|
|
waku_archive_query_duration_seconds.observe(queryDuration)
|
|
|
|
|
|
|
|
var messages = newSeq[WakuMessage]()
|
|
|
|
var cursor = none(ArchiveCursor)
|
|
|
|
|
|
|
|
if rows.len == 0:
|
|
|
|
return ok(ArchiveResponse(messages: messages, cursor: cursor))
|
|
|
|
|
|
|
|
## Messages
|
|
|
|
let pageSize = min(rows.len, int(maxPageSize))
|
|
|
|
|
|
|
|
messages = rows[0 ..< pageSize].mapIt(it[1])
|
|
|
|
|
|
|
|
## Cursor
|
|
|
|
if rows.len > int(maxPageSize):
|
|
|
|
## Build last message cursor
|
|
|
|
## The cursor is built from the last message INCLUDED in the response
|
|
|
|
## (i.e. the second last message in the rows list)
|
|
|
|
|
|
|
|
let (pubsubTopic, message, digest, storeTimestamp, _) = rows[^2]
|
|
|
|
|
|
|
|
cursor = some(
|
|
|
|
ArchiveCursor(
|
|
|
|
digest: MessageDigest.fromBytes(digest),
|
|
|
|
storeTime: storeTimestamp,
|
|
|
|
sendertime: message.timestamp,
|
|
|
|
pubsubTopic: pubsubTopic,
|
|
|
|
)
|
|
|
|
)
|
|
|
|
|
|
|
|
# All messages MUST be returned in chronological order
|
|
|
|
if not isAscendingOrder:
|
|
|
|
reverse(messages)
|
|
|
|
|
|
|
|
return ok(ArchiveResponse(messages: messages, cursor: cursor))
|
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
proc periodicRetentionPolicy(self: WakuArchive) {.async.} =
|
|
|
|
debug "executing message retention policy"
|
2023-12-11 08:50:40 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
let policy = self.retentionPolicy.get()
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2023-12-11 08:50:40 +01:00
|
|
|
while true:
|
2024-03-12 07:51:03 -04:00
|
|
|
(await policy.execute(self.driver)).isOkOr:
|
|
|
|
waku_archive_errors.inc(labelValues = [retPolicyFailure])
|
2024-03-16 00:08:47 +01:00
|
|
|
error "failed execution of retention policy", error = error
|
2023-12-11 08:50:40 +01:00
|
|
|
|
|
|
|
await sleepAsync(WakuArchiveDefaultRetentionPolicyInterval)
|
2023-06-27 13:24:31 +02:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
proc periodicMetricReport(self: WakuArchive) {.async.} =
|
|
|
|
while true:
|
|
|
|
let countRes = (await self.driver.getMessagesCount())
|
|
|
|
if countRes.isErr():
|
2024-03-16 00:08:47 +01:00
|
|
|
error "loopReportStoredMessagesMetric failed to get messages count",
|
|
|
|
error = countRes.error
|
2024-03-12 07:51:03 -04:00
|
|
|
else:
|
|
|
|
let count = countRes.get()
|
|
|
|
waku_archive_messages.set(count, labelValues = ["stored"])
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
await sleepAsync(WakuArchiveDefaultMetricsReportInterval)
|
2023-12-14 17:00:13 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
proc start*(self: WakuArchive) =
|
|
|
|
if self.retentionPolicy.isSome():
|
|
|
|
self.retentionPolicyHandle = self.periodicRetentionPolicy()
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
self.metricsHandle = self.periodicMetricReport()
|
2022-11-22 19:40:24 +01:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
proc stopWait*(self: WakuArchive) {.async.} =
|
|
|
|
var futures: seq[Future[void]]
|
2023-06-27 13:24:31 +02:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
if self.retentionPolicy.isSome() and not self.retentionPolicyHandle.isNil():
|
|
|
|
futures.add(self.retentionPolicyHandle.cancelAndWait())
|
2023-06-27 13:24:31 +02:00
|
|
|
|
2024-03-12 07:51:03 -04:00
|
|
|
if not self.metricsHandle.isNil:
|
|
|
|
futures.add(self.metricsHandle.cancelAndWait())
|
2023-06-27 13:24:31 +02:00
|
|
|
|
2024-03-16 00:08:47 +01:00
|
|
|
await noCancel(allFutures(futures))
|