2023-05-31 08:28:48 +00:00
|
|
|
# Turn on strict exception tracking for the rest of this module.
# Compilers older than 1.4 still need `Defect` listed explicitly.
when (NimMajor, NimMinor) >= (1, 4):
  {.push raises: [].}
else:
  {.push raises: [Defect].}
|
|
|
|
|
|
|
|
import
|
2024-03-12 11:51:03 +00:00
|
|
|
std/[nre, options, sequtils, strutils, strformat, times],
|
|
|
|
stew/[results, byteutils, arrayops],
|
2023-06-07 08:08:43 +00:00
|
|
|
db_postgres,
|
2023-10-31 13:46:46 +00:00
|
|
|
postgres,
|
|
|
|
chronos,
|
|
|
|
chronicles
|
2023-05-31 08:28:48 +00:00
|
|
|
import
|
2024-02-15 11:25:08 +00:00
|
|
|
../../../common/error_handling,
|
2023-05-31 08:28:48 +00:00
|
|
|
../../../waku_core,
|
|
|
|
../../common,
|
2023-06-07 08:08:43 +00:00
|
|
|
../../driver,
|
2023-09-06 17:16:37 +00:00
|
|
|
../../../common/databases/db_postgres as waku_postgres,
|
2024-03-06 19:50:22 +00:00
|
|
|
./postgres_healthcheck,
|
|
|
|
./partitions_manager
|
2023-05-31 08:28:48 +00:00
|
|
|
|
|
|
|
type
  PostgresDriver* = ref object of ArchiveDriver
    ## `ArchiveDriver` implementation that stores messages in PostgreSQL.
    ## Reads and writes go through separate connection pools.
    writeConnPool: PgAsyncPool ## pool used for INSERT / DELETE statements
    readConnPool: PgAsyncPool ## pool used for SELECT statements
    partitionMngr: PartitionManager ## partition container
    futLoopPartitionFactory: Future[void]
      ## NOTE(review): presumably the handle of the background loop that
      ## creates partitions; it is not used in this part of the file.
|
2023-05-31 08:28:48 +00:00
|
|
|
|
2023-11-07 12:38:37 +00:00
|
|
|
const
  InsertRowStmtName = "InsertRow" ## name of the prepared INSERT statement

  # TODO: get the sql queries from a file
  # Inserts one message row. An empty `meta` ($9) is stored as NULL, and a
  # conflicting row is silently ignored.
  InsertRowStmtDefinition =
    """INSERT INTO messages (id, messageHash, storedAt, contentTopic, payload, pubsubTopic,
  version, timestamp, meta) VALUES ($1, $2, $3, $4, $5, $6, $7, $8, CASE WHEN $9 = '' THEN NULL ELSE $9 END) ON CONFLICT DO NOTHING;"""
|
2023-05-31 08:28:48 +00:00
|
|
|
|
2023-11-07 12:38:37 +00:00
|
|
|
const
  SelectNoCursorAscStmtName = "SelectWithoutCursorAsc"

  # First-page query (no cursor), oldest rows first.
  # $1 content topic, $2 message hash, $3 pubsub topic,
  # $4 / $5 inclusive storedAt range, $6 page size.
  SelectNoCursorAscStmtDef =
    """SELECT storedAt, contentTopic, payload, pubsubTopic, version, timestamp, id, messageHash, meta FROM messages
    WHERE contentTopic IN ($1) AND
          messageHash IN ($2) AND
          pubsubTopic = $3 AND
          storedAt >= $4 AND
          storedAt <= $5
    ORDER BY storedAt ASC, messageHash ASC LIMIT $6;"""
|
|
|
|
|
|
|
|
const SelectNoCursorDescStmtName = "SelectWithoutCursorDesc"

## First-page query (no cursor), newest rows first.
## $1 content topic, $2 message hash, $3 pubsub topic,
## $4 / $5 inclusive storedAt range, $6 page size.
##
## The column list must contain exactly the nine columns that
## `rowCallbackImpl` parses (ending in `meta`); with fewer columns the
## callback rejects the whole result set.
const SelectNoCursorDescStmtDef =
  """SELECT storedAt, contentTopic, payload, pubsubTopic, version, timestamp, id, messageHash, meta FROM messages
    WHERE contentTopic IN ($1) AND
          messageHash IN ($2) AND
          pubsubTopic = $3 AND
          storedAt >= $4 AND
          storedAt <= $5
    ORDER BY storedAt DESC, messageHash DESC LIMIT $6;"""
|
|
|
|
|
|
|
|
const SelectWithCursorDescStmtName = "SelectWithCursorDesc"

## Next-page query, newest rows first: only rows strictly before the cursor
## position ($4 storedAt, $5 messageHash) are returned.
## $1 content topic, $2 message hash, $3 pubsub topic,
## $6 / $7 inclusive storedAt range, $8 page size.
##
## The column list must contain exactly the nine columns that
## `rowCallbackImpl` parses (ending in `meta`); with fewer columns the
## callback rejects the whole result set.
const SelectWithCursorDescStmtDef =
  """SELECT storedAt, contentTopic, payload, pubsubTopic, version, timestamp, id, messageHash, meta FROM messages
    WHERE contentTopic IN ($1) AND
          messageHash IN ($2) AND
          pubsubTopic = $3 AND
          (storedAt, messageHash) < ($4,$5) AND
          storedAt >= $6 AND
          storedAt <= $7
    ORDER BY storedAt DESC, messageHash DESC LIMIT $8;"""
|
|
|
|
|
|
|
|
const SelectWithCursorAscStmtName = "SelectWithCursorAsc"

## Next-page query, oldest rows first: only rows strictly after the cursor
## position ($4 storedAt, $5 messageHash) are returned.
## $1 content topic, $2 message hash, $3 pubsub topic,
## $6 / $7 inclusive storedAt range, $8 page size.
##
## The column list must contain exactly the nine columns that
## `rowCallbackImpl` parses (ending in `meta`); with fewer columns the
## callback rejects the whole result set.
const SelectWithCursorAscStmtDef =
  """SELECT storedAt, contentTopic, payload, pubsubTopic, version, timestamp, id, messageHash, meta FROM messages
    WHERE contentTopic IN ($1) AND
          messageHash IN ($2) AND
          pubsubTopic = $3 AND
          (storedAt, messageHash) > ($4,$5) AND
          storedAt >= $6 AND
          storedAt <= $7
    ORDER BY storedAt ASC, messageHash ASC LIMIT $8;"""
|
|
|
|
|
|
|
|
const SelectNoCursorV2AscStmtName = "SelectWithoutCursorV2Asc"

## Store-v2 first-page query (no cursor), oldest rows first.
## $1 content topic, $2 pubsub topic, $3 / $4 inclusive storedAt range,
## $5 page size.
##
## The column list must contain exactly the nine columns that
## `rowCallbackImpl` parses (ending in `meta`); with fewer columns the
## callback rejects the whole result set.
const SelectNoCursorV2AscStmtDef =
  """SELECT storedAt, contentTopic, payload, pubsubTopic, version, timestamp, id, messageHash, meta FROM messages
    WHERE contentTopic IN ($1) AND
          pubsubTopic = $2 AND
          storedAt >= $3 AND
          storedAt <= $4
    ORDER BY storedAt ASC LIMIT $5;"""
|
|
|
|
|
2024-04-25 13:09:52 +00:00
|
|
|
const
  SelectNoCursorV2DescStmtName = "SelectWithoutCursorV2Desc"

  # Store-v2 first-page query (no cursor), newest rows first.
  # $1 content topic, $2 pubsub topic, $3 / $4 inclusive storedAt range,
  # $5 page size.
  SelectNoCursorV2DescStmtDef =
    """SELECT storedAt, contentTopic, payload, pubsubTopic, version, timestamp, id, messageHash, meta FROM messages
    WHERE contentTopic IN ($1) AND
          pubsubTopic = $2 AND
          storedAt >= $3 AND
          storedAt <= $4
    ORDER BY storedAt DESC LIMIT $5;"""
|
|
|
|
|
2024-04-25 13:09:52 +00:00
|
|
|
const
  SelectWithCursorV2DescStmtName = "SelectWithCursorV2Desc"

  # Store-v2 next-page query, newest rows first: only rows strictly before
  # the cursor position ($3 storedAt, $4 id) are returned.
  # $1 content topic, $2 pubsub topic, $5 / $6 inclusive storedAt range,
  # $7 page size.
  SelectWithCursorV2DescStmtDef =
    """SELECT storedAt, contentTopic, payload, pubsubTopic, version, timestamp, id, messageHash, meta FROM messages
    WHERE contentTopic IN ($1) AND
          pubsubTopic = $2 AND
          (storedAt, id) < ($3,$4) AND
          storedAt >= $5 AND
          storedAt <= $6
    ORDER BY storedAt DESC LIMIT $7;"""
|
|
|
|
|
2024-04-25 13:09:52 +00:00
|
|
|
const
  SelectWithCursorV2AscStmtName = "SelectWithCursorV2Asc"

  # Store-v2 next-page query, oldest rows first: only rows strictly after
  # the cursor position ($3 storedAt, $4 id) are returned.
  # $1 content topic, $2 pubsub topic, $5 / $6 inclusive storedAt range,
  # $7 page size.
  SelectWithCursorV2AscStmtDef =
    """SELECT storedAt, contentTopic, payload, pubsubTopic, version, timestamp, id, messageHash, meta FROM messages
    WHERE contentTopic IN ($1) AND
          pubsubTopic = $2 AND
          (storedAt, id) > ($3,$4) AND
          storedAt >= $5 AND
          storedAt <= $6
    ORDER BY storedAt ASC LIMIT $7;"""
|
|
|
|
|
2023-11-24 15:21:22 +00:00
|
|
|
const
  DefaultMaxNumConns = 50 ## default total number of connections for `new`
|
2023-06-07 08:08:43 +00:00
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
proc new*(
    T: type PostgresDriver,
    dbUrl: string,
    maxConnections = DefaultMaxNumConns,
    onFatalErrorAction: OnFatalErrorHandler = nil,
): ArchiveDriverResult[T] =
  ## Builds a `PostgresDriver` connected to `dbUrl`.
  ##
  ## `maxConnections` is split evenly between the read pool and the write
  ## pool (very simplistic split; an odd value is rounded down).
  ## When `onFatalErrorAction` is given, a connectivity check is spawned for
  ## each pool and receives that handler.
  ##
  ## Returns an error when either pool cannot be created.
  let connsPerPool = maxConnections div 2

  let readPool = PgAsyncPool.new(dbUrl, connsPerPool).valueOr:
    return err("error creating read conn pool PgAsyncPool")

  let writePool = PgAsyncPool.new(dbUrl, connsPerPool).valueOr:
    return err("error creating write conn pool PgAsyncPool")

  if not onFatalErrorAction.isNil():
    asyncSpawn checkConnectivity(readPool, onFatalErrorAction)
    asyncSpawn checkConnectivity(writePool, onFatalErrorAction)

  return ok(
    PostgresDriver(
      writeConnPool: writePool,
      readConnPool: readPool,
      partitionMngr: PartitionManager.new(),
    )
  )
|
2023-05-31 08:28:48 +00:00
|
|
|
|
2023-06-07 08:08:43 +00:00
|
|
|
proc reset*(s: PostgresDriver): Future[ArchiveDriverResult[void]] {.async.} =
  ## Clear the database partitions by asking `decreaseDatabaseSize` to
  ## shrink the database to a target size of 0 with forced removal.
  let
    targetSize = 0
    forceRemoval = true

  return await s.decreaseDatabaseSize(targetSize, forceRemoval)
|
2023-06-07 08:08:43 +00:00
|
|
|
|
2024-03-12 11:51:03 +00:00
|
|
|
proc rowCallbackImpl(
    pqResult: ptr PGresult,
    outRows: var seq[(PubsubTopic, WakuMessage, seq[byte], Timestamp, WakuMessageHash)],
) =
  ## Proc aimed to contain the logic of the callback passed to the `psasyncpool`.
  ## That callback is used in "SELECT" queries.
  ##
  ## pqResult - contains the query results
  ## outRows - seq of Store-rows. This is populated from the info contained in pqResult
  ##
  ## The result set must have exactly nine columns, in this order:
  ## storedAt, contentTopic, payload, pubsubTopic, version, timestamp, id,
  ## messageHash, meta. The payload, id, messageHash and meta columns are
  ## expected to be hex-encoded text.
  ##
  ## A result set with a different column count is rejected as a whole.
  ## A row that cannot be parsed is logged and skipped, so `outRows` never
  ## receives a half-populated entry.

  let numFields = pqResult.pqnfields()
  if numFields != 9:
    error "Wrong number of fields"
    return

  for iRow in 0 ..< pqResult.pqNtuples():
    var wakuMessage: WakuMessage
    var timestamp: Timestamp
    var version: uint
    var pubSubTopic: string
    var contentTopic: string
    var storedAt: int64
    var digest: string
    var payload: string
    var hashHex: string
    var msgHash: WakuMessageHash
    var meta: string

    try:
      storedAt = parseInt($(pqgetvalue(pqResult, iRow, 0)))
      contentTopic = $(pqgetvalue(pqResult, iRow, 1))
      payload = parseHexStr($(pqgetvalue(pqResult, iRow, 2)))
      pubSubTopic = $(pqgetvalue(pqResult, iRow, 3))
      version = parseUInt($(pqgetvalue(pqResult, iRow, 4)))
      timestamp = parseInt($(pqgetvalue(pqResult, iRow, 5)))
      digest = parseHexStr($(pqgetvalue(pqResult, iRow, 6)))
      hashHex = parseHexStr($(pqgetvalue(pqResult, iRow, 7)))
      meta = parseHexStr($(pqgetvalue(pqResult, iRow, 8)))

      # The slice below reads bytes 0..31; a shorter value would be an
      # out-of-range access, so treat it as a parse failure instead.
      if hashHex.len < 32:
        raise newException(ValueError, "messageHash is shorter than 32 bytes")
      msgHash = fromBytes(hashHex.toOpenArrayByte(0, 31))
    except ValueError:
      error "could not parse correctly", error = getCurrentExceptionMsg()
      # Do not emit a row built from default / partially parsed values.
      continue

    wakuMessage.timestamp = timestamp
    wakuMessage.version = uint32(version)
    wakuMessage.contentTopic = contentTopic
    wakuMessage.payload = @(payload.toOpenArrayByte(0, payload.high))
    wakuMessage.meta = @(meta.toOpenArrayByte(0, meta.high))

    outRows.add(
      (
        pubSubTopic,
        wakuMessage,
        @(digest.toOpenArrayByte(0, digest.high)),
        storedAt,
        msgHash,
      )
    )
|
|
|
|
|
|
|
|
method put*(
    s: PostgresDriver,
    pubsubTopic: PubsubTopic,
    message: WakuMessage,
    digest: MessageDigest,
    messageHash: WakuMessageHash,
    receivedTime: Timestamp,
): Future[ArchiveDriverResult[void]] {.async.} =
  ## Stores one message through the write pool, using the prepared
  ## `InsertRow` statement.
  ##
  ## Binary values (digest, message hash, payload, meta) are sent as hex
  ## strings; numeric values are sent in their decimal string form.
  let
    digestHex = toHex(digest.data)
    hashHex = toHex(messageHash)
    rxTime = $receivedTime
    payloadHex = toHex(message.payload)
    versionStr = $message.version
    timestampStr = $message.timestamp
    metaHex = toHex(message.meta)

  trace "put PostgresDriver", timestamp = timestampStr

  # Parameter order must match $1..$9 of InsertRowStmtDefinition.
  let params = @[
    digestHex, hashHex, rxTime, message.contentTopic, payloadHex, pubsubTopic,
    versionStr, timestampStr, metaHex,
  ]
  # One length per parameter, and one zero format code per parameter.
  let paramLens = params.mapIt(int32(it.len))
  let paramFormats = newSeq[int32](params.len)

  return await s.writeConnPool.runStmt(
    InsertRowStmtName, InsertRowStmtDefinition, params, paramLens, paramFormats
  )
|
|
|
|
|
|
|
|
method getAllMessages*(
    s: PostgresDriver
): Future[ArchiveDriverResult[seq[ArchiveRow]]] {.async.} =
  ## Retrieve all messages from the store, ordered by ascending `storedAt`.

  var collected: seq[(PubsubTopic, WakuMessage, seq[byte], Timestamp, WakuMessageHash)]
  proc rowCallback(pqResult: ptr PGresult) =
    rowCallbackImpl(pqResult, collected)

  let queryRes = await s.readConnPool.pgQuery(
    """SELECT storedAt, contentTopic,
                                       payload, pubsubTopic, version, timestamp,
                                       id, messageHash, meta FROM messages ORDER BY storedAt ASC""",
    newSeq[string](0),
    rowCallback,
  )
  if queryRes.isErr():
    return err("failed in query: " & $queryRes.error)

  return ok(collected)
|
2023-05-31 08:28:48 +00:00
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
proc getPartitionsList(
    s: PostgresDriver
): Future[ArchiveDriverResult[seq[string]]] {.async.} =
  ## Retrieves the seq of partition table names of the `messages` table,
  ## sorted by name in ascending order.
  ## e.g: @["messages_1708534333_1708534393", "messages_1708534273_1708534333"]

  var names: seq[string]
  proc rowCallback(pqResult: ptr PGresult) =
    # Every returned row carries the partition name in its first column.
    for rowIdx in 0 ..< pqResult.pqNtuples():
      names.add($(pqgetvalue(pqResult, rowIdx, 0)))

  let queryRes = await s.readConnPool.pgQuery(
    """
                 SELECT child.relname       AS partition_name
                 FROM pg_inherits
                 JOIN pg_class parent            ON pg_inherits.inhparent = parent.oid
                 JOIN pg_class child             ON pg_inherits.inhrelid   = child.oid
                 JOIN pg_namespace nmsp_parent   ON nmsp_parent.oid  = parent.relnamespace
                 JOIN pg_namespace nmsp_child    ON nmsp_child.oid   = child.relnamespace
                 WHERE parent.relname='messages'
                 ORDER BY partition_name ASC
                 """,
    newSeq[string](0),
    rowCallback,
  )
  if queryRes.isErr():
    return err("getPartitionsList failed in query: " & $queryRes.error)

  return ok(names)
|
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
proc getMessagesArbitraryQuery(
    s: PostgresDriver,
    contentTopic: seq[ContentTopic] = @[],
    pubsubTopic = none(PubsubTopic),
    cursor = none(ArchiveCursor),
    startTime = none(Timestamp),
    endTime = none(Timestamp),
    hexHashes: seq[string] = @[],
    maxPageSize = DefaultPageSize,
    ascendingOrder = true,
): Future[ArchiveDriverResult[seq[ArchiveRow]]] {.async.} =
  ## This proc allows to handle atypical queries. We don't use prepared statements for those.
  ##
  ## Each filter that is present adds one condition to the WHERE clause and
  ## its values to the `?` placeholder arguments, in the same order. Results
  ## are ordered by (storedAt, messageHash) and limited to `maxPageSize`.

  var whereClauses: seq[string]
  var params: seq[string]

  if contentTopic.len > 0:
    whereClauses.add(
      "contentTopic IN (" & "?".repeat(contentTopic.len).join(",") & ")"
    )
    for topic in contentTopic:
      params.add(topic)

  if hexHashes.len > 0:
    whereClauses.add("messageHash IN (" & "?".repeat(hexHashes.len).join(",") & ")")
    for hexHash in hexHashes:
      params.add(hexHash)

  if pubsubTopic.isSome():
    whereClauses.add("pubsubTopic = ?")
    params.add(pubsubTopic.get())

  if cursor.isSome():
    # Page forward (>) when ascending, backward (<) when descending.
    let comp = if ascendingOrder: ">" else: "<"
    whereClauses.add("(storedAt, messageHash) " & comp & " (?,?)")
    params.add($cursor.get().storeTime)
    params.add(toHex(cursor.get().hash))

  if startTime.isSome():
    whereClauses.add("storedAt >= ?")
    params.add($startTime.get())

  if endTime.isSome():
    whereClauses.add("storedAt <= ?")
    params.add($endTime.get())

  var query =
    """SELECT storedAt, contentTopic, payload, pubsubTopic, version, timestamp, id, messageHash, meta FROM messages"""

  if whereClauses.len > 0:
    query &= " WHERE " & whereClauses.join(" AND ")

  let direction = if ascendingOrder: "ASC" else: "DESC"
  query &= " ORDER BY storedAt " & direction & ", messageHash " & direction

  query &= " LIMIT ?"
  params.add($maxPageSize)

  var collected: seq[(PubsubTopic, WakuMessage, seq[byte], Timestamp, WakuMessageHash)]
  proc rowCallback(pqResult: ptr PGresult) =
    rowCallbackImpl(pqResult, collected)

  let queryRes = await s.readConnPool.pgQuery(query, params, rowCallback)
  if queryRes.isErr():
    return err("failed to run query: " & $queryRes.error)

  return ok(collected)
|
|
|
|
|
|
|
|
proc getMessagesV2ArbitraryQuery(
    s: PostgresDriver,
    contentTopic: seq[ContentTopic] = @[],
    pubsubTopic = none(PubsubTopic),
    cursor = none(ArchiveCursor),
    startTime = none(Timestamp),
    endTime = none(Timestamp),
    maxPageSize = DefaultPageSize,
    ascendingOrder = true,
): Future[ArchiveDriverResult[seq[ArchiveRow]]] {.async, deprecated.} =
  ## This proc allows to handle atypical queries. We don't use prepared statements for those.
  ##
  ## Each filter that is present adds one condition to the WHERE clause and
  ## its values to the `?` placeholder arguments, in the same order. Results
  ## are ordered by (storedAt, id) and limited to `maxPageSize`.

  # The column list must contain the nine columns parsed by
  # `rowCallbackImpl` (ending in `meta`); with fewer columns the callback
  # rejects the whole result set and no rows are returned.
  var query =
    """SELECT storedAt, contentTopic, payload, pubsubTopic, version, timestamp, id, messageHash, meta FROM messages"""
  var statements: seq[string]
  var args: seq[string]

  if contentTopic.len > 0:
    let cstmt = "contentTopic IN (" & "?".repeat(contentTopic.len).join(",") & ")"
    statements.add(cstmt)
    for t in contentTopic:
      args.add(t)

  if pubsubTopic.isSome():
    statements.add("pubsubTopic = ?")
    args.add(pubsubTopic.get())

  if cursor.isSome():
    # Page forward (>) when ascending, backward (<) when descending.
    let comp = if ascendingOrder: ">" else: "<"
    statements.add("(storedAt, id) " & comp & " (?,?)")
    args.add($cursor.get().storeTime)
    args.add(toHex(cursor.get().digest.data))

  if startTime.isSome():
    statements.add("storedAt >= ?")
    args.add($startTime.get())

  if endTime.isSome():
    statements.add("storedAt <= ?")
    args.add($endTime.get())

  if statements.len > 0:
    query &= " WHERE " & statements.join(" AND ")

  let direction = if ascendingOrder: "ASC" else: "DESC"
  query &= " ORDER BY storedAt " & direction & ", id " & direction

  query &= " LIMIT ?"
  args.add($maxPageSize)

  var rows: seq[(PubsubTopic, WakuMessage, seq[byte], Timestamp, WakuMessageHash)]
  proc rowCallback(pqResult: ptr PGresult) =
    rowCallbackImpl(pqResult, rows)

  (await s.readConnPool.pgQuery(query, args, rowCallback)).isOkOr:
    return err("failed to run query: " & $error)

  return ok(rows)
|
2023-05-31 08:28:48 +00:00
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
proc getMessagesPreparedStmt(
    s: PostgresDriver,
    contentTopic: string,
    pubsubTopic: PubsubTopic,
    cursor = none(ArchiveCursor),
    startTime: Timestamp,
    endTime: Timestamp,
    hashes: string,
    maxPageSize = DefaultPageSize,
    ascOrder = true,
): Future[ArchiveDriverResult[seq[ArchiveRow]]] {.async.} =
  ## This proc aims to run the most typical queries in a more performant way, i.e. by means of
  ## prepared statements.
  ##
  ## contentTopic - content topic bound to the `$1` placeholder
  ## hashes - hex-encoded message hash bound to the `$2` placeholder
  ## cursor - when set, the "with cursor" statement is used and the cursor's
  ##          (storeTime, hash) pair delimits the page
  ## ascOrder - selects the ascending or the descending statement
  ##
  ## Returns the parsed rows, or an error when the statement fails.

  var rows: seq[(PubsubTopic, WakuMessage, seq[byte], Timestamp, WakuMessageHash)]
  proc rowCallback(pqResult: ptr PGresult) =
    rowCallbackImpl(pqResult, rows)

  let startTimeStr = $startTime
  let endTimeStr = $endTime
  let limit = $maxPageSize

  if cursor.isSome():
    let stmtName =
      if ascOrder: SelectWithCursorAscStmtName else: SelectWithCursorDescStmtName
    let stmtDef =
      if ascOrder: SelectWithCursorAscStmtDef else: SelectWithCursorDescStmtDef

    let hash = toHex(cursor.get().hash)
    let storeTime = $cursor.get().storeTime

    # Order must match $1..$8 of the "with cursor" statements.
    let params = @[
      contentTopic, hashes, pubsubTopic, storeTime, hash, startTimeStr, endTimeStr,
      limit,
    ]
    # Derive lengths and formats from `params` so the three seqs always have
    # one entry per parameter (the length of `hashes` used to be missing,
    # which misaligned every following length).
    let paramLens = params.mapIt(int32(it.len))
    let paramFormats = newSeq[int32](params.len) # all zero, as before

    (
      await s.readConnPool.runStmt(
        stmtName, stmtDef, params, paramLens, paramFormats, rowCallback
      )
    ).isOkOr:
      return err("failed to run query with cursor: " & $error)
  else:
    let stmtName =
      if ascOrder: SelectNoCursorAscStmtName else: SelectNoCursorDescStmtName
    let stmtDef = if ascOrder: SelectNoCursorAscStmtDef else: SelectNoCursorDescStmtDef

    # Order must match $1..$6 of the "no cursor" statements.
    let params = @[contentTopic, hashes, pubsubTopic, startTimeStr, endTimeStr, limit]
    let paramLens = params.mapIt(int32(it.len))
    let paramFormats = newSeq[int32](params.len) # all zero, as before

    (
      await s.readConnPool.runStmt(
        stmtName, stmtDef, params, paramLens, paramFormats, rowCallback
      )
    ).isOkOr:
      return err("failed to run query without cursor: " & $error)

  return ok(rows)
|
|
|
|
|
|
|
|
proc getMessagesV2PreparedStmt(
    s: PostgresDriver,
    contentTopic: string,
    pubsubTopic: PubsubTopic,
    cursor = none(ArchiveCursor),
    startTime: Timestamp,
    endTime: Timestamp,
    maxPageSize = DefaultPageSize,
    ascOrder = true,
): Future[ArchiveDriverResult[seq[ArchiveRow]]] {.async, deprecated.} =
  ## Runs the most typical store-v2 queries by means of prepared statements,
  ## which is more performant than building the SQL on every call.
  ##
  ## contentTopic - content topic bound to the `$1` placeholder
  ## cursor - when set, the "with cursor" statement is used and the cursor's
  ##          (storeTime, digest) pair delimits the page
  ## ascOrder - selects the ascending or the descending statement

  var collected: seq[(PubsubTopic, WakuMessage, seq[byte], Timestamp, WakuMessageHash)]
  proc rowCallback(pqResult: ptr PGresult) =
    rowCallbackImpl(pqResult, collected)

  let
    startTimeStr = $startTime
    endTimeStr = $endTime
    limit = $maxPageSize

  if cursor.isNone():
    let stmtName =
      if ascOrder: SelectNoCursorV2AscStmtName else: SelectNoCursorV2DescStmtName
    let stmtDef =
      if ascOrder: SelectNoCursorV2AscStmtDef else: SelectNoCursorV2DescStmtDef

    # Order must match $1..$5 of the "no cursor" V2 statements.
    let params = @[contentTopic, pubsubTopic, startTimeStr, endTimeStr, limit]
    let paramLens = params.mapIt(int32(it.len))
    let paramFormats = newSeq[int32](params.len)

    let stmtRes = await s.readConnPool.runStmt(
      stmtName, stmtDef, params, paramLens, paramFormats, rowCallback
    )
    if stmtRes.isErr():
      return err("failed to run query without cursor: " & $stmtRes.error)
  else:
    let stmtName =
      if ascOrder: SelectWithCursorV2AscStmtName else: SelectWithCursorV2DescStmtName
    let stmtDef =
      if ascOrder: SelectWithCursorV2AscStmtDef else: SelectWithCursorV2DescStmtDef

    let digest = toHex(cursor.get().digest.data)
    let storeTime = $cursor.get().storeTime

    # Order must match $1..$7 of the "with cursor" V2 statements.
    let params =
      @[contentTopic, pubsubTopic, storeTime, digest, startTimeStr, endTimeStr, limit]
    let paramLens = params.mapIt(int32(it.len))
    let paramFormats = newSeq[int32](params.len)

    let stmtRes = await s.readConnPool.runStmt(
      stmtName, stmtDef, params, paramLens, paramFormats, rowCallback
    )
    if stmtRes.isErr():
      return err("failed to run query with cursor: " & $stmtRes.error)

  return ok(collected)
|
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
method getMessages*(
    s: PostgresDriver,
    includeData = false,
    contentTopicSeq = newSeq[ContentTopic](0),
    pubsubTopic = none(PubsubTopic),
    cursor = none(ArchiveCursor),
    startTime = none(Timestamp),
    endTime = none(Timestamp),
    hashes = newSeq[WakuMessageHash](0),
    maxPageSize = DefaultPageSize,
    ascendingOrder = true,
): Future[ArchiveDriverResult[seq[ArchiveRow]]] {.async.} =
  ## Retrieves stored messages that match the given filters.
  ##
  ## A query with exactly one content topic, exactly one hash, a pubsub
  ## topic and both time bounds is considered the most common one and is
  ## served through prepared statements. Anything else is an atypical query
  ## and is built dynamically, without prepared statements.
  ##
  ## `includeData` is not used by this implementation.
  let hexHashes = hashes.mapIt(toHex(it))

  let isTypicalQuery =
    contentTopicSeq.len == 1 and hexHashes.len == 1 and pubsubTopic.isSome() and
    startTime.isSome() and endTime.isSome()

  if not isTypicalQuery:
    return await s.getMessagesArbitraryQuery(
      contentTopicSeq, pubsubTopic, cursor, startTime, endTime, hexHashes, maxPageSize,
      ascendingOrder,
    )

  return await s.getMessagesPreparedStmt(
    contentTopicSeq.join(","),
    PubsubTopic(pubsubTopic.get()),
    cursor,
    startTime.get(),
    endTime.get(),
    hexHashes.join(","),
    maxPageSize,
    ascendingOrder,
  )
|
|
|
|
|
2024-04-25 13:09:52 +00:00
|
|
|
method getMessagesV2*(
    s: PostgresDriver,
    contentTopicSeq = newSeq[ContentTopic](0),
    pubsubTopic = none(PubsubTopic),
    cursor = none(ArchiveCursor),
    startTime = none(Timestamp),
    endTime = none(Timestamp),
    maxPageSize = DefaultPageSize,
    ascendingOrder = true,
): Future[ArchiveDriverResult[seq[ArchiveRow]]] {.async, deprecated.} =
  ## Store-v2 variant of the message retrieval.
  ##
  ## A query with exactly one content topic, a pubsub topic and both time
  ## bounds is considered the most common one and is served through prepared
  ## statements. Anything else is an atypical query and is built
  ## dynamically, without prepared statements.
  let isTypicalQuery =
    contentTopicSeq.len == 1 and pubsubTopic.isSome() and startTime.isSome() and
    endTime.isSome()

  if not isTypicalQuery:
    return await s.getMessagesV2ArbitraryQuery(
      contentTopicSeq, pubsubTopic, cursor, startTime, endTime, maxPageSize,
      ascendingOrder,
    )

  return await s.getMessagesV2PreparedStmt(
    contentTopicSeq.join(","),
    PubsubTopic(pubsubTopic.get()),
    cursor,
    startTime.get(),
    endTime.get(),
    maxPageSize,
    ascendingOrder,
  )
|
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
proc getStr(
    s: PostgresDriver, query: string
): Future[ArchiveDriverResult[string]] {.async.} =
  ## Performs a query that is expected to return a single string, i.e. a
  ## result with exactly one row and one column.
  ##
  ## When the result has another shape, an error is logged and the returned
  ## string is empty.

  var value: string
  proc rowCallback(pqResult: ptr PGresult) =
    if pqResult.pqnfields() != 1:
      error "Wrong number of fields in getStr"
      return

    if pqResult.pqNtuples() != 1:
      error "Wrong number of rows in getStr"
      return

    value = $(pqgetvalue(pqResult, 0, 0))

  let queryRes = await s.readConnPool.pgQuery(query, newSeq[string](0), rowCallback)
  if queryRes.isErr():
    return err("failed in getRow: " & $queryRes.error)

  return ok(value)
|
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
proc getInt(
    s: PostgresDriver, query: string
): Future[ArchiveDriverResult[int64]] {.async.} =
  ## Performs a query that is expected to return a single numeric value (int64).
  ##
  ## Fails when the underlying `getStr` fails or when the returned text is
  ## not a valid integer.

  let strRes = await s.getStr(query)
  if strRes.isErr():
    return err("could not get str in getInt: " & $strRes.error)

  let str = strRes.get()
  try:
    return ok(int64(parseInt(str)))
  except ValueError as exc:
    return err(
      "exception in getInt, parseInt, str: " & str & " query: " & query & " exception: " &
        exc.msg
    )
|
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
method getDatabaseSize*(
    s: PostgresDriver
): Future[ArchiveDriverResult[int64]] {.async.} =
  ## Returns the value of `pg_database_size` for the current database.
  let sizeRes = await s.getInt("SELECT pg_database_size(current_database())")
  if sizeRes.isErr():
    return err("error in getDatabaseSize: " & sizeRes.error)

  return ok(int64(sizeRes.get()))
|
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
method getMessagesCount*(
    s: PostgresDriver
): Future[ArchiveDriverResult[int64]] {.async.} =
  ## Returns the number of rows in the `messages` table.
  let count = (await s.getInt("SELECT COUNT(1) FROM messages")).valueOr:
    return err("error in getMessagesCount: " & error)

  return ok(count)
|
2023-05-31 08:28:48 +00:00
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
method getOldestMessageTimestamp*(
    s: PostgresDriver
): Future[ArchiveDriverResult[Timestamp]] {.async.} =
  ## Returns the oldest timestamp to consider for the archive.
  ##
  ## In some cases it could happen that we have empty partitions which are
  ## older than the current stored rows. In those cases we want to consider
  ## those older partitions as the oldest considered timestamp, so the
  ## result is the minimum of the oldest partition start time and the
  ## smallest stored `storedAt`.
  let partitionRes = s.partitionMngr.getOldestPartition()
  if partitionRes.isErr():
    return err("could not get oldest partition: " & $partitionRes.error)

  let oldestPartitionTimeNanoSec = partitionRes.get().getPartitionStartTimeInNanosec()

  let oldestStoredAt = (await s.getInt("SELECT MIN(storedAt) FROM messages")).valueOr:
    ## Just return the oldest partition time considering the partitions set
    return ok(Timestamp(oldestPartitionTimeNanoSec))

  return ok(Timestamp(min(oldestStoredAt, oldestPartitionTimeNanoSec)))
|
2023-05-31 08:28:48 +00:00
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
method getNewestMessageTimestamp*(
    s: PostgresDriver
): Future[ArchiveDriverResult[Timestamp]] {.async.} =
  ## Returns the greatest `storedAt` value found in the `messages` table.
  let newestStoredAt = (await s.getInt("SELECT MAX(storedAt) FROM messages")).valueOr:
    return err("error in getNewestMessageTimestamp: " & error)

  return ok(Timestamp(newestStoredAt))
|
|
|
|
|
|
|
|
method deleteOldestMessagesNotWithinLimit*(
    s: PostgresDriver, limit: int
): Future[ArchiveDriverResult[void]] {.async.} =
  ## Keeps only the `limit` rows with the greatest `storedAt` value and deletes
  ## every other row from the `messages` table.
  const deleteQuery =
    """DELETE FROM messages WHERE id NOT IN
                          (
                        SELECT id FROM messages ORDER BY storedAt DESC LIMIT ?
                          );"""

  (await s.writeConnPool.pgQuery(deleteQuery, @[$limit])).isOkOr:
    return err("error in deleteOldestMessagesNotWithinLimit: " & error)

  return ok()
|
2023-05-31 08:28:48 +00:00
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
method close*(s: PostgresDriver): Future[ArchiveDriverResult[void]] {.async.} =
  ## Stops the partition factory loop and closes both connection pools.
  ##
  ## Both pools are always asked to close, even if the first one fails. The
  ## write-pool error, if any, takes precedence over the read-pool one.

  ## Cancel the partition factory loop. The future is only set by
  ## `startPartitionFactory`, so it is nil when the factory was never started.
  if not s.futLoopPartitionFactory.isNil():
    s.futLoopPartitionFactory.cancel()

  ## Close the database connection
  let writeCloseRes = await s.writeConnPool.close()
  let readCloseRes = await s.readConnPool.close()

  writeCloseRes.isOkOr:
    return err("error closing write pool: " & $error)

  readCloseRes.isOkOr:
    return err("error closing read pool: " & $error)

  return ok()
|
2023-05-31 08:28:48 +00:00
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
proc sleep*(
    s: PostgresDriver, seconds: int
): Future[ArchiveDriverResult[void]] {.async.} =
  ## Testing helper: makes the database sleep for `seconds` seconds through
  ## `pg_sleep`, which is useful to check that requests are really asynchronous.

  proc ignoreRows(pqResult: ptr PGresult) =
    ## The query result carries nothing of interest
    discard

  try:
    let sleepRes =
      await s.writeConnPool.pgQuery("SELECT pg_sleep(?)", @[$seconds], ignoreRows)
    if sleepRes.isErr():
      return err("error in postgres_driver sleep: " & $sleepRes.error)
  except DbError:
    # This always raises an exception although the sleep works
    return err("exception sleeping: " & getCurrentExceptionMsg())

  return ok()
|
2024-03-01 11:05:27 +00:00
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
proc performWriteQuery*(
    s: PostgresDriver, query: string
): Future[ArchiveDriverResult[void]] {.async.} =
  ## Runs, through the write connection pool, a query that is expected to
  ## modify the state of the database.
  let queryRes = await s.writeConnPool.pgQuery(query)
  if queryRes.isErr():
    return err("error in performWriteQuery: " & $queryRes.error)

  return ok()
|
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
proc addPartition(
    self: PostgresDriver, startTime: Timestamp, duration: timer.Duration
): Future[ArchiveDriverResult[void]] {.async.} =
  ## Creates the partition table holding the messages whose `storedAt` falls in
  ## `startTime` <= storedAt < `startTime + duration`, and registers it in the
  ## partition manager.
  ## `startTime` is measured in seconds since epoch.

  let partitionStart = startTime
  let partitionEnd = startTime + duration.seconds

  let startSecStr = $partitionStart
  let endSecStr = $partitionEnd

  ## The table name carries the range in seconds...
  let partitionName = "messages_" & startSecStr & "_" & endSecStr

  ## ...whereas the partition bounds are given in nanoseconds, which are
  ## obtained by appending nine zeros to the decimal seconds representation.
  let lowerBoundNanoSec = startSecStr & "000000000"
  let upperBoundNanoSec = endSecStr & "000000000"

  let createPartitionQuery =
    "CREATE TABLE IF NOT EXISTS " & partitionName & " PARTITION OF " &
    "messages FOR VALUES FROM ('" & lowerBoundNanoSec & "') TO ('" & upperBoundNanoSec &
    "');"

  let createRes = await self.performWriteQuery(createPartitionQuery)
  if createRes.isErr():
    return err("error adding partition [" & partitionName & "]: " & $createRes.error)

  debug "new partition added", query = createPartitionQuery

  self.partitionMngr.addPartitionInfo(partitionName, partitionStart, partitionEnd)
  return ok()
|
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
proc initializePartitionsInfo(
    self: PostgresDriver
): Future[ArchiveDriverResult[void]] {.async.} =
  ## Retrieves the partitions list and registers every partition, together with
  ## the time range encoded in its name, in the partition manager.
  let partitionNames = (await self.getPartitionsList()).valueOr:
    return err("Could not retrieve partitions list: " & $error)

  for partitionName in partitionNames:
    ## partitionName contains something like 'messages_1708449815_1708449875'
    let rangeParts = partitionName.replace("messages_", "").split("_")
    if rangeParts.len != 2:
      return err(fmt"loopPartitionFactory wrong partition name {partitionName}")

    var rangeStart: int64
    try:
      rangeStart = parseInt(rangeParts[0])
    except ValueError:
      return err("Could not parse beginning time: " & getCurrentExceptionMsg())

    var rangeEnd: int64
    try:
      rangeEnd = parseInt(rangeParts[1])
    except ValueError:
      return err("Could not parse end time: " & getCurrentExceptionMsg())

    self.partitionMngr.addPartitionInfo(partitionName, rangeStart, rangeEnd)

  return ok()
|
|
|
|
|
|
|
|
const DefaultDatabasePartitionCheckTimeInterval = timer.minutes(10) ## Pause between two consecutive checks in loopPartitionFactory
|
|
|
|
const PartitionsRangeInterval = timer.hours(1) ## Time range covered by each partition
|
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
proc loopPartitionFactory(
    self: PostgresDriver, onFatalError: OnFatalErrorHandler
) {.async.} =
  ## Endless loop that periodically checks whether a new partition is needed
  ## and creates it in that case. Any failure is reported through `onFatalError`.
  ## Partitions are only created here: their removal is handled by the
  ## retention policy modules.

  debug "starting loopPartitionFactory"

  if PartitionsRangeInterval < DefaultDatabasePartitionCheckTimeInterval:
    onFatalError(
      "partition factory partition range interval should be bigger than check interval"
    )

  ## Before anything else, load the existing partitions into the partition manager
  let initRes = await self.initializePartitionsInfo()
  if initRes.isErr():
    onFatalError("issue in loopPartitionFactory: " & $initRes.error)

  while true:
    trace "Check if we need to create a new partition"

    let nowInSec = times.now().toTime().toUnix()

    if self.partitionMngr.isEmpty():
      debug "adding partition because now there aren't more partitions"
      let addRes = await self.addPartition(nowInSec, PartitionsRangeInterval)
      if addRes.isErr():
        onFatalError(
          "error when creating a new partition from empty state: " & $addRes.error
        )
    else:
      let newestPartitionRes = self.partitionMngr.getNewestPartition()
      if newestPartitionRes.isErr():
        onFatalError("could not get newest partition: " & $newestPartitionRes.error)

      let newestPartition = newestPartitionRes.get()
      if newestPartition.containsMoment(nowInSec):
        debug "creating a new partition for the future"
        ## The partition in use is the newest one, so a further partition is
        ## created right after it to be ready for upcoming messages.
        let addRes = await self.addPartition(
          newestPartition.getLastMoment(), PartitionsRangeInterval
        )
        if addRes.isErr():
          onFatalError("could not add the next partition for 'now': " & $addRes.error)
      elif nowInSec >= newestPartition.getLastMoment():
        debug "creating a new partition to contain current messages"
        ## No partition covers the current time, which happens if the node has
        ## been stopped for quite a long time. Create the one that contains 'now'.
        let addRes = await self.addPartition(nowInSec, PartitionsRangeInterval)
        if addRes.isErr():
          onFatalError("could not add the next partition: " & $addRes.error)

    await sleepAsync(DefaultDatabasePartitionCheckTimeInterval)
|
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
proc startPartitionFactory*(
    self: PostgresDriver, onFatalError: OnFatalErrorHandler
) {.async.} =
  ## Launches the partition factory loop without awaiting it. The resulting
  ## future is stored in the driver, which cancels it when it is closed.
  let loopFut = self.loopPartitionFactory(onFatalError)
  self.futLoopPartitionFactory = loopFut
|
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
proc getTableSize*(
    self: PostgresDriver, tableName: string
): Future[ArchiveDriverResult[string]] {.async.} =
  ## Returns a human-readable representation of the size for the requested table.
  ## tableName - table of interest.
  ##
  ## NOTE(review): `tableName` is interpolated verbatim into the SQL text, so it
  ## must never come from untrusted input.

  let tableSize = (
    await self.getStr(
      fmt"""
        SELECT pg_size_pretty(pg_total_relation_size(C.oid)) AS "total_size"
        FROM pg_class C
        where relname = '{tableName}'"""
    )
  ).valueOr:
    ## Report the failure under this proc's own name (it used to be mislabelled
    ## as coming from getDatabaseSize)
    return err("error in getTableSize: " & error)

  return ok(tableSize)
|
|
|
|
|
2024-05-07 21:42:01 +00:00
|
|
|
proc removePartition(
    self: PostgresDriver, partitionName: string
): Future[ArchiveDriverResult[void]] {.async.} =
  ## Detaches the given partition from the `messages` table, drops it and then
  ## removes the oldest partition entry from the partition manager.

  ## The size is only used for logging, hence a failure to get it is not an error
  let partSize = (await self.getTableSize(partitionName)).valueOr:
    ""

  ## Detach and remove the partition concurrently to not block the parent table (messages)
  let detachPartitionQuery =
    "ALTER TABLE messages DETACH PARTITION " & partitionName & " CONCURRENTLY;"
  debug "removeOldestPartition", query = detachPartitionQuery
  let detachRes = await self.performWriteQuery(detachPartitionQuery)
  if detachRes.isErr():
    return err("error in " & detachPartitionQuery & ": " & $detachRes.error)

  ## Once detached, the partition is a standalone table that can be dropped
  let dropPartitionQuery = "DROP TABLE " & partitionName
  debug "removeOldestPartition drop partition", query = dropPartitionQuery
  let dropRes = await self.performWriteQuery(dropPartitionQuery)
  if dropRes.isErr():
    return err("error in " & dropPartitionQuery & ": " & $dropRes.error)

  debug "removed partition", partition_name = partitionName, partition_size = partSize
  self.partitionMngr.removeOldestPartitionName()

  return ok()
|
|
|
|
|
2024-05-07 21:42:01 +00:00
|
|
|
proc removePartitionsOlderThan(
    self: PostgresDriver, tsInNanoSec: Timestamp
): Future[ArchiveDriverResult[void]] {.async.} =
  ## Removes, starting from the oldest one, the partitions whose whole time
  ## range lies before the specified timestamp.
  ## tsInNanoSec - reference timestamp, in nanoseconds since epoch.
  ##
  ## Partitions that contain the timestamp, or that are newer than it, are kept.
  ## An error is returned if a removal fails or if no partition is left to inspect.

  ## Plain integer division: converting through float loses precision for
  ## nanosecond-sized values and could round across a second boundary.
  let tsInSec = Timestamp(int64(tsInNanoSec) div 1_000_000_000)

  var oldestPartition = self.partitionMngr.getOldestPartition().valueOr:
    return err("could not get oldest partition in removePartitionOlderThan: " & $error)

  ## Only drop a partition when it ends at or before the timestamp. Checking
  ## merely that the partition doesn't contain the timestamp would also drop
  ## partitions that are newer than it (e.g. timestamp older than every
  ## partition, or falling in a gap between partitions).
  while oldestPartition.getLastMoment() <= tsInSec:
    (await self.removePartition(oldestPartition.getName())).isOkOr:
      return err("issue in removePartitionsOlderThan: " & $error)

    oldestPartition = self.partitionMngr.getOldestPartition().valueOr:
      return err(
        "could not get partition in removePartitionOlderThan in while loop: " & $error
      )

  ## We reached a partition that is not older than the target timestamp, and
  ## we don't want to remove it
  return ok()
|
|
|
|
|
|
|
|
proc removeOldestPartition(
    self: PostgresDriver, forceRemoval: bool = false, ## To allow cleanup in tests
): Future[ArchiveDriverResult[void]] {.async.} =
  ## Indirectly called from the retention policy.
  ## Removes the oldest partition, unless it is the partition that stores the
  ## current messages and `forceRemoval` is not set.

  let oldestPartitionRes = self.partitionMngr.getOldestPartition()
  if oldestPartitionRes.isErr():
    return err("could not remove oldest partition: " & $oldestPartitionRes.error)

  let oldestPartition = oldestPartitionRes.get()

  if not forceRemoval:
    let nowInSec = times.now().toTime().toUnix()
    let currentPartitionRes = self.partitionMngr.getPartitionFromDateTime(nowInSec)

    ## When the database contains a partition that would store current
    ## messages, that partition must not be removed.
    if currentPartitionRes.isOk() and currentPartitionRes.get() == oldestPartition:
      debug "Skipping to remove the current partition"
      return ok()

  return await self.removePartition(oldestPartition.getName())
|
|
|
|
|
2024-03-06 19:50:22 +00:00
|
|
|
proc containsAnyPartition*(self: PostgresDriver): bool =
  ## Tells whether the partition manager holds at least one partition.
  not self.partitionMngr.isEmpty()
|
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
method decreaseDatabaseSize*(
    driver: PostgresDriver, targetSizeInBytes: int64, forceRemoval: bool = false
): Future[ArchiveDriverResult[void]] {.async.} =
  ## Removes the oldest partitions, one at a time, until the database size is
  ## not greater than `targetSizeInBytes` or there are no partitions left.
  ## `forceRemoval` is forwarded to `removeOldestPartition`.
  ## An error is returned if a removal doesn't change the database size.

  ## database size in bytes
  var totalSizeOfDB: int64 = (await driver.getDatabaseSize()).valueOr:
    return err("decreaseDatabaseSize failed to get database size: " & $error)

  if totalSizeOfDB <= targetSizeInBytes:
    return ok()

  debug "start reducing database size",
    targetSize = $targetSizeInBytes, currentSize = $totalSizeOfDB

  while totalSizeOfDB > targetSizeInBytes and driver.containsAnyPartition():
    let removalRes = await driver.removeOldestPartition(forceRemoval)
    if removalRes.isErr():
      return err(
        "decreaseDatabaseSize inside loop failed to remove oldest partition: " &
          $removalRes.error
      )

    let newCurrentSize: int64 = (await driver.getDatabaseSize()).valueOr:
      return
        err("decreaseDatabaseSize inside loop failed to get database size: " & $error)

    ## Bail out instead of looping when the removal had no effect on the size
    if newCurrentSize == totalSizeOfDB:
      return err("the previous partition removal didn't clear database size")

    totalSizeOfDB = newCurrentSize

    debug "reducing database size",
      targetSize = $targetSizeInBytes, newCurrentSize = $totalSizeOfDB

  return ok()
|
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
method existsTable*(
    s: PostgresDriver, tableName: string
): Future[ArchiveDriverResult[bool]] {.async.} =
  ## Tells whether `pg_tables` lists a table named `tableName`.
  let query: string =
    fmt"""
    SELECT EXISTS (
      SELECT FROM
          pg_tables
      WHERE
          tablename = '{tableName}'
      );
    """

  ## Raw textual value of the only expected cell. It stays empty if the
  ## result doesn't have the expected shape.
  var existsFlag: string

  proc readExistsFlag(pqResult: ptr PGresult) =
    if pqResult.pqnfields() != 1:
      error "Wrong number of fields in existsTable"
      return

    if pqResult.pqNtuples() != 1:
      error "Wrong number of rows in existsTable"
      return

    existsFlag = $(pqgetvalue(pqResult, 0, 0))

  let queryRes = await s.readConnPool.pgQuery(query, newSeq[string](0), readExistsFlag)
  if queryRes.isErr():
    return err("existsTable failed in getRow: " & $queryRes.error)

  ## Only the value "t" is considered as 'the table exists'
  return ok(existsFlag == "t")
|
|
|
|
|
2024-03-15 23:08:47 +00:00
|
|
|
proc getCurrentVersion*(
    s: PostgresDriver
): Future[ArchiveDriverResult[int64]] {.async.} =
  ## Returns the value stored in the `version` table, or 0 if that table
  ## doesn't exist.
  let existsVersionTable = (await s.existsTable("version")).valueOr:
    return err("error in getCurrentVersion-existsTable: " & $error)

  if not existsVersionTable:
    return ok(0)

  ## Plain literal: the query has nothing to interpolate
  let res = (await s.getInt("SELECT version FROM version")).valueOr:
    ## Report the failure under this proc's own name (it used to be mislabelled
    ## as coming from getMessagesCount)
    return err("error in getCurrentVersion: " & $error)

  return ok(res)
|
2024-05-07 21:42:01 +00:00
|
|
|
|
|
|
|
method deleteMessagesOlderThanTimestamp*(
    s: PostgresDriver, tsNanoSec: Timestamp
): Future[ArchiveDriverResult[void]] {.async.} =
  ## Deletes the messages whose `storedAt` is lower than `tsNanoSec`.
  ##
  ## The older partitions are removed first so that the database size can be
  ## reduced, and then the remaining older rows are deleted.
  let partitionsRes = await s.removePartitionsOlderThan(tsNanoSec)
  if partitionsRes.isErr():
    return err("error while removing older partitions: " & $partitionsRes.error)

  let deleteQuery = "DELETE FROM messages WHERE storedAt < " & $tsNanoSec
  let deleteRes = await s.writeConnPool.pgQuery(deleteQuery)
  if deleteRes.isErr():
    return err("error in deleteMessagesOlderThanTimestamp: " & $deleteRes.error)

  return ok()
|