2022-11-22 18:40:24 +00:00
when ( NimMajor , NimMinor ) < ( 1 , 4 ) :
{. push raises : [ Defect ] . }
else :
{. push raises : [ ] . }
import
stew / results ,
2023-05-25 15:34:34 +00:00
chronicles ,
chronos
2022-11-22 18:40:24 +00:00
import
.. / driver ,
.. / retention_policy
logScope :
topics = " waku archive retention_policy "
const DefaultCapacity * : int = 25_000
const MaxOverflow = 1 .3
type
# CapacityRetentionPolicy implements auto deletion as follows:
# - The sqlite DB will driver up to `totalCapacity = capacity` * `MaxOverflow` messages,
# giving an overflowWindow of `capacity * (MaxOverflow - 1) = overflowWindow`.
#
# - In case of an overflow, messages are sorted by `receiverTimestamp` and the oldest ones are
# deleted. The number of messages that get deleted is `(overflowWindow / 2) = deleteWindow`,
# bringing the total number of driverd messages back to `capacity + (overflowWindow / 2)`.
#
# The rationale for batch deleting is efficiency. We keep half of the overflow window in addition
# to `capacity` because we delete the oldest messages with respect to `receiverTimestamp` instead of
# `senderTimestamp`. `ReceiverTimestamp` is guaranteed to be set, while senders could omit setting
# `senderTimestamp`. However, `receiverTimestamp` can differ from node to node for the same message.
# So sorting by `receiverTimestamp` might (slightly) prioritize some actually older messages and we
# compensate that by keeping half of the overflow window.
CapacityRetentionPolicy * = ref object of RetentionPolicy
capacity : int # represents both the number of messages that are persisted in the sqlite DB (excl. the overflow window explained above), and the number of messages that get loaded via `getAll`.
totalCapacity : int # = capacity * MaxOverflow
deleteWindow : int # = capacity * (MaxOverflow - 1) / 2; half of the overflow window, the amount of messages deleted when overflow occurs
proc calculateTotalCapacity ( capacity : int , overflow : float ) : int =
int ( float ( capacity ) * overflow )
proc calculateOverflowWindow ( capacity : int , overflow : float ) : int =
int ( float ( capacity ) * ( overflow - 1 ) )
proc calculateDeleteWindow ( capacity : int , overflow : float ) : int =
calculateOverflowWindow ( capacity , overflow ) div 2
proc init * ( T : type CapacityRetentionPolicy , capacity = DefaultCapacity ) : T =
let
totalCapacity = calculateTotalCapacity ( capacity , MaxOverflow )
deleteWindow = calculateDeleteWindow ( capacity , MaxOverflow )
CapacityRetentionPolicy (
capacity : capacity ,
totalCapacity : totalCapacity ,
deleteWindow : deleteWindow
)
2023-05-25 15:34:34 +00:00
method execute * ( p : CapacityRetentionPolicy ,
driver : ArchiveDriver ) :
Future [ RetentionPolicyResult [ void ] ] {. async . } =
let numMessagesRes = await driver . getMessagesCount ( )
if numMessagesRes . isErr ( ) :
return err ( " failed to get messages count: " & numMessagesRes . error )
let numMessages = numMessagesRes . value
2022-11-22 18:40:24 +00:00
if numMessages < p . totalCapacity :
return ok ( )
2023-05-25 15:34:34 +00:00
let res = await driver . deleteOldestMessagesNotWithinLimit ( limit = p . capacity + p . deleteWindow )
2022-11-22 18:40:24 +00:00
if res . isErr ( ) :
2023-05-25 15:34:34 +00:00
return err ( " deleting oldest messages failed: " & res . error )
2022-11-22 18:40:24 +00:00
2023-10-10 09:59:09 +00:00
# vacuum to get the deleted pages defragments to save storage space
# this will resize the database size
let resVaccum = await driver . performVacuum ( )
if resVaccum . isErr ( ) :
return err ( " vacuumming failed: " & resVaccum . error )
2023-05-25 15:34:34 +00:00
return ok ( )