2024-06-28 16:04:57 +05:30
{. push raises : [ ] . }
2022-11-22 19:40:24 +01:00
2024-07-09 13:14:28 +02:00
import results , chronicles , chronos
2024-03-16 00:08:47 +01:00
import .. / driver , .. / retention_policy
2022-11-22 19:40:24 +01:00
# Module-wide logging scope; presumably every chronicles log statement in this
# file is tagged with the topics below (confirm against chronicles docs).
logScope:
  topics = " waku archive retention_policy "
const
  DefaultCapacity*: int = 25_000
    ## Capacity used by `CapacityRetentionPolicy.new` when the caller does not
    ## pass one.
  MaxOverflow = 1.3
    ## Factor applied to `capacity` to obtain the total number of messages
    ## tolerated before old messages are deleted.
type
  CapacityRetentionPolicy* = ref object of RetentionPolicy
    ## Retention policy that implements auto deletion as follows:
    ##
    ## - The sqlite DB will store up to
    ##   `totalCapacity = capacity * MaxOverflow` messages, giving an
    ##   overflow window of `overflowWindow = capacity * (MaxOverflow - 1)`.
    ##
    ## - In case of an overflow, messages are sorted by `receiverTimestamp`
    ##   and the oldest ones are deleted. The number of messages that get
    ##   deleted is `deleteWindow = overflowWindow / 2`, bringing the total
    ##   number of stored messages back to `capacity + (overflowWindow / 2)`.
    ##
    ## The rationale for batch deleting is efficiency. Half of the overflow
    ## window is kept in addition to `capacity` because the oldest messages
    ## are selected with respect to `receiverTimestamp` instead of
    ## `senderTimestamp`. `receiverTimestamp` is guaranteed to be set, while
    ## senders could omit setting `senderTimestamp`. However,
    ## `receiverTimestamp` can differ from node to node for the same message,
    ## so sorting by it might (slightly) prioritize some actually older
    ## messages; keeping half of the overflow window compensates for that.
    capacity: int
      ## Both the number of messages that are persisted in the sqlite DB
      ## (excluding the overflow window explained above) and the number of
      ## messages that get loaded via `getAll`.
    totalCapacity: int
      ## `capacity * MaxOverflow`.
    deleteWindow: int
      ## `capacity * (MaxOverflow - 1) / 2`: half of the overflow window, the
      ## amount of messages deleted when an overflow occurs.
2022-11-22 19:40:24 +01:00
proc calculateTotalCapacity(capacity: int, overflow: float): int =
  ## Returns `capacity` scaled by the `overflow` factor, converted back to an
  ## integer (any fractional part of the product is discarded).
  let scaled = capacity.float * overflow
  scaled.int
proc calculateOverflowWindow(capacity: int, overflow: float): int =
  ## Returns how many messages beyond `capacity` are allowed for the given
  ## `overflow` factor, i.e. `capacity * (overflow - 1)` converted to an
  ## integer (any fractional part is discarded).
  let excessFactor = overflow - 1
  int(capacity.float * excessFactor)
proc calculateDeleteWindow(capacity: int, overflow: float): int =
  ## Returns half of the overflow window (integer division) computed by
  ## `calculateOverflowWindow` for the same arguments.
  let overflowWindow = calculateOverflowWindow(capacity, overflow)
  overflowWindow div 2
2024-03-16 00:08:47 +01:00
proc new*(T: type CapacityRetentionPolicy, capacity = DefaultCapacity): T =
  ## Creates a `CapacityRetentionPolicy` for the given `capacity`
  ## (`DefaultCapacity` when omitted). `totalCapacity` and `deleteWindow` are
  ## derived from `capacity` and the module-level `MaxOverflow` factor.
  CapacityRetentionPolicy(
    capacity: capacity,
    totalCapacity: calculateTotalCapacity(capacity, MaxOverflow),
    deleteWindow: calculateDeleteWindow(capacity, MaxOverflow),
  )
2024-03-16 00:08:47 +01:00
method execute*(
    p: CapacityRetentionPolicy, driver: ArchiveDriver
): Future[RetentionPolicyResult[void]] {.async.} =
  ## Applies the capacity policy to `driver`.
  ##
  ## Queries the current message count; when it has reached
  ## `p.totalCapacity`, asks the driver to delete the oldest messages that do
  ## not fit within a limit of `p.capacity + p.deleteWindow`.
  ##
  ## Returns `ok()` when nothing had to be deleted or the deletion succeeded,
  ## and an `err` carrying a prefixed message when either driver call fails.
  let storedCount = (await driver.getMessagesCount()).valueOr:
    return err(" failed to get messages count: " & error)

  # Only act once the overflow window is exhausted; below that the archive is
  # left untouched.
  if storedCount >= p.totalCapacity:
    let retainLimit = p.capacity + p.deleteWindow
    (await driver.deleteOldestMessagesNotWithinLimit(limit = retainLimit)).isOkOr:
      return err(" deleting oldest messages failed: " & error)

  return ok()