2023-08-01 13:05:16 +00:00
|
|
|
|
## Waku autosharding utils
|
|
|
|
|
##
|
|
|
|
|
## See 51/WAKU2-RELAY-SHARDING RFC: https://rfc.vac.dev/spec/51/#automatic-sharding
|
|
|
|
|
|
|
|
|
|
when (NimMajor, NimMinor) < (1, 4):
|
|
|
|
|
{.push raises: [Defect].}
|
|
|
|
|
else:
|
|
|
|
|
{.push raises: [].}
|
|
|
|
|
|
|
|
|
|
import
|
|
|
|
|
nimcrypto,
|
|
|
|
|
std/options,
|
2023-08-17 12:11:18 +00:00
|
|
|
|
std/tables,
|
2023-08-01 13:05:16 +00:00
|
|
|
|
stew/endians2,
|
|
|
|
|
stew/results,
|
|
|
|
|
stew/byteutils
|
|
|
|
|
|
|
|
|
|
import
|
|
|
|
|
./content_topic,
|
|
|
|
|
./pubsub_topic
|
|
|
|
|
|
2024-03-13 09:58:13 +00:00
|
|
|
|
type Sharding* = object
|
|
|
|
|
clusterId*: uint32
|
|
|
|
|
# TODO: generations could be stored in a table here
|
|
|
|
|
shardCountGenZero*: uint32
|
2023-08-17 12:11:18 +00:00
|
|
|
|
|
2024-03-13 09:58:13 +00:00
|
|
|
|
proc new*(T: type Sharding, clusterId: uint32, shardCount: uint32): T =
|
|
|
|
|
return Sharding(clusterId: clusterId, shardCountGenZero: shardCount)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
proc getGenZeroShard*(s: Sharding, topic: NsContentTopic, count: int): NsPubsubTopic =
|
2023-08-17 12:11:18 +00:00
|
|
|
|
let bytes = toBytes(topic.application) & toBytes(topic.version)
|
|
|
|
|
|
|
|
|
|
let hash = sha256.digest(bytes)
|
|
|
|
|
|
|
|
|
|
# We only use the last 64 bits of the hash as having more shards is unlikely.
|
|
|
|
|
let hashValue = uint64.fromBytesBE(hash.data[24..31])
|
|
|
|
|
|
|
|
|
|
# This is equilavent to modulo shard count but faster
|
|
|
|
|
let shard = hashValue and uint64((count - 1))
|
|
|
|
|
|
2024-03-13 09:58:13 +00:00
|
|
|
|
NsPubsubTopic.staticSharding(uint16(s.clusterId), uint16(shard))
|
|
|
|
|
|
|
|
|
|
proc getShard*(s: Sharding, topic: NsContentTopic): Result[NsPubsubTopic, string] =
|
2023-08-17 12:11:18 +00:00
|
|
|
|
## Compute the (pubsub topic) shard to use for this content topic.
|
2024-03-13 09:58:13 +00:00
|
|
|
|
|
2023-08-17 12:11:18 +00:00
|
|
|
|
if topic.generation.isNone():
|
|
|
|
|
## Implicit generation # is 0 for all content topic
|
2024-03-13 09:58:13 +00:00
|
|
|
|
return ok(s.getGenZeroShard(topic, int(s.shardCountGenZero)))
|
|
|
|
|
|
2023-08-17 12:11:18 +00:00
|
|
|
|
case topic.generation.get():
|
2024-03-13 09:58:13 +00:00
|
|
|
|
of 0: return ok(s.getGenZeroShard(topic, int(s.shardCountGenZero)))
|
2023-08-17 12:11:18 +00:00
|
|
|
|
else: return err("Generation > 0 are not supported yet")
|
|
|
|
|
|
2024-03-13 09:58:13 +00:00
|
|
|
|
proc getShard*(s: Sharding, topic: ContentTopic): Result[PubsubTopic, string] =
|
2023-08-31 20:13:45 +00:00
|
|
|
|
let parsedTopic = NsContentTopic.parse(topic).valueOr:
|
|
|
|
|
return err($error)
|
|
|
|
|
|
2024-03-13 09:58:13 +00:00
|
|
|
|
let shard = ?s.getShard(parsedTopic)
|
2023-08-31 20:13:45 +00:00
|
|
|
|
|
|
|
|
|
ok($shard)
|
|
|
|
|
|
2024-03-13 09:58:13 +00:00
|
|
|
|
proc parseSharding*(s: Sharding, pubsubTopic: Option[PubsubTopic], contentTopics: ContentTopic|seq[ContentTopic]): Result[Table[NsPubsubTopic, seq[NsContentTopic]], string] =
|
2023-08-17 12:11:18 +00:00
|
|
|
|
var topics: seq[ContentTopic]
|
|
|
|
|
when contentTopics is seq[ContentTopic]:
|
|
|
|
|
topics = contentTopics
|
|
|
|
|
else:
|
|
|
|
|
topics = @[contentTopics]
|
2024-03-13 09:58:13 +00:00
|
|
|
|
|
2023-08-17 12:11:18 +00:00
|
|
|
|
var topicMap = initTable[NsPubsubTopic, seq[NsContentTopic]]()
|
|
|
|
|
for contentTopic in topics:
|
|
|
|
|
let parseRes = NsContentTopic.parse(contentTopic)
|
|
|
|
|
|
|
|
|
|
let content =
|
|
|
|
|
if parseRes.isErr():
|
|
|
|
|
return err("Cannot parse content topic: " & $parseRes.error)
|
|
|
|
|
else: parseRes.get()
|
|
|
|
|
|
|
|
|
|
let pubsub =
|
|
|
|
|
if pubsubTopic.isSome():
|
|
|
|
|
let parseRes = NsPubsubTopic.parse(pubsubTopic.get())
|
|
|
|
|
|
|
|
|
|
if parseRes.isErr():
|
|
|
|
|
return err("Cannot parse pubsub topic: " & $parseRes.error)
|
|
|
|
|
else: parseRes.get()
|
|
|
|
|
else:
|
2024-03-13 09:58:13 +00:00
|
|
|
|
let shardsRes = s.getShard(content)
|
2023-08-17 12:11:18 +00:00
|
|
|
|
|
|
|
|
|
if shardsRes.isErr():
|
|
|
|
|
return err("Cannot autoshard content topic: " & $shardsRes.error)
|
|
|
|
|
else: shardsRes.get()
|
2024-01-04 15:26:27 +00:00
|
|
|
|
|
2023-08-17 12:11:18 +00:00
|
|
|
|
if not topicMap.hasKey(pubsub):
|
|
|
|
|
topicMap[pubsub] = @[]
|
2024-03-13 09:58:13 +00:00
|
|
|
|
|
2023-08-17 12:11:18 +00:00
|
|
|
|
try:
|
|
|
|
|
topicMap[pubsub].add(content)
|
|
|
|
|
except CatchableError:
|
|
|
|
|
return err(getCurrentExceptionMsg())
|
|
|
|
|
|
|
|
|
|
ok(topicMap)
|
|
|
|
|
|
|
|
|
|
#type ShardsPriority = seq[tuple[topic: NsPubsubTopic, value: float64]]
|
|
|
|
|
|
|
|
|
|
#[ proc shardCount*(topic: NsContentTopic): Result[int, string] =
|
|
|
|
|
## Returns the total shard count from the content topic.
|
2023-08-01 13:05:16 +00:00
|
|
|
|
let shardCount =
|
|
|
|
|
if topic.generation.isNone():
|
|
|
|
|
## Implicit generation # is 0 for all content topic
|
|
|
|
|
GenerationZeroShardsCount
|
|
|
|
|
else:
|
|
|
|
|
case topic.generation.get():
|
|
|
|
|
of 0:
|
|
|
|
|
GenerationZeroShardsCount
|
|
|
|
|
else:
|
|
|
|
|
return err("Generation > 0 are not supported yet")
|
|
|
|
|
|
2023-08-17 12:11:18 +00:00
|
|
|
|
ok((shardCount)) ]#
|
2023-08-01 13:05:16 +00:00
|
|
|
|
|
2023-08-17 12:11:18 +00:00
|
|
|
|
#[ proc applyWeight(hashValue: uint64, weight: float64): float64 =
|
|
|
|
|
(-weight) / math.ln(float64(hashValue) / float64(high(uint64))) ]#
|
2023-08-01 13:05:16 +00:00
|
|
|
|
|
2023-08-17 12:11:18 +00:00
|
|
|
|
#[ proc hashOrder*(x, y: (NsPubsubTopic, float64)): int =
|
|
|
|
|
cmp(x[1], y[1]) ]#
|
2023-08-01 13:05:16 +00:00
|
|
|
|
|
2023-08-17 12:11:18 +00:00
|
|
|
|
#[ proc weightedShardList*(topic: NsContentTopic, shardCount: int, weightList: seq[float64]): Result[ShardsPriority, string] =
|
2023-08-01 13:05:16 +00:00
|
|
|
|
## Returns the ordered list of shards and their priority values.
|
|
|
|
|
if weightList.len < shardCount:
|
|
|
|
|
return err("Must provide weights for every shards")
|
|
|
|
|
|
|
|
|
|
let shardsNWeights = zip(toSeq(0..shardCount), weightList)
|
|
|
|
|
|
|
|
|
|
var list = newSeq[(NsPubsubTopic, float64)](shardCount)
|
|
|
|
|
|
|
|
|
|
for (shard, weight) in shardsNWeights:
|
2023-10-05 12:37:05 +00:00
|
|
|
|
let pubsub = NsPubsubTopic.staticSharding(ClusterId, uint16(shard))
|
2023-08-01 13:05:16 +00:00
|
|
|
|
|
2023-10-05 12:37:05 +00:00
|
|
|
|
let clusterBytes = toBytesBE(uint16(ClusterId))
|
2023-08-01 13:05:16 +00:00
|
|
|
|
let shardBytes = toBytesBE(uint16(shard))
|
|
|
|
|
let bytes = toBytes(topic.application) & toBytes(topic.version) & @clusterBytes & @shardBytes
|
|
|
|
|
let hash = sha256.digest(bytes)
|
|
|
|
|
let hashValue = uint64.fromBytesBE(hash.data)
|
|
|
|
|
let value = applyWeight(hashValue, weight)
|
|
|
|
|
|
|
|
|
|
list[shard] = (pubsub, value)
|
|
|
|
|
|
|
|
|
|
list.sort(hashOrder)
|
|
|
|
|
|
2023-08-17 12:11:18 +00:00
|
|
|
|
ok(list) ]#
|
2023-08-01 13:05:16 +00:00
|
|
|
|
|
2023-08-17 12:11:18 +00:00
|
|
|
|
#[ proc singleHighestWeigthShard*(topic: NsContentTopic): Result[NsPubsubTopic, string] =
|
2023-08-01 13:05:16 +00:00
|
|
|
|
let count = ? shardCount(topic)
|
|
|
|
|
|
2023-08-17 12:11:18 +00:00
|
|
|
|
let weights = repeat(1.0, count)
|
2023-08-01 13:05:16 +00:00
|
|
|
|
|
|
|
|
|
let list = ? weightedShardList(topic, count, weights)
|
|
|
|
|
|
|
|
|
|
let (pubsub, _) = list[list.len - 1]
|
|
|
|
|
|
2024-03-13 09:58:13 +00:00
|
|
|
|
ok(pubsub) ]#
|