2019-02-05 14:01:10 +02:00
|
|
|
import
|
2021-04-06 13:33:24 +02:00
|
|
|
"."/[trie_bitseq, trie_defs, db, binaries, trie_utils]
|
2019-02-05 14:01:10 +02:00
|
|
|
|
|
|
|
export
|
2020-04-20 20:14:39 +02:00
|
|
|
trie_utils
|
2019-02-05 14:01:10 +02:00
|
|
|
|
|
|
|
type
|
|
|
|
DB = TrieDatabaseRef
|
|
|
|
|
|
|
|
BinaryTrie* = object
|
|
|
|
db: DB
|
|
|
|
rootHash: TrieNodeKey
|
|
|
|
|
2020-02-05 13:29:54 +01:00
|
|
|
NodeOverrideError* = object of CatchableError
|
2019-02-05 14:01:10 +02:00
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
const
|
|
|
|
zeroHash* = default(seq[byte])
|
2019-02-05 14:01:10 +02:00
|
|
|
|
|
|
|
proc init*(x: typedesc[BinaryTrie], db: DB,
|
2020-04-20 20:14:39 +02:00
|
|
|
rootHash: openArray[byte]): BinaryTrie =
|
2019-02-05 14:01:10 +02:00
|
|
|
checkValidHashZ(rootHash)
|
|
|
|
result.db = db
|
2020-04-20 20:14:39 +02:00
|
|
|
result.rootHash = @(rootHash)
|
2019-02-05 14:01:10 +02:00
|
|
|
|
|
|
|
proc getDB*(t: BinaryTrie): auto = t.db
|
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
proc initBinaryTrie*(db: DB, rootHash: openArray[byte]): BinaryTrie =
|
2019-02-05 14:01:10 +02:00
|
|
|
init(BinaryTrie, db, rootHash)
|
|
|
|
|
|
|
|
proc initBinaryTrie*(db: DB): BinaryTrie =
|
|
|
|
init(BinaryTrie, db, zeroHash)
|
|
|
|
|
|
|
|
proc getRootHash*(self: BinaryTrie): TrieNodeKey {.inline.} =
|
|
|
|
self.rootHash
|
|
|
|
|
|
|
|
template fetchNode(self: BinaryTrie, nodeHash: TrieNodeKey): TrieNode =
|
2019-03-13 23:15:26 +01:00
|
|
|
doAssert(nodeHash.len == 32)
|
2020-04-20 20:14:39 +02:00
|
|
|
parseNode self.db.get(nodeHash)
|
2019-02-05 14:01:10 +02:00
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
proc getAux(self: BinaryTrie, nodeHash: TrieNodeKey, keyPath: TrieBitSeq): seq[byte] =
|
2019-02-05 14:01:10 +02:00
|
|
|
# Empty trie
|
|
|
|
if isZeroHash(nodeHash):
|
2020-04-20 20:14:39 +02:00
|
|
|
return
|
2019-02-05 14:01:10 +02:00
|
|
|
|
|
|
|
let node = self.fetchNode(nodeHash)
|
|
|
|
|
|
|
|
# Key-value node descend
|
|
|
|
if node.kind == LEAF_TYPE:
|
2020-04-20 20:14:39 +02:00
|
|
|
if keyPath.len != 0: return
|
2019-02-05 14:01:10 +02:00
|
|
|
return node.value
|
|
|
|
elif node.kind == KV_TYPE:
|
|
|
|
# keyPath too short
|
2020-04-20 20:14:39 +02:00
|
|
|
if keyPath.len == 0: return
|
2019-02-05 14:01:10 +02:00
|
|
|
let sliceLen = min(node.keyPath.len, keyPath.len)
|
|
|
|
if keyPath[0..<sliceLen] == node.keyPath:
|
|
|
|
return self.getAux(node.child, keyPath.sliceToEnd(node.keyPath.len))
|
|
|
|
else:
|
2020-04-20 20:14:39 +02:00
|
|
|
return
|
2019-02-05 14:01:10 +02:00
|
|
|
# Branch node descend
|
|
|
|
elif node.kind == BRANCH_TYPE:
|
|
|
|
# keyPath too short
|
2020-04-20 20:14:39 +02:00
|
|
|
if keyPath.len == 0: return
|
2019-02-05 14:01:10 +02:00
|
|
|
if keyPath[0]: # first bit == 1
|
|
|
|
return self.getAux(node.rightChild, keyPath.sliceToEnd(1))
|
|
|
|
else:
|
|
|
|
return self.getAux(node.leftChild, keyPath.sliceToEnd(1))
|
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
proc get*(self: BinaryTrie, key: openArray[byte]): seq[byte] {.inline.} =
|
|
|
|
var keyBits = key.bits
|
2019-02-05 14:01:10 +02:00
|
|
|
return self.getAux(self.rootHash, keyBits)
|
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
proc hashAndSave*(self: BinaryTrie, node: openArray[byte]): TrieNodeKey =
|
|
|
|
result = @(keccakHash(node).data)
|
|
|
|
self.db.put(result, node)
|
2019-02-05 14:01:10 +02:00
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
template saveKV(self: BinaryTrie, keyPath: TrieBitSeq | bool, child: openArray[byte]): untyped =
|
2021-12-20 13:14:50 +01:00
|
|
|
self.hashAndSave(encodeKVNode(keyPath, child))
|
2019-02-05 14:01:10 +02:00
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
template saveLeaf(self: BinaryTrie, value: openArray[byte]): untyped =
|
2021-12-20 13:14:50 +01:00
|
|
|
self.hashAndSave(encodeLeafNode(value))
|
2019-02-05 14:01:10 +02:00
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
template saveBranch(self: BinaryTrie, L, R: openArray[byte]): untyped =
|
2021-12-20 13:14:50 +01:00
|
|
|
self.hashAndSave(encodeBranchNode(L, R))
|
2019-02-05 14:01:10 +02:00
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
proc setBranchNode(self: BinaryTrie, keyPath: TrieBitSeq, node: TrieNode,
|
|
|
|
value: openArray[byte], deleteSubtrie = false): TrieNodeKey
|
|
|
|
proc setKVNode(self: BinaryTrie, keyPath: TrieBitSeq, nodeHash: TrieNodeKey,
|
|
|
|
node: TrieNode, value: openArray[byte], deleteSubtrie = false): TrieNodeKey
|
2019-02-05 14:01:10 +02:00
|
|
|
|
|
|
|
const
|
|
|
|
overrideErrorMsg =
|
|
|
|
"Fail to set the value because the prefix of it's key is the same as existing key"
|
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
proc setAux(self: BinaryTrie, nodeHash: TrieNodeKey, keyPath: TrieBitSeq,
|
|
|
|
value: openArray[byte], deleteSubtrie = false): TrieNodeKey =
|
2019-02-05 14:01:10 +02:00
|
|
|
## If deleteSubtrie is set to True, what it will do is that it take in a keyPath
|
|
|
|
## and traverse til the end of keyPath, then delete the whole subtrie of that node.
|
|
|
|
## Note: keyPath should be in binary array format, i.e., encoded by encode_to_bin()
|
|
|
|
|
|
|
|
template checkBadKeyPath(): untyped =
|
|
|
|
# keyPath too short
|
|
|
|
if keyPath.len == 0:
|
|
|
|
if deleteSubtrie: return zeroHash
|
|
|
|
else: raise newException(NodeOverrideError, overrideErrorMsg)
|
|
|
|
|
|
|
|
template ifGoodValue(body: untyped): untyped =
|
|
|
|
if value.len != 0: body
|
|
|
|
else: return zeroHash
|
|
|
|
|
|
|
|
# Empty trie
|
|
|
|
if isZeroHash(nodeHash):
|
|
|
|
ifGoodValue:
|
|
|
|
return self.saveKV(keyPath, self.saveLeaf(value))
|
|
|
|
|
|
|
|
let node = self.fetchNode(nodeHash)
|
|
|
|
|
|
|
|
case node.kind
|
|
|
|
of LEAF_TYPE: # Node is a leaf node
|
|
|
|
# keyPath must match, there should be no remaining keyPath
|
|
|
|
if keyPath.len != 0:
|
|
|
|
raise newException(NodeOverrideError, overrideErrorMsg)
|
|
|
|
if deleteSubtrie: return zeroHash
|
|
|
|
|
|
|
|
ifGoodValue:
|
|
|
|
return self.saveLeaf(value)
|
|
|
|
of KV_TYPE: # node is a key-value node
|
|
|
|
checkBadKeyPath()
|
|
|
|
return self.setKVNode(keyPath, nodeHash, node, value, deleteSubtrie)
|
|
|
|
of BRANCH_TYPE: # node is a branch node
|
|
|
|
checkBadKeyPath()
|
|
|
|
return self.setBranchNode(keyPath, node, value, deleteSubtrie)
|
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
proc set*(self: var BinaryTrie, key, value: openArray[byte]) {.inline.} =
|
2019-02-05 14:01:10 +02:00
|
|
|
## Sets the value at the given keyPath from the given node
|
|
|
|
## Key will be encoded into binary array format first.
|
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
var keyBits = key.bits
|
|
|
|
self.rootHash = self.setAux(self.rootHash, keyBits, value)
|
2019-02-05 14:01:10 +02:00
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
proc setBranchNode(self: BinaryTrie, keyPath: TrieBitSeq, node: TrieNode,
|
|
|
|
value: openArray[byte], deleteSubtrie = false): TrieNodeKey =
|
2019-02-05 14:01:10 +02:00
|
|
|
# Which child node to update? Depends on first bit in keyPath
|
|
|
|
var newLeftChild, newRightChild: TrieNodeKey
|
|
|
|
|
|
|
|
if keyPath[0]: # first bit == 1
|
|
|
|
newRightChild = self.setAux(node.rightChild, keyPath[1..^1], value, deleteSubtrie)
|
|
|
|
newLeftChild = node.leftChild
|
|
|
|
else:
|
|
|
|
newLeftChild = self.setAux(node.leftChild, keyPath[1..^1], value, deleteSubtrie)
|
|
|
|
newRightChild = node.rightChild
|
|
|
|
|
|
|
|
let blankLeft = isZeroHash(newLeftChild)
|
|
|
|
|
|
|
|
# Compress branch node into kv node
|
|
|
|
if blankLeft or isZeroHash(newRightChild):
|
|
|
|
let childNode = if blankLeft: newRightChild else: newLeftChild
|
|
|
|
var subNode = self.fetchNode(childNode)
|
|
|
|
|
|
|
|
# Compress (k1, (k2, NODE)) -> (k1 + k2, NODE)
|
|
|
|
if subNode.kind == KV_TYPE:
|
|
|
|
# exploit subNode.keyPath unused prefix bit
|
|
|
|
# to avoid bitVector concat
|
|
|
|
subNode.keyPath.pushFront(blankLeft)
|
|
|
|
result = self.saveKV(subNode.keyPath, subNode.child)
|
|
|
|
# kv node pointing to a branch node
|
|
|
|
elif subNode.kind in {BRANCH_TYPE, LEAF_TYPE}:
|
|
|
|
result = self.saveKV(blankLeft, childNode)
|
|
|
|
else:
|
|
|
|
result = self.saveBranch(newLeftChild, newRightChild)
|
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
proc setKVNode(self: BinaryTrie, keyPath: TrieBitSeq, nodeHash: TrieNodeKey,
|
|
|
|
node: TrieNode, value: openArray[byte], deleteSubtrie = false): TrieNodeKey =
|
2019-02-05 14:01:10 +02:00
|
|
|
# keyPath prefixes match
|
|
|
|
if deleteSubtrie:
|
|
|
|
if keyPath.len < node.keyPath.len and keyPath == node.keyPath[0..<keyPath.len]:
|
|
|
|
return zeroHash
|
|
|
|
|
|
|
|
let sliceLen = min(node.keyPath.len, keyPath.len)
|
|
|
|
|
|
|
|
if keyPath[0..<sliceLen] == node.keyPath:
|
|
|
|
# Recurse into child
|
|
|
|
let subNodeHash = self.setAux(node.child,
|
|
|
|
keyPath.sliceToEnd(node.keyPath.len), value, deleteSubtrie)
|
|
|
|
|
|
|
|
# If child is empty
|
|
|
|
if isZeroHash(subNodeHash):
|
|
|
|
return zeroHash
|
|
|
|
let subNode = self.fetchNode(subNodeHash)
|
|
|
|
|
|
|
|
# If the child is a key-value node, compress together the keyPaths
|
|
|
|
# into one node
|
|
|
|
if subNode.kind == KV_TYPE:
|
|
|
|
return self.saveKV(node.keyPath & subNode.keyPath, subNode.child)
|
|
|
|
else:
|
|
|
|
return self.saveKV(node.keyPath, subNodeHash)
|
|
|
|
# keyPath prefixes don't match. Here we will be converting a key-value node
|
|
|
|
# of the form (k, CHILD) into a structure of one of the following forms:
|
|
|
|
# 1. (k[:-1], (NEWCHILD, CHILD))
|
|
|
|
# 2. (k[:-1], ((k2, NEWCHILD), CHILD))
|
|
|
|
# 3. (k1, ((k2, CHILD), NEWCHILD))
|
|
|
|
# 4. (k1, ((k2, CHILD), (k2', NEWCHILD))
|
|
|
|
# 5. (CHILD, NEWCHILD)
|
|
|
|
# 6. ((k[1:], CHILD), (k', NEWCHILD))
|
|
|
|
# 7. ((k[1:], CHILD), NEWCHILD)
|
|
|
|
# 8. (CHILD, (k[1:], NEWCHILD))
|
|
|
|
else:
|
|
|
|
let
|
|
|
|
commonPrefixLen = getCommonPrefixLength(node.keyPath, keyPath[0..<sliceLen])
|
|
|
|
cplenPlusOne = commonPrefixLen + 1
|
|
|
|
# New key-value pair can not contain empty value
|
|
|
|
# Or one can not delete non-exist subtrie
|
|
|
|
if value.len == 0 or deleteSubtrie: return nodeHash
|
|
|
|
|
|
|
|
var valNode, oldNode, newSub: TrieNodeKey
|
|
|
|
# valnode: the child node that has the new value we are adding
|
|
|
|
# Case 1: keyPath prefixes almost match, so we are in case (1), (2), (5), (6)
|
|
|
|
if keyPath.len == cplenPlusOne:
|
|
|
|
valNode = self.saveLeaf(value)
|
|
|
|
# Case 2: keyPath prefixes mismatch in the middle, so we need to break
|
|
|
|
# the keyPath in half. We are in case (3), (4), (7), (8)
|
|
|
|
else:
|
|
|
|
if keyPath.len <= commonPrefixLen:
|
|
|
|
raise newException(NodeOverrideError, overrideErrorMsg)
|
|
|
|
valNode = self.saveKV(keyPath[cplenPlusOne..^1], self.saveLeaf(value))
|
|
|
|
|
|
|
|
# oldnode: the child node the has the old child value
|
|
|
|
# Case 1: (1), (3), (5), (6)
|
|
|
|
if node.keyPath.len == cplenPlusOne:
|
|
|
|
oldNode = node.child
|
|
|
|
# (2), (4), (6), (8)
|
|
|
|
else:
|
|
|
|
oldNode = self.saveKV(node.keyPath[cplenPlusOne..^1], node.child)
|
|
|
|
|
|
|
|
# Create the new branch node (because the key paths diverge, there has to
|
|
|
|
# be some "first bit" at which they diverge, so there must be a branch
|
|
|
|
# node somewhere)
|
|
|
|
if keyPath[commonPrefixLen]: # first bit == 1
|
|
|
|
newSub = self.saveBranch(oldNode, valNode)
|
|
|
|
else:
|
|
|
|
newSub = self.saveBranch(valNode, oldNode)
|
|
|
|
|
|
|
|
# Case 1: keyPath prefixes match in the first bit, so we still need
|
|
|
|
# a kv node at the top
|
|
|
|
# (1) (2) (3) (4)
|
|
|
|
if commonPrefixLen != 0:
|
|
|
|
return self.saveKV(node.keyPath[0..<commonPrefixLen], newSub)
|
|
|
|
# Case 2: keyPath prefixes diverge in the first bit, so we replace the
|
|
|
|
# kv node with a branch node
|
|
|
|
# (5) (6) (7) (8)
|
|
|
|
else:
|
|
|
|
return newSub
|
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
template exists*(self: BinaryTrie, key: openArray[byte]): bool =
|
|
|
|
self.get(key) != []
|
2019-02-05 14:01:10 +02:00
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
proc delete*(self: var BinaryTrie, key: openArray[byte]) {.inline.} =
|
2019-02-05 14:01:10 +02:00
|
|
|
## Equals to setting the value to zeroBytesRange
|
2020-04-20 20:14:39 +02:00
|
|
|
var keyBits = key.bits
|
|
|
|
self.rootHash = self.setAux(self.rootHash, keyBits, [])
|
2019-02-05 14:01:10 +02:00
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
proc deleteSubtrie*(self: var BinaryTrie, key: openArray[byte]) {.inline.} =
|
2019-02-05 14:01:10 +02:00
|
|
|
## Given a key prefix, delete the whole subtrie that starts with the key prefix.
|
|
|
|
## Key will be encoded into binary array format first.
|
|
|
|
## It will call `setAux` with `deleteSubtrie` set to true.
|
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
var keyBits = key.bits
|
|
|
|
self.rootHash = self.setAux(self.rootHash, keyBits, [], true)
|
2019-02-05 14:01:10 +02:00
|
|
|
|
|
|
|
# Convenience
|
2020-04-20 20:14:39 +02:00
|
|
|
proc rootNode*(self: BinaryTrie): seq[byte] {.inline.} =
|
|
|
|
self.db.get(self.rootHash)
|
2019-02-05 14:01:10 +02:00
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
proc rootNode*(self: var BinaryTrie, node: openArray[byte]) {.inline.} =
|
|
|
|
self.rootHash = self.hashAndSave(node)
|
2019-02-05 14:01:10 +02:00
|
|
|
|
|
|
|
# Dictionary API
|
2020-04-20 20:14:39 +02:00
|
|
|
template `[]`*(self: BinaryTrie, key: seq[byte]): seq[byte] =
|
2019-02-05 14:01:10 +02:00
|
|
|
self.get(key)
|
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
template `[]=`*(self: var BinaryTrie, key, value: seq[byte]) =
|
2019-02-05 14:01:10 +02:00
|
|
|
self.set(key, value)
|
|
|
|
|
2020-04-20 20:14:39 +02:00
|
|
|
template contains*(self: BinaryTrie, key: seq[byte]): bool =
|
2019-02-05 14:01:10 +02:00
|
|
|
self.exists(key)
|