mirror of
https://github.com/status-im/nimbus-eth1.git
synced 2025-01-16 15:25:24 +00:00
932a2140f2
* Exclude some storage tests why: These test running on external dumps slipped through. The particular dumps were reported earlier as somehow dodgy. This was changed in `#1457` but having a second look, the change on hexary_interpolate.nim(350) might be incorrect. * Redesign `Aristo DB` descriptor for transaction based layers why: Previous descriptor layout made it cumbersome to push/pop database delta layers. The new architecture keeps each layer with the full delta set relative to the database backend. * Keep root ID as part of the `Patricia Trie` leaf path why; That way, forests are supported
302 lines
10 KiB
Nim
302 lines
10 KiB
Nim
# nimbus-eth1
|
|
# Copyright (c) 2021 Status Research & Development GmbH
|
|
# Licensed under either of
|
|
# * Apache License, version 2.0, ([LICENSE-APACHE](LICENSE-APACHE) or
|
|
# http://www.apache.org/licenses/LICENSE-2.0)
|
|
# * MIT license ([LICENSE-MIT](LICENSE-MIT) or
|
|
# http://opensource.org/licenses/MIT)
|
|
# at your option. This file may not be copied, modified, or distributed
|
|
# except according to those terms.
|
|
|
|
## Aristo DB -- a Patricia Trie with labeled edges
|
|
## ===============================================
|
|
##
|
|
## These data structures allows to overlay the *Patricia Trie* with *Merkel
|
|
## Trie* hashes. See the `README.md` in the `aristo` folder for documentation.
|
|
##
|
|
## Some semantic explanations;
|
|
##
|
|
## * NodeKey, NodeRef etc. refer to the standard/legacy `Merkel Patricia Tree`
|
|
## * VertexID, VertexRef, etc. refer to the `Aristo Trie`
|
|
##
|
|
{.push raises: [].}
|
|
|
|
import
|
|
std/[sets, strutils, tables],
|
|
eth/[common, trie/nibbles],
|
|
stew/results,
|
|
"."/aristo_error
|
|
|
|
import
|
|
../../sync/snap/range_desc
|
|
export
|
|
ByteArray32, NodeKey, NodeTag, digestTo, hash, to, `==`, `$`
|
|
|
|
type
|
|
VertexID* = distinct uint64
|
|
## Tip of edge towards child object in the `Patricia Trie` logic. It is
|
|
## also the key into the structural table of the `Aristo Trie`.
|
|
|
|
LeafKey* = object
|
|
## Generalised access key for a leaf vertex on a dedicated sub-trie
|
|
## defined by the `root` field. The main trie is the sub-trie with
|
|
## root ID `VertexID(1)`.
|
|
root*: VertexID ## Root ID for the sub-trie
|
|
path*: NodeTag ## Path into the `Patricia Trie`
|
|
|
|
# -------------
|
|
|
|
GetVtxFn* =
|
|
proc(vid: VertexID): Result[VertexRef,AristoError] {.gcsafe, raises: [].}
|
|
## Generic backend database retrieval function for a single structural
|
|
## `Aristo DB` data record.
|
|
|
|
GetKeyFn* =
|
|
proc(vid: VertexID): Result[NodeKey,AristoError] {.gcsafe, raises: [].}
|
|
## Generic backend database retrieval function for a single
|
|
## `Aristo DB` hash lookup value.
|
|
|
|
GetIdgFn* =
|
|
proc(): Result[seq[VertexID],AristoError] {.gcsafe, raises: [].}
|
|
## Generic backend database retrieval function for a the ID generator
|
|
## `Aristo DB` state record.
|
|
|
|
# -------------
|
|
|
|
PutHdlRef* = ref object of RootRef
|
|
## Persistent database transaction frame handle. This handle is used to
|
|
## wrap any of `PutVtxFn`, `PutKeyFn`, and `PutIdgFn` into and atomic
|
|
## transaction frame. These transaction frames must not be interleaved
|
|
## by any library function using the backend.
|
|
|
|
PutBegFn* =
|
|
proc(): PutHdlRef {.gcsafe, raises: [].}
|
|
## Generic transaction initialisation function
|
|
|
|
PutVtxFn* =
|
|
proc(hdl: PutHdlRef; vrps: openArray[(VertexID,VertexRef)])
|
|
{.gcsafe, raises: [].}
|
|
## Generic backend database bulk storage function.
|
|
|
|
PutKeyFn* =
|
|
proc(hdl: PutHdlRef; vkps: openArray[(VertexID,NodeKey)])
|
|
{.gcsafe, raises: [].}
|
|
## Generic backend database bulk storage function.
|
|
|
|
PutIdgFn* =
|
|
proc(hdl: PutHdlRef; vs: openArray[VertexID]) {.gcsafe, raises: [].}
|
|
## Generic backend database ID generator state storage function.
|
|
|
|
PutEndFn* =
|
|
proc(hdl: PutHdlRef): AristoError {.gcsafe, raises: [].}
|
|
## Generic transaction termination function
|
|
|
|
# -------------
|
|
|
|
DelVtxFn* =
|
|
proc(vids: openArray[VertexID])
|
|
{.gcsafe, raises: [].}
|
|
## Generic backend database delete function for the structural
|
|
## `Aristo DB` data records
|
|
|
|
DelKeyFn* =
|
|
proc(vids: openArray[VertexID])
|
|
{.gcsafe, raises: [].}
|
|
## Generic backend database delete function for the `Aristo DB`
|
|
## Merkle hash key mappings.
|
|
|
|
# -------------
|
|
|
|
VertexType* = enum
|
|
## Type of `Aristo Trie` vertex
|
|
Leaf
|
|
Extension
|
|
Branch
|
|
|
|
PayloadType* = enum
|
|
## Type of leaf data (to be extended)
|
|
BlobData ## Generic data, typically RLP encoded
|
|
AccountData ## Legacy `Account` with hash references
|
|
# AristoAccount ## `Aristo account` with vertex IDs links
|
|
|
|
PayloadRef* = ref object
|
|
case pType*: PayloadType
|
|
of BlobData:
|
|
blob*: Blob ## Opaque data value reference
|
|
of AccountData:
|
|
account*: Account ## Expanded accounting data
|
|
|
|
VertexRef* = ref object of RootRef
|
|
## Vertex for building a hexary Patricia or Merkle Patricia Trie
|
|
case vType*: VertexType
|
|
of Leaf:
|
|
lPfx*: NibblesSeq ## Portion of path segment
|
|
lData*: PayloadRef ## Reference to data payload
|
|
of Extension:
|
|
ePfx*: NibblesSeq ## Portion of path segment
|
|
eVid*: VertexID ## Edge to vertex with ID `eVid`
|
|
of Branch:
|
|
bVid*: array[16,VertexID] ## Edge list with vertex IDs
|
|
|
|
NodeRef* = ref object of VertexRef
|
|
## Combined record for a *traditional* ``Merkle Patricia Tree` node merged
|
|
## with a structural `VertexRef` type object.
|
|
error*: AristoError ## Can be used for error signalling
|
|
key*: array[16,NodeKey] ## Merkle hash/es for Branch & Extension
|
|
|
|
AristoBackendRef* = ref object
|
|
## Backend interface.
|
|
getVtxFn*: GetVtxFn ## Read vertex record
|
|
getKeyFn*: GetKeyFn ## Read Merkle hash/key
|
|
getIdgFn*: GetIdgFn ## Read ID generator state
|
|
putBegFn*: PutBegFn ## Start bulk store session
|
|
putVtxFn*: PutVtxFn ## Bulk store vertex records
|
|
putKeyFn*: PutKeyFn ## Bulk store vertex hashes
|
|
putIdgFn*: PutIdgFn ## Store ID generator state
|
|
putEndFn*: PutEndFn ## Commit bulk store session
|
|
delVtxFn*: DelVtxFn ## Bulk delete vertex records
|
|
delKeyFn*: DelKeyFn ## Bulk delete vertex Merkle hashes
|
|
|
|
AristoLayerRef* = ref object
|
|
## Hexary trie database layer structures. Any layer holds the full
|
|
## change relative to the backend.
|
|
sTab*: Table[VertexID,VertexRef] ## Structural vertex table
|
|
lTab*: Table[LeafKey,VertexID] ## Direct access, path to leaf vertex
|
|
kMap*: Table[VertexID,NodeKey] ## Merkle hash key mapping
|
|
dKey*: HashSet[VertexID] ## Locally deleted Merkle hash keys
|
|
pAmk*: Table[NodeKey,VertexID] ## Reverse mapper for data import
|
|
pPrf*: HashSet[VertexID] ## Locked vertices (proof nodes)
|
|
vGen*: seq[VertexID] ## Unique vertex ID generator
|
|
|
|
AristoDb* = object
|
|
## Set of database layers, supporting transaction frames
|
|
top*: AristoLayerRef ## Database working layer
|
|
stack*: seq[AristoLayerRef] ## Stashed parent layers
|
|
backend*: AristoBackendRef ## Backend database (may well be `nil`)
|
|
|
|
# Debugging data below, might go away in future
|
|
xMap*: Table[NodeKey,VertexID] ## For pretty printing, extends `pAmk`
|
|
|
|
static:
|
|
# Not that there is no doubt about this ...
|
|
doAssert NodeKey.default.ByteArray32.initNibbleRange.len == 64
|
|
|
|
# ------------------------------------------------------------------------------
|
|
# Public helpers: `VertexID` scalar data model
|
|
# ------------------------------------------------------------------------------
|
|
|
|
proc `<`*(a, b: VertexID): bool {.borrow.}
|
|
proc `==`*(a, b: VertexID): bool {.borrow.}
|
|
proc cmp*(a, b: VertexID): int {.borrow.}
|
|
proc `$`*(a: VertexID): string = $a.uint64
|
|
|
|
# ------------------------------------------------------------------------------
|
|
# Public helpers: `LeafKey` scalar data model
|
|
# ------------------------------------------------------------------------------
|
|
|
|
proc `<`*(a, b: LeafKey): bool =
|
|
a.root < b.root or (a.root == b.root and a.path < b.path)
|
|
|
|
proc `==`*(a, b: LeafKey): bool =
|
|
a.root == b.root and a.path == b.path
|
|
|
|
proc cmp*(a, b: LeafKey): int =
|
|
if a < b: -1 elif a == b: 0 else: 1
|
|
|
|
proc `$`*(a: LeafKey): string =
|
|
let w = $a.root.uint64.toHex & ":" & $a.path.Uint256.toHex
|
|
w.strip(leading=true, trailing=false, chars={'0'}).toLowerAscii
|
|
|
|
# ------------------------------------------------------------------------------
|
|
# Public helpers: `NodeRef` and `PayloadRef`
|
|
# ------------------------------------------------------------------------------
|
|
|
|
proc `==`*(a, b: PayloadRef): bool =
|
|
## Beware, potential deep comparison
|
|
if a.isNil:
|
|
return b.isNil
|
|
if b.isNil:
|
|
return false
|
|
if unsafeAddr(a) != unsafeAddr(b):
|
|
if a.pType != b.pType:
|
|
return false
|
|
case a.pType:
|
|
of BlobData:
|
|
if a.blob != b.blob:
|
|
return false
|
|
of AccountData:
|
|
if a.account != b.account:
|
|
return false
|
|
true
|
|
|
|
proc `==`*(a, b: VertexRef): bool =
|
|
## Beware, potential deep comparison
|
|
if a.isNil:
|
|
return b.isNil
|
|
if b.isNil:
|
|
return false
|
|
if unsafeAddr(a[]) != unsafeAddr(b[]):
|
|
if a.vType != b.vType:
|
|
return false
|
|
case a.vType:
|
|
of Leaf:
|
|
if a.lPfx != b.lPfx or a.lData != b.lData:
|
|
return false
|
|
of Extension:
|
|
if a.ePfx != b.ePfx or a.eVid != b.eVid:
|
|
return false
|
|
of Branch:
|
|
for n in 0..15:
|
|
if a.bVid[n] != b.bVid[n]:
|
|
return false
|
|
true
|
|
|
|
proc `==`*(a, b: NodeRef): bool =
|
|
## Beware, potential deep comparison
|
|
if a.VertexRef != b.VertexRef:
|
|
return false
|
|
case a.vType:
|
|
of Extension:
|
|
if a.key[0] != b.key[0]:
|
|
return false
|
|
of Branch:
|
|
for n in 0..15:
|
|
if a.bVid[n] != 0.VertexID and a.key[n] != b.key[n]:
|
|
return false
|
|
else:
|
|
discard
|
|
true
|
|
|
|
# ------------------------------------------------------------------------------
|
|
# Public helpers, miscellaneous functions
|
|
# ------------------------------------------------------------------------------
|
|
|
|
proc convertTo*(payload: PayloadRef; T: type Blob): T =
|
|
## Probably lossy conversion as the storage type `kind` gets missing
|
|
case payload.pType:
|
|
of BlobData:
|
|
result = payload.blob
|
|
of AccountData:
|
|
result = rlp.encode payload.account
|
|
|
|
proc to*(node: NodeRef; T: type VertexRef): T =
|
|
## Extract a copy of the `VertexRef` part from a `NodeRef`. For a leaf
|
|
## type, the `lData` payload reference will be a shallow copy, i.e. only
|
|
## the reference pointer is copied.
|
|
case node.vType:
|
|
of Leaf:
|
|
T(vType: Leaf,
|
|
lPfx: node.lPfx,
|
|
lData: node.lData)
|
|
of Extension:
|
|
T(vType: Extension,
|
|
ePfx: node.ePfx,
|
|
eVid: node.eVid)
|
|
of Branch:
|
|
T(vType: Branch,
|
|
bVid: node.bVid)
|
|
|
|
# ------------------------------------------------------------------------------
|
|
# End
|
|
# ------------------------------------------------------------------------------
|