nimbus-eth1/stateless/witness_from_tree.nim

350 lines
11 KiB
Nim
Raw Normal View History

2020-04-21 17:20:39 +07:00
import
stew/[byteutils, endians2],
nimcrypto/[keccak, hash], eth/[common, rlp],
2020-04-21 17:20:39 +07:00
eth/trie/[trie_defs, nibbles, db],
2020-05-14 11:09:01 +07:00
faststreams/outputs,
2020-04-29 12:12:24 +07:00
./witness_types, ../nimbus/constants,
../nimbus/db/storage_types, ./multi_keys
2020-04-21 17:20:39 +07:00
type
DB = TrieDatabaseRef
WitnessBuilder* = object
db*: DB
root: KeccakHash
output: OutputStream
2020-04-29 12:46:50 +07:00
flags: WitnessFlags
2020-04-21 17:20:39 +07:00
StackElem = object
node: seq[byte]
parentGroup: Group
keys: MultikeysRef
depth: int
storageMode: bool
2020-04-29 12:46:50 +07:00
proc initWitnessBuilder*(db: DB, rootHash: KeccakHash, flags: WitnessFlags = {}): WitnessBuilder =
2020-04-21 17:20:39 +07:00
result.db = db
result.root = rootHash
result.output = memoryOutput().s
2020-04-29 12:46:50 +07:00
result.flags = flags
2020-04-21 17:20:39 +07:00
template extensionNodeKey(r: Rlp): auto =
hexPrefixDecode r.listElem(0).toBytes
proc expectHash(r: Rlp): seq[byte] =
result = r.toBytes
if result.len != 32:
raise newException(RlpTypeMismatch,
"RLP expected to be a Keccak hash value, but has an incorrect length")
template getNode(elem: untyped): untyped =
if elem.isList: @(elem.rawData)
else: @(get(wb.db, elem.expectHash))
2020-04-21 17:20:39 +07:00
proc rlpListToBitmask(r: var Rlp): uint =
# only bit 1st to 16th are valid
# the 1st bit is the rightmost bit
var i = 0
for branch in r:
if not branch.isEmpty:
result.setBranchMaskBit(i)
inc i
r.position = 0
2020-05-05 20:27:12 +07:00
template write(wb: var WitnessBuilder, x: untyped) =
2020-05-14 11:09:01 +07:00
wb.output.write(x)
2020-05-05 20:27:12 +07:00
2020-07-21 13:15:06 +07:00
when defined(debugHash):
proc writeU32Impl(wb: var WitnessBuilder, x: uint32) =
wb.write(toBytesBE(x))
2020-05-05 20:27:12 +07:00
2020-07-21 13:15:06 +07:00
template writeU32(wb: var WitnessBuilder, x: untyped) =
wb.writeU32Impl(uint32(x))
2020-05-05 20:27:12 +07:00
template writeByte(wb: var WitnessBuilder, x: untyped) =
wb.write(byte(x))
2020-04-24 15:56:03 +07:00
proc writeUVarint(wb: var WitnessBuilder, x: SomeUnsignedInt) =
# LEB128 varint encoding
var value = x
while true:
var b = value and 0x7F # low order 7 bits of value
value = value shr 7
if value != 0: # more bytes to come
b = b or 0x80 # set high order bit of b
wb.writeByte(b)
if value == 0: break
template writeUVarint32(wb: var WitnessBuilder, x: untyped) =
wb.writeUVarint(uint32(x))
proc writeUVarint(wb: var WitnessBuilder, x: UInt256) =
# LEB128 varint encoding
var value = x
while true:
# we don't truncate to byte here, int will be faster
var b = value.truncate(int) and 0x7F # low order 7 bits of value
value = value shr 7
if value != 0: # more bytes to come
b = b or 0x80 # set high order bit of b
wb.writeByte(b)
if value == 0: break
proc writeNibbles(wb: var WitnessBuilder; n: NibblesSeq, withLen: bool = true) =
# convert the NibblesSeq into left aligned byte seq
# perhaps we can optimize it if the NibblesSeq already left aligned
let nibblesLen = n.len
let numBytes = nibblesLen div 2 + nibblesLen mod 2
var bytes: array[32, byte]
2020-05-07 11:28:11 +07:00
doAssert(nibblesLen >= 1 and nibblesLen <= 64)
for pos in 0..<n.len:
if (pos and 1) != 0:
bytes[pos div 2] = bytes[pos div 2] or n[pos]
else:
bytes[pos div 2] = bytes[pos div 2] or (n[pos] shl 4)
if withLen:
# write nibblesLen
2020-05-05 20:27:12 +07:00
wb.writeByte(nibblesLen)
# write nibbles
2020-05-05 20:27:12 +07:00
wb.write(bytes.toOpenArray(0, numBytes-1))
2020-04-22 18:04:19 +07:00
proc writeExtensionNode(wb: var WitnessBuilder, n: NibblesSeq, depth: int, node: openArray[byte]) =
# write type
2020-05-05 20:27:12 +07:00
wb.writeByte(ExtensionNodeType)
# write nibbles
wb.writeNibbles(n)
2020-04-22 18:04:19 +07:00
when defined(debugDepth):
2020-05-05 20:27:12 +07:00
wb.writeByte(depth)
2020-04-22 18:04:19 +07:00
when defined(debugHash):
2020-05-05 20:27:12 +07:00
wb.write(keccak(node).data)
2020-04-22 18:04:19 +07:00
proc writeBranchNode(wb: var WitnessBuilder, mask: uint, depth: int, node: openArray[byte]) =
# write type
# branch node 17th elem should always empty
doAssert mask.branchMaskBitIsSet(16) == false
2020-05-05 20:27:12 +07:00
wb.writeByte(BranchNodeType)
# write branch mask
# countOnes(branch mask) >= 2 and <= 16
2020-05-05 20:27:12 +07:00
wb.writeByte((mask shr 8) and 0xFF)
wb.writeByte(mask and 0xFF)
2020-04-22 18:04:19 +07:00
when defined(debugDepth):
2020-05-05 20:27:12 +07:00
wb.writeByte(depth)
2020-04-22 18:04:19 +07:00
when defined(debugHash):
2020-05-05 20:27:12 +07:00
wb.write(keccak(node).data)
2020-04-22 18:04:19 +07:00
proc writeHashNode(wb: var WitnessBuilder, node: openArray[byte], depth: int, storageMode: bool) =
# usually a hash node means the recursion will not go deeper
# and the information can be represented by the hash
# for chunked witness, a hash node can be a root to another
# sub-trie in one of the chunks
2020-05-05 20:27:12 +07:00
wb.writeByte(HashNodeType)
if depth >= 9 and storageMode and node[0] == 0.byte:
wb.writeByte(ShortRlpPrefix)
wb.write(node)
proc writeShortRlp(wb: var WitnessBuilder, node: openArray[byte], depth: int, storageMode: bool) =
doAssert(node.len < 32 and depth >= 9 and storageMode)
wb.writeByte(HashNodeType)
wb.writeByte(ShortRlpPrefix)
wb.writeByte(node.len)
2020-05-05 20:27:12 +07:00
wb.write(node)
proc getBranchRecurse(wb: var WitnessBuilder, z: var StackElem) {.raises: [ContractCodeError, IOError, Defect, CatchableError, Exception].}
proc writeByteCode(wb: var WitnessBuilder, kd: KeyData, acc: Account, depth: int) =
2020-05-14 11:09:01 +07:00
if not kd.codeTouched:
# the account have code but not touched by the EVM
# in current block execution
wb.writeByte(CodeUntouched)
let code = get(wb.db, contractHashKey(acc.codeHash).toOpenArray)
if wfEIP170 in wb.flags and code.len > EIP170_MAX_CODE_SIZE:
2020-05-14 11:09:01 +07:00
raise newException(ContractCodeError, "code len exceed EIP170 code size limit")
wb.writeUVarint32(code.len)
wb.writeHashNode(acc.codeHash.data, depth, false)
2020-05-14 11:09:01 +07:00
# no need to write 'code' here
return
wb.writeByte(CodeTouched)
if acc.codeHash == blankStringHash:
# no code
wb.writeUVarint32(0'u32)
2020-05-14 11:09:01 +07:00
return
# the account have code and the EVM use it
let code = get(wb.db, contractHashKey(acc.codeHash).toOpenArray)
if wfEIP170 in wb.flags and code.len > EIP170_MAX_CODE_SIZE:
2020-05-14 11:09:01 +07:00
raise newException(ContractCodeError, "code len exceed EIP170 code size limit")
wb.writeUVarint32(code.len)
2020-05-14 11:09:01 +07:00
wb.write(code)
proc writeStorage(wb: var WitnessBuilder, kd: KeyData, acc: Account, depth: int) =
2020-05-14 11:09:01 +07:00
if kd.storageKeys.isNil:
# the account have storage but not touched by EVM
wb.writeHashNode(acc.storageRoot.data, depth, true)
2020-05-14 11:09:01 +07:00
elif acc.storageRoot != emptyRlpHash:
# the account have storage and the EVM use it
var zz = StackElem(
node: wb.db.get(acc.storageRoot.data),
parentGroup: kd.storageKeys.initGroup(),
keys: kd.storageKeys,
depth: 0, # set depth to zero
storageMode: true # switch to storage mode
)
getBranchRecurse(wb, zz)
else:
# no storage at all
wb.writeHashNode(emptyRlpHash.data, depth, true)
2020-05-14 11:09:01 +07:00
proc writeAccountNode(wb: var WitnessBuilder, kd: KeyData, acc: Account,
node: openArray[byte], depth: int) {.raises: [ContractCodeError, IOError, Defect, CatchableError, Exception].} =
# write type
2020-05-05 20:27:12 +07:00
wb.writeByte(AccountNodeType)
when defined(debugHash):
2020-05-05 20:27:12 +07:00
wb.writeU32(node.len)
wb.write(node)
2020-04-22 18:04:19 +07:00
when defined(debugDepth):
2020-05-05 20:27:12 +07:00
wb.writeByte(depth)
2020-04-22 18:04:19 +07:00
var accountType = if acc.codeHash == blankStringHash and acc.storageRoot == emptyRlpHash: SimpleAccountType
else: ExtendedAccountType
2020-05-05 20:27:12 +07:00
wb.writeByte(accountType)
wb.write(kd.address)
wb.writeUVarint(acc.balance)
wb.writeUVarint(acc.nonce)
if accountType != SimpleAccountType:
wb.writeByteCode(kd, acc, depth)
wb.writeStorage(kd, acc, depth)
2020-05-14 11:09:01 +07:00
#0x00 address:<Address> balance:<Bytes32> nonce:<Bytes32>
#0x01 address:<Address> balance:<Bytes32> nonce:<Bytes32> bytecode:<Bytecode> storage:<Tree_Node(0,1)>
2020-05-14 11:09:01 +07:00
proc writeAccountStorageLeafNode(wb: var WitnessBuilder, key: openArray[byte], val: UInt256, node: openArray[byte], depth: int) =
2020-05-05 20:27:12 +07:00
wb.writeByte(StorageLeafNodeType)
when defined(debugHash):
2020-05-05 20:27:12 +07:00
wb.writeU32(node.len)
wb.write(node)
when defined(debugDepth):
2020-05-05 20:27:12 +07:00
wb.writeByte(depth)
2020-05-05 20:27:12 +07:00
wb.write(key)
wb.write(val.toBytesBE)
2020-04-22 18:04:19 +07:00
2020-05-14 11:09:01 +07:00
#<Storage_Leaf_Node(d<65)> := key:<Bytes32> val:<Bytes32>
2020-04-22 18:04:19 +07:00
proc getBranchRecurse(wb: var WitnessBuilder, z: var StackElem) =
if z.node.len == 0: return
if z.node.len < 32:
writeShortRlp(wb, z.node, z.depth, z.storageMode)
return
var nodeRlp = rlpFromBytes z.node
2020-04-21 17:20:39 +07:00
case nodeRlp.listLen
of 2:
let (isLeaf, k) = nodeRlp.extensionNodeKey
let mg = groups(z.keys, z.depth, k, z.parentGroup)
if not mg.match:
# return immediately if there is no match
writeHashNode(wb, keccak(z.node).data, z.depth, z.storageMode)
return
let value = nodeRlp.listElem(1)
if not isLeaf:
# recursion will go deeper depend on the common-prefix length nibbles
writeExtensionNode(wb, k, z.depth, z.node)
var zz = StackElem(
node: value.getNode,
parentGroup: mg.group,
keys: z.keys,
2020-05-07 22:03:00 +07:00
depth: z.depth + k.len, # increase the depth by k.len
storageMode: z.storageMode
)
getBranchRecurse(wb, zz)
return
# there should be only one match
2020-05-24 11:40:01 +07:00
let kd = z.keys.visitMatch(mg, z.depth)
if z.storageMode:
doAssert(kd.storageMode)
2020-05-14 11:09:01 +07:00
writeAccountStorageLeafNode(wb, kd.storageSlot, value.toBytes.decode(UInt256), z.node, z.depth)
else:
doAssert(not kd.storageMode)
2020-05-14 11:09:01 +07:00
writeAccountNode(wb, kd, value.toBytes.decode(Account), z.node, z.depth)
2020-04-21 17:20:39 +07:00
of 17:
let branchMask = rlpListToBitmask(nodeRlp)
writeBranchNode(wb, branchMask, z.depth, z.node)
2020-04-22 18:04:19 +07:00
# if there is a match in any branch elem
# 1st to 16th, the recursion will go deeper
# by one nibble
2020-05-07 22:03:00 +07:00
doAssert(z.depth != 64) # notLeaf or path.len == 0
let path = groups(z.keys, z.parentGroup, z.depth)
for i in nonEmpty(branchMask):
let branch = nodeRlp.listElem(i)
if branchMaskBitIsSet(path.mask, i):
# it is a match between multikeys and Branch Node elem
var zz = StackElem(
node: branch.getNode,
parentGroup: path.groups[i],
keys: z.keys,
2020-05-07 22:03:00 +07:00
depth: z.depth + 1, # increase the depth by one
storageMode: z.storageMode
)
getBranchRecurse(wb, zz)
2020-05-07 22:03:00 +07:00
continue
if branch.isList:
writeShortRlp(wb, branch.rawData, z.depth, z.storageMode)
else:
2020-05-07 22:03:00 +07:00
# if branch elem not empty and not a match, emit hash
writeHashNode(wb, branch.expectHash, z.depth, z.storageMode)
# 17th elem should always empty
# 17th elem appear in yellow paper but never in
# the actual ethereum state trie
# the 17th elem also not included in block witness spec
doAssert branchMask.branchMaskBitIsSet(16) == false
2020-04-21 17:20:39 +07:00
else:
raise newException(CorruptedTrieDatabase,
"HexaryTrie node with an unexpected number of children")
proc buildWitness*(wb: var WitnessBuilder, keys: MultikeysRef): seq[byte]
{.raises: [ContractCodeError, IOError, Defect, CatchableError, Exception].} =
2020-05-03 08:47:14 +07:00
# witness version
2020-05-05 20:27:12 +07:00
wb.writeByte(BlockWitnessVersion)
# one or more trees
# we only output one big tree here
# the condition to split the big tree into chunks of sub-tries
# is not clear in the spec
2020-05-05 20:27:12 +07:00
wb.writeByte(MetadataNothing)
var z = StackElem(
node: @(wb.db.get(wb.root.data)),
parentGroup: keys.initGroup(),
keys: keys,
2020-05-07 22:03:00 +07:00
depth: 0, # always start with a zero depth
storageMode: false # build account witness first
)
getBranchRecurse(wb, z)
# result
result = wb.output.getOutput(seq[byte])