Add hexary tree implementation

This commit is contained in:
Vitalik Buterin 2018-10-09 18:12:41 -04:00
parent c23dcd4ab8
commit d7fd0aa4a5
No known key found for this signature in database
GPG Key ID: A99D082A6179F987
3 changed files with 146 additions and 0 deletions

View File

@ -1,5 +1,6 @@
import new_bintrie as t1 import new_bintrie as t1
import new_bintrie_optimized as t2 import new_bintrie_optimized as t2
import new_bintrie_hex as t3
import time import time
import binascii import binascii
@ -27,3 +28,18 @@ for k in keys[:500]:
for k in keys[-500:]: for k in keys[-500:]:
assert t2.get(d, r, k) == b'\x00' * 32 assert t2.get(d, r, k) == b'\x00' * 32
print("Reads: %d" % d.reads) print("Reads: %d" % d.reads)
d = t3.EphemDB()
r = t3.new_tree(d)
a = time.time()
for k in keys[:1000]:
r = t3.update(d, r, k, k)
print("DB-optimized bintree time to update: %.4f" % (time.time() - a))
print("Root: %s" % binascii.hexlify(r))
print("Writes: %d, reads: %d" % (d.writes, d.reads))
d.reads = 0
for k in keys[:500]:
assert t3.get(d, r, k) == k
for k in keys[-500:]:
assert t3.get(d, r, k) == b'\x00' * 32
print("Reads: %d" % d.reads)

View File

@ -0,0 +1,125 @@
from ethereum.utils import sha3, encode_hex
class EphemDB():
def __init__(self, kv=None):
self.reads = 0
self.writes = 0
self.kv = kv or {}
def get(self, k):
self.reads += 1
return self.kv.get(k, None)
def put(self, k, v):
self.writes += 1
self.kv[k] = v
def delete(self, k):
del self.kv[k]
# Hashes of empty subtrees
zerohashes = [b'\x00' * 32]
for i in range(256):
zerohashes.insert(0, sha3(zerohashes[0] + zerohashes[0]))
# Create a new empty tree
def new_tree(db):
return zerohashes[0]
# Convert a binary key into an integer path value
def key_to_path(k):
return int.from_bytes(k, 'big')
tt256m1 = 2**256 - 1
# And convert back
def path_to_key(k):
return (k & tt256m1).to_bytes(32, 'big')
# Read a key from a given tree
def get(db, root, key):
v = root
path = key_to_path(key)
for i in range(0, 256, 4):
if v == zerohashes[i]:
return b'\x00' * 32
child = db.get(v)
if len(child) == 65:
if (path % 2**256) == key_to_path(child[1:33]):
return child[33:]
else:
return b'\x00' * 32
else:
index = (path >> 252) & 15
v = child[32*index: 32*index+32]
path <<= 4
return v
# Make a root hash of a (sub)tree with a single key/value pair
def make_single_key_hash(path, depth, value):
if depth == 256:
return value
elif (path >> 255) & 1:
return sha3(zerohashes[depth+1] + make_single_key_hash(path << 1, depth + 1, value))
else:
return sha3(make_single_key_hash(path << 1, depth + 1, value) + zerohashes[depth+1])
# Hash together 16 elements
def hash_16_els(vals):
assert len(vals) == 16
for _ in range(4):
vals = [sha3(vals[i] + vals[i+1]) for i in range(0, len(vals), 2)]
return vals[0]
# Make a root hash of a (sub)tree with two key/value pairs, and save intermediate nodes in the DB
def make_double_key_hash(db, path1, path2, depth, value1, value2):
if depth == 256:
raise Exception("Cannot fit two values into one slot!")
if ((path1 >> 252) & 15) == ((path2 >> 252) & 15):
children = [zerohashes[depth+4]] * 16
children[(path1 >> 252) & 15] = make_double_key_hash(db, path1 << 4, path2 << 4, depth + 4, value1, value2)
else:
Lkey = ((path1 >> 252) & 15)
L = make_single_key_hash(path1 << 4, depth + 4, value1)
Rkey = ((path2 >> 252) & 15)
R = make_single_key_hash(path2 << 4, depth + 4, value2)
db.put(L, b'\x01' + path_to_key(path1 << 4) + value1)
db.put(R, b'\x01' + path_to_key(path2 << 4) + value2)
children = [zerohashes[depth+4]] * 16
children[Lkey] = L
children[Rkey] = R
h = hash_16_els(children)
db.put(h, b''.join(children))
return h
# Update a tree with a given key/value pair
def update(db, root, key, value):
return _update(db, root, key_to_path(key), 0, value)
def _update(db, root, path, depth, value):
if depth == 256:
return value
# Update an empty subtree: make a single-key subtree
if root == zerohashes[depth]:
k = make_single_key_hash(path, depth, value)
db.put(k, b'\x01' + path_to_key(path) + value)
return k
child = db.get(root)
# Update a single-key subtree: make a double-key subtree
if len(child) == 65:
origpath, origvalue = key_to_path(child[1:33]), child[33:]
return make_double_key_hash(db, path, origpath, depth, value, origvalue)
# Update a multi-key subtree: recurse down
else:
assert len(child) == 512
index = (path >> 252) & 15
new_value = _update(db, child[index*32: index*32+32], path << 4, depth + 4, value)
new_children = [new_value if i == index else child[32*i:32*i+32] for i in range(16)]
h = hash_16_els(new_children)
db.put(h, b''.join(new_children))
return h
def multi_update(db, root, keys, values):
for k, v in zip(keys, values):
root = update(db, root, k, v)
return root

View File

@ -119,3 +119,8 @@ def _update(db, root, path, depth, value):
new_child = _update(db, child[:32], path << 1, depth + 1, value) + child[32:] new_child = _update(db, child[:32], path << 1, depth + 1, value) + child[32:]
db.put(sha3(new_child), new_child) db.put(sha3(new_child), new_child)
return sha3(new_child) return sha3(new_child)
def multi_update(db, root, keys, values):
for k, v in zip(keys, values):
root = update(db, root, k, v)
return root