mirror of
https://github.com/status-im/research.git
synced 2025-01-13 00:24:08 +00:00
Add hexary tree implementation
This commit is contained in:
parent
c23dcd4ab8
commit
d7fd0aa4a5
@ -1,5 +1,6 @@
|
|||||||
import new_bintrie as t1
|
import new_bintrie as t1
|
||||||
import new_bintrie_optimized as t2
|
import new_bintrie_optimized as t2
|
||||||
|
import new_bintrie_hex as t3
|
||||||
import time
|
import time
|
||||||
import binascii
|
import binascii
|
||||||
|
|
||||||
@ -27,3 +28,18 @@ for k in keys[:500]:
|
|||||||
for k in keys[-500:]:
|
for k in keys[-500:]:
|
||||||
assert t2.get(d, r, k) == b'\x00' * 32
|
assert t2.get(d, r, k) == b'\x00' * 32
|
||||||
print("Reads: %d" % d.reads)
|
print("Reads: %d" % d.reads)
|
||||||
|
|
||||||
|
d = t3.EphemDB()
|
||||||
|
r = t3.new_tree(d)
|
||||||
|
a = time.time()
|
||||||
|
for k in keys[:1000]:
|
||||||
|
r = t3.update(d, r, k, k)
|
||||||
|
print("DB-optimized bintree time to update: %.4f" % (time.time() - a))
|
||||||
|
print("Root: %s" % binascii.hexlify(r))
|
||||||
|
print("Writes: %d, reads: %d" % (d.writes, d.reads))
|
||||||
|
d.reads = 0
|
||||||
|
for k in keys[:500]:
|
||||||
|
assert t3.get(d, r, k) == k
|
||||||
|
for k in keys[-500:]:
|
||||||
|
assert t3.get(d, r, k) == b'\x00' * 32
|
||||||
|
print("Reads: %d" % d.reads)
|
||||||
|
125
trie_research/bintrie2/new_bintrie_hex.py
Normal file
125
trie_research/bintrie2/new_bintrie_hex.py
Normal file
@ -0,0 +1,125 @@
|
|||||||
|
from ethereum.utils import sha3, encode_hex
|
||||||
|
|
||||||
|
class EphemDB():
|
||||||
|
def __init__(self, kv=None):
|
||||||
|
self.reads = 0
|
||||||
|
self.writes = 0
|
||||||
|
self.kv = kv or {}
|
||||||
|
|
||||||
|
def get(self, k):
|
||||||
|
self.reads += 1
|
||||||
|
return self.kv.get(k, None)
|
||||||
|
|
||||||
|
def put(self, k, v):
|
||||||
|
self.writes += 1
|
||||||
|
self.kv[k] = v
|
||||||
|
|
||||||
|
def delete(self, k):
|
||||||
|
del self.kv[k]
|
||||||
|
|
||||||
|
# Hashes of empty subtrees
|
||||||
|
zerohashes = [b'\x00' * 32]
|
||||||
|
for i in range(256):
|
||||||
|
zerohashes.insert(0, sha3(zerohashes[0] + zerohashes[0]))
|
||||||
|
|
||||||
|
# Create a new empty tree
|
||||||
|
def new_tree(db):
|
||||||
|
return zerohashes[0]
|
||||||
|
|
||||||
|
# Convert a binary key into an integer path value
|
||||||
|
def key_to_path(k):
|
||||||
|
return int.from_bytes(k, 'big')
|
||||||
|
|
||||||
|
tt256m1 = 2**256 - 1
|
||||||
|
|
||||||
|
# And convert back
|
||||||
|
def path_to_key(k):
|
||||||
|
return (k & tt256m1).to_bytes(32, 'big')
|
||||||
|
|
||||||
|
# Read a key from a given tree
|
||||||
|
def get(db, root, key):
|
||||||
|
v = root
|
||||||
|
path = key_to_path(key)
|
||||||
|
for i in range(0, 256, 4):
|
||||||
|
if v == zerohashes[i]:
|
||||||
|
return b'\x00' * 32
|
||||||
|
child = db.get(v)
|
||||||
|
if len(child) == 65:
|
||||||
|
if (path % 2**256) == key_to_path(child[1:33]):
|
||||||
|
return child[33:]
|
||||||
|
else:
|
||||||
|
return b'\x00' * 32
|
||||||
|
else:
|
||||||
|
index = (path >> 252) & 15
|
||||||
|
v = child[32*index: 32*index+32]
|
||||||
|
path <<= 4
|
||||||
|
return v
|
||||||
|
|
||||||
|
# Make a root hash of a (sub)tree with a single key/value pair
|
||||||
|
def make_single_key_hash(path, depth, value):
|
||||||
|
if depth == 256:
|
||||||
|
return value
|
||||||
|
elif (path >> 255) & 1:
|
||||||
|
return sha3(zerohashes[depth+1] + make_single_key_hash(path << 1, depth + 1, value))
|
||||||
|
else:
|
||||||
|
return sha3(make_single_key_hash(path << 1, depth + 1, value) + zerohashes[depth+1])
|
||||||
|
|
||||||
|
# Hash together 16 elements
|
||||||
|
def hash_16_els(vals):
|
||||||
|
assert len(vals) == 16
|
||||||
|
for _ in range(4):
|
||||||
|
vals = [sha3(vals[i] + vals[i+1]) for i in range(0, len(vals), 2)]
|
||||||
|
return vals[0]
|
||||||
|
|
||||||
|
# Make a root hash of a (sub)tree with two key/value pairs, and save intermediate nodes in the DB
|
||||||
|
def make_double_key_hash(db, path1, path2, depth, value1, value2):
|
||||||
|
if depth == 256:
|
||||||
|
raise Exception("Cannot fit two values into one slot!")
|
||||||
|
if ((path1 >> 252) & 15) == ((path2 >> 252) & 15):
|
||||||
|
children = [zerohashes[depth+4]] * 16
|
||||||
|
children[(path1 >> 252) & 15] = make_double_key_hash(db, path1 << 4, path2 << 4, depth + 4, value1, value2)
|
||||||
|
else:
|
||||||
|
Lkey = ((path1 >> 252) & 15)
|
||||||
|
L = make_single_key_hash(path1 << 4, depth + 4, value1)
|
||||||
|
Rkey = ((path2 >> 252) & 15)
|
||||||
|
R = make_single_key_hash(path2 << 4, depth + 4, value2)
|
||||||
|
db.put(L, b'\x01' + path_to_key(path1 << 4) + value1)
|
||||||
|
db.put(R, b'\x01' + path_to_key(path2 << 4) + value2)
|
||||||
|
children = [zerohashes[depth+4]] * 16
|
||||||
|
children[Lkey] = L
|
||||||
|
children[Rkey] = R
|
||||||
|
h = hash_16_els(children)
|
||||||
|
db.put(h, b''.join(children))
|
||||||
|
return h
|
||||||
|
|
||||||
|
# Update a tree with a given key/value pair
|
||||||
|
def update(db, root, key, value):
|
||||||
|
return _update(db, root, key_to_path(key), 0, value)
|
||||||
|
|
||||||
|
def _update(db, root, path, depth, value):
|
||||||
|
if depth == 256:
|
||||||
|
return value
|
||||||
|
# Update an empty subtree: make a single-key subtree
|
||||||
|
if root == zerohashes[depth]:
|
||||||
|
k = make_single_key_hash(path, depth, value)
|
||||||
|
db.put(k, b'\x01' + path_to_key(path) + value)
|
||||||
|
return k
|
||||||
|
child = db.get(root)
|
||||||
|
# Update a single-key subtree: make a double-key subtree
|
||||||
|
if len(child) == 65:
|
||||||
|
origpath, origvalue = key_to_path(child[1:33]), child[33:]
|
||||||
|
return make_double_key_hash(db, path, origpath, depth, value, origvalue)
|
||||||
|
# Update a multi-key subtree: recurse down
|
||||||
|
else:
|
||||||
|
assert len(child) == 512
|
||||||
|
index = (path >> 252) & 15
|
||||||
|
new_value = _update(db, child[index*32: index*32+32], path << 4, depth + 4, value)
|
||||||
|
new_children = [new_value if i == index else child[32*i:32*i+32] for i in range(16)]
|
||||||
|
h = hash_16_els(new_children)
|
||||||
|
db.put(h, b''.join(new_children))
|
||||||
|
return h
|
||||||
|
|
||||||
|
def multi_update(db, root, keys, values):
|
||||||
|
for k, v in zip(keys, values):
|
||||||
|
root = update(db, root, k, v)
|
||||||
|
return root
|
@ -119,3 +119,8 @@ def _update(db, root, path, depth, value):
|
|||||||
new_child = _update(db, child[:32], path << 1, depth + 1, value) + child[32:]
|
new_child = _update(db, child[:32], path << 1, depth + 1, value) + child[32:]
|
||||||
db.put(sha3(new_child), new_child)
|
db.put(sha3(new_child), new_child)
|
||||||
return sha3(new_child)
|
return sha3(new_child)
|
||||||
|
|
||||||
|
def multi_update(db, root, keys, values):
|
||||||
|
for k, v in zip(keys, values):
|
||||||
|
root = update(db, root, k, v)
|
||||||
|
return root
|
||||||
|
Loading…
x
Reference in New Issue
Block a user