158 lines
4.9 KiB
Python
Raw Normal View History

2019-06-20 19:57:50 +02:00
from ..merkle_minimal import merkleize_chunks
from ..hash_function import hash
2019-06-20 19:51:38 +02:00
from .ssz_typing import (
SSZValue, SSZType, BasicValue, BasicType, Series, Elements, Bits, boolean, Container, List, ByteList,
Bitlist, Bitvector, uint,
)
2019-05-25 00:05:03 +02:00
# SSZ Serialization
# -----------------------------
2019-05-25 00:05:03 +02:00
# Width, in bytes, of each little-endian offset that encode_series writes
# in place of a variable-size element.
BYTES_PER_LENGTH_OFFSET = 4
2019-06-20 19:57:50 +02:00
def serialize_basic(value: SSZValue):
    """Serialize a basic SSZ value (``uint`` or ``boolean``) to bytes.

    A ``uint`` is encoded little-endian using the byte length declared by its
    type; a ``boolean`` is encoded as the single byte 0x01 or 0x00.

    Raises:
        Exception: if ``value`` is neither a ``uint`` nor a ``boolean``.
    """
    if isinstance(value, uint):
        width = value.type().byte_len
        return value.to_bytes(width, 'little')
    if isinstance(value, boolean):
        return b'\x01' if value else b'\x00'
    raise Exception(f"Type not supported: {type(value)}")
2019-05-30 09:42:42 -04:00
2019-06-20 19:57:50 +02:00
def deserialize_basic(value, typ: BasicType):
    """Deserialize the bytes ``value`` into an instance of the basic type ``typ``.

    Args:
        value: serialized bytes of a single basic value.
        typ: target type; a subclass of ``uint`` or ``boolean``.

    Returns:
        ``typ`` built from the little-endian integer (for ``uint``) or from the
        decoded truth value (for ``boolean``).

    Raises:
        AssertionError: if a boolean is encoded as anything but 0x00 or 0x01.
        Exception: if ``typ`` is neither a ``uint`` nor a ``boolean`` subclass.
    """
    if issubclass(typ, uint):
        return typ(int.from_bytes(value, 'little'))
    elif issubclass(typ, boolean):
        # Raise explicitly instead of using `assert`: assert statements are
        # removed under `python -O`, which would let a malformed byte decode
        # silently to False. The exception type is kept for existing callers.
        if value not in (b'\x00', b'\x01'):
            raise AssertionError(f"Invalid boolean encoding: {value!r}")
        return typ(value == b'\x01')
    else:
        raise Exception(f"Type not supported: {typ}")
2019-05-25 14:06:42 -04:00
2019-07-25 17:32:27 +08:00
def is_zero(obj: SSZValue):
    """Return whether ``obj`` equals the default value of its own type."""
    default_value = type(obj).default()
    return default_value == obj
2019-06-05 15:29:26 +02:00
2019-06-20 19:57:50 +02:00
def serialize(obj: SSZValue):
    """Serialize a supported SSZ value to bytes.

    Dispatch, in order:
      * basic values go through ``serialize_basic``;
      * a ``Bitvector`` is emitted as its ``as_bytes()`` output;
      * a ``Bitlist`` is its ``as_bytes()`` output plus one extra set bit
        placed at bit index ``len(obj)`` to delimit the length;
      * any other ``Series`` goes through ``encode_series``.

    Raises:
        Exception: if ``obj`` matches none of the kinds above.
    """
    if isinstance(obj, BasicValue):
        return serialize_basic(obj)
    if isinstance(obj, Bitvector):
        return obj.as_bytes()
    if isinstance(obj, Bitlist):
        buf = bytearray(obj.as_bytes())
        byte_index, bit_index = divmod(len(obj), 8)
        if bit_index == 0:
            # The data bits fill whole bytes: the delimiter needs a byte of its own
            buf.append(1)
        else:
            # Set the delimiter bit right after the last data bit
            buf[byte_index] |= 1 << bit_index
        return bytes(buf)
    if isinstance(obj, Series):
        return encode_series(obj)
    raise Exception(f"Type not supported: {type(obj)}")
2019-06-20 19:57:50 +02:00
def encode_series(values: Series):
    """Serialize a series of SSZ values into one byte string.

    ``bytes`` input is returned unchanged. Otherwise every element is
    serialized; fixed-size elements are written inline, while each
    variable-size element is represented in the fixed section by a
    little-endian offset of ``BYTES_PER_LENGTH_OFFSET`` bytes, with its data
    appended after the fixed section.

    Raises:
        AssertionError: if the total output length does not fit in an offset.
    """
    if isinstance(values, bytes):  # ByteList and ByteVector are already like serialized output
        return values

    # Recursively serialize, remembering whether each element's type is fixed-size
    encoded = [(elem.type().is_fixed_size(), serialize(elem)) for elem in values]

    # Compute the size of the fixed section (inline data + offsets) and of the variable section
    fixed_total = 0
    variable_total = 0
    for is_fixed, data in encoded:
        if is_fixed:
            fixed_total += len(data)
        else:
            fixed_total += BYTES_PER_LENGTH_OFFSET
            variable_total += len(data)

    # Check if integer is not out of bounds (Python)
    assert fixed_total + variable_total < 2 ** (BYTES_PER_LENGTH_OFFSET * 8)

    # Interleave offsets of variable-size parts with fixed-size parts,
    # tracking a running offset so the computation stays linear.
    next_offset = fixed_total
    head = []
    tail = []
    for is_fixed, data in encoded:
        if is_fixed:
            head.append(data)
            continue
        head.append(next_offset.to_bytes(BYTES_PER_LENGTH_OFFSET, 'little'))
        tail.append(data)
        next_offset += len(data)

    # Fixed section (with offsets interleaved) first, then the variable-size data
    return b''.join(head + tail)
2019-05-25 00:05:03 +02:00
2019-05-25 14:06:42 -04:00
# SSZ Hash-tree-root
# -----------------------------
2019-06-20 19:57:50 +02:00
def pack(values: Series):
    """Pack a series of basic values into one contiguous byte string.

    ``bytes`` input is returned unchanged, ``Bits`` input is returned as its
    ``as_bytes()`` output, and anything else is the concatenation of
    ``serialize_basic`` applied to every element.
    """
    if isinstance(values, bytes):  # ByteList and ByteVector are already packed
        return values
    if isinstance(values, Bits):
        # Bits are packed into bytes, left-aligned.
        # For bitlists the length-delimiting bit is excluded.
        return values.as_bytes()
    return b''.join(map(serialize_basic, values))
2019-05-25 14:06:42 -04:00
2019-05-25 14:06:42 -04:00
def chunkify(bytez):
    """Split ``bytez`` into 32-byte chunks, zero-padding the final chunk.

    The argument is never modified: the padding is added to a new object, so
    a mutable ``bytearray`` passed by the caller keeps its original contents.

    Args:
        bytez: bytes-like data of any length.

    Returns:
        List of 32-byte chunks; an empty list when ``bytez`` is empty.
    """
    # Use `+` rather than `+=`: augmented assignment would extend a bytearray
    # argument in place and leak the padding back to the caller.
    padded = bytez + b'\x00' * (-len(bytez) % 32)
    return [padded[i:i + 32] for i in range(0, len(padded), 32)]
2019-05-25 14:06:42 -04:00
def mix_in_length(root, length):
    """Hash ``root`` concatenated with ``length`` as a 32-byte little-endian integer.

    ``hash`` here is the function imported at the top of this module, not the
    Python builtin.
    """
    length_bytes = length.to_bytes(32, 'little')
    return hash(root + length_bytes)
2019-06-20 19:57:50 +02:00
def is_bottom_layer_kind(typ: SSZType):
    """Return whether ``typ`` is a basic type or an ``Elements`` type of basic elements."""
    if isinstance(typ, BasicType):
        return True
    return issubclass(typ, Elements) and isinstance(typ.elem_type, BasicType)
2019-06-20 19:57:50 +02:00
def item_length(typ: SSZType) -> int:
    """Return ``typ.byte_len`` for ``BasicValue`` subclasses, and 32 for any other type."""
    return typ.byte_len if issubclass(typ, BasicValue) else 32
2019-05-28 14:33:12 -04:00
2019-06-20 19:57:50 +02:00
def chunk_count(typ: SSZType) -> int:
    """Return the number of 32-byte chunks that values of ``typ`` occupy.

    Note that for lists, ``.length`` *on the type* describes the list limit.

    Raises:
        Exception: if ``typ`` is not a basic, ``Bits``, ``Elements`` or
            ``Container`` type.
    """
    if isinstance(typ, BasicType):
        return 1
    if issubclass(typ, Bits):
        # 256 bits per chunk, rounded up
        return (typ.length + 255) // 256
    if issubclass(typ, Elements):
        # Total byte size of all elements, rounded up to whole chunks
        total_bytes = typ.length * item_length(typ.elem_type)
        return (total_bytes + 31) // 32
    if issubclass(typ, Container):
        # One chunk per field
        return len(typ.get_fields())
    raise Exception(f"Type not supported: {typ}")
def hash_tree_root(obj: SSZValue):
    """Compute the hash-tree-root of an SSZ value.

    Leaves are the packed 32-byte chunks for basic values and for series of
    basic elements, or the hash-tree-roots of the elements otherwise. The
    leaves are merkleized; for ``List``, ``ByteList`` and ``Bitlist`` values
    the merkleization is limited to the chunk count of the type and the
    length of the value is mixed into the resulting root.

    Raises:
        Exception: if ``obj`` is neither a ``Series`` nor a ``BasicValue``.
    """
    if isinstance(obj, Series):
        if is_bottom_layer_kind(obj.type()):
            chunks = chunkify(pack(obj))
        else:
            chunks = [hash_tree_root(element) for element in obj]
    elif isinstance(obj, BasicValue):
        chunks = chunkify(serialize_basic(obj))
    else:
        raise Exception(f"Type not supported: {type(obj)}")

    if not isinstance(obj, (List, ByteList, Bitlist)):
        return merkleize_chunks(chunks)

    # List kinds: merkleize up to the type's limit, then mix in the actual length
    limit = chunk_count(obj.type())
    root = merkleize_chunks(chunks, limit=limit)
    return mix_in_length(root, len(obj))