From b2c85706062d6ce3134ca6a3f02b7d5d9ebb00b9 Mon Sep 17 00:00:00 2001 From: protolambda Date: Fri, 12 Jul 2019 19:09:33 +0200 Subject: [PATCH 1/5] fix merkleization with 0-limit case, and enforce padding limit --- .../pyspec/eth2spec/utils/merkle_minimal.py | 10 ++- .../eth2spec/utils/test_merkle_minimal.py | 81 +++++++++++-------- 2 files changed, 53 insertions(+), 38 deletions(-) diff --git a/test_libs/pyspec/eth2spec/utils/merkle_minimal.py b/test_libs/pyspec/eth2spec/utils/merkle_minimal.py index e9416ea05..972b32d40 100644 --- a/test_libs/pyspec/eth2spec/utils/merkle_minimal.py +++ b/test_libs/pyspec/eth2spec/utils/merkle_minimal.py @@ -1,4 +1,4 @@ -from .hash_function import hash +from eth2spec.utils.hash_function import hash from math import log2 @@ -21,6 +21,8 @@ def calc_merkle_tree_from_leaves(values, layer_count=32): def get_merkle_root(values, pad_to=1): + if pad_to == 0: + return zerohashes[0] layer_count = int(log2(pad_to)) if len(values) == 0: return zerohashes[layer_count] @@ -36,9 +38,11 @@ def get_merkle_proof(tree, item_index): def merkleize_chunks(chunks, pad_to: int=1): - count = len(chunks) + if pad_to == 0: + return zerohashes[0] + count = min(len(chunks), pad_to) depth = max(count - 1, 0).bit_length() - max_depth = max(depth, (pad_to - 1).bit_length()) + max_depth = (pad_to - 1).bit_length() tmp = [None for _ in range(max_depth + 1)] def merge(h, i): diff --git a/test_libs/pyspec/eth2spec/utils/test_merkle_minimal.py b/test_libs/pyspec/eth2spec/utils/test_merkle_minimal.py index f1ed768e6..52e50d57a 100644 --- a/test_libs/pyspec/eth2spec/utils/test_merkle_minimal.py +++ b/test_libs/pyspec/eth2spec/utils/test_merkle_minimal.py @@ -8,7 +8,8 @@ def h(a: bytes, b: bytes) -> bytes: def e(v: int) -> bytes: - return v.to_bytes(length=32, byteorder='little') + # prefix with 0xfff... 
to make it non-zero
+    return b'\xff' * 28 + v.to_bytes(length=4, byteorder='little')
 
 
 def z(i: int) -> bytes:
@@ -16,44 +17,54 @@ def z(i: int) -> bytes:
 
 
 cases = [
-    (0, 0, 1, z(0)),
-    (0, 1, 1, e(0)),
-    (1, 0, 2, h(z(0), z(0))),
-    (1, 1, 2, h(e(0), z(0))),
-    (1, 2, 2, h(e(0), e(1))),
-    (2, 0, 4, h(h(z(0), z(0)), z(1))),
-    (2, 1, 4, h(h(e(0), z(0)), z(1))),
-    (2, 2, 4, h(h(e(0), e(1)), z(1))),
-    (2, 3, 4, h(h(e(0), e(1)), h(e(2), z(0)))),
-    (2, 4, 4, h(h(e(0), e(1)), h(e(2), e(3)))),
-    (3, 0, 8, h(h(h(z(0), z(0)), z(1)), z(2))),
-    (3, 1, 8, h(h(h(e(0), z(0)), z(1)), z(2))),
-    (3, 2, 8, h(h(h(e(0), e(1)), z(1)), z(2))),
-    (3, 3, 8, h(h(h(e(0), e(1)), h(e(2), z(0))), z(2))),
-    (3, 4, 8, h(h(h(e(0), e(1)), h(e(2), e(3))), z(2))),
-    (3, 5, 8, h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), z(0)), z(1)))),
-    (3, 6, 8, h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(z(0), z(0))))),
-    (3, 7, 8, h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(e(6), z(0))))),
-    (3, 8, 8, h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(e(6), e(7))))),
-    (4, 0, 16, h(h(h(h(z(0), z(0)), z(1)), z(2)), z(3))),
-    (4, 1, 16, h(h(h(h(e(0), z(0)), z(1)), z(2)), z(3))),
-    (4, 2, 16, h(h(h(h(e(0), e(1)), z(1)), z(2)), z(3))),
-    (4, 3, 16, h(h(h(h(e(0), e(1)), h(e(2), z(0))), z(2)), z(3))),
-    (4, 4, 16, h(h(h(h(e(0), e(1)), h(e(2), e(3))), z(2)), z(3))),
-    (4, 5, 16, h(h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), z(0)), z(1))), z(3))),
-    (4, 6, 16, h(h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(z(0), z(0)))), z(3))),
-    (4, 7, 16, h(h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(e(6), z(0)))), z(3))),
-    (4, 8, 16, h(h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(e(6), e(7)))), z(3))),
-    (4, 9, 16,
-     h(h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(e(6), e(7)))), h(h(h(e(8), z(0)), z(1)), z(2)))),
+    # limit 0: always zero hash
+    (0, 0, z(0)),
+    (1, 0, z(0)),  # cut-off due to limit
+    (2, 0, z(0)),  # cut-off due to limit
+    # limit 1: padded to 1 element if shorter; the single chunk is then returned as-is (identity)
+    (0, 1, z(0)),
+    (1, 1, e(0)),
+    (2, 1, e(0)),  # cut-off due to limit
+    (1, 1, e(0)),
+    (0, 2, h(z(0), z(0))),
+    (1, 2, h(e(0), z(0))),
+    (2, 2, h(e(0), e(1))),
+    (3, 2, h(e(0), e(1))),  # cut-off due to limit
+    (16, 2, h(e(0), e(1))),  # bigger cut-off due to limit
+    (0, 4, h(h(z(0), z(0)), z(1))),
+    (1, 4, h(h(e(0), z(0)), z(1))),
+    (2, 4, h(h(e(0), e(1)), z(1))),
+    (3, 4, h(h(e(0), e(1)), h(e(2), z(0)))),
+    (4, 4, h(h(e(0), e(1)), h(e(2), e(3)))),
+    (5, 4, h(h(e(0), e(1)), h(e(2), e(3)))),  # cut-off due to limit
+    (0, 8, h(h(h(z(0), z(0)), z(1)), z(2))),
+    (1, 8, h(h(h(e(0), z(0)), z(1)), z(2))),
+    (2, 8, h(h(h(e(0), e(1)), z(1)), z(2))),
+    (3, 8, h(h(h(e(0), e(1)), h(e(2), z(0))), z(2))),
+    (4, 8, h(h(h(e(0), e(1)), h(e(2), e(3))), z(2))),
+    (5, 8, h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), z(0)), z(1)))),
+    (6, 8, h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(z(0), z(0))))),
+    (7, 8, h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(e(6), z(0))))),
+    (8, 8, h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(e(6), e(7))))),
+    (9, 8, h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(e(6), e(7))))),  # cut-off due to limit
+    (0, 16, h(h(h(h(z(0), z(0)), z(1)), z(2)), z(3))),
+    (1, 16, h(h(h(h(e(0), z(0)), z(1)), z(2)), z(3))),
+    (2, 16, h(h(h(h(e(0), e(1)), z(1)), z(2)), z(3))),
+    (3, 16, h(h(h(h(e(0), e(1)), h(e(2), z(0))), z(2)), z(3))),
+    (4, 16, h(h(h(h(e(0), e(1)), h(e(2), e(3))), z(2)), z(3))),
+    (5, 16, h(h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), z(0)), z(1))), z(3))),
+    (6, 16, h(h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(z(0), z(0)))), z(3))),
+    (7, 16, h(h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(e(6), z(0)))), z(3))),
+    (8, 16, h(h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(e(6), e(7)))), z(3))),
+    (9, 16, h(h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(e(6), e(7)))), h(h(h(e(8), z(0)), z(1)), z(2)))),
 ]
 
 
 @pytest.mark.parametrize(
-    'depth,count,pow2,value',
+    'count,pad_to,value',
     cases,
 )
-def test_merkleize_chunks_and_get_merkle_root(depth, count, pow2, value):
+def test_merkleize_chunks_and_get_merkle_root(count, pad_to, value):
     chunks = [e(i) for i in range(count)]
-    assert merkleize_chunks(chunks, pad_to=pow2) == value
-    assert get_merkle_root(chunks, pad_to=pow2) == value
+    assert merkleize_chunks(chunks, pad_to=pad_to) == value
+    assert get_merkle_root(chunks, pad_to=pad_to) == value
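For reference, `merkleize_chunks` as patched above computes the same root as a naive padded merkleization; the incremental version only avoids materializing the padding. A minimal sketch, not part of the patch, assuming SHA-256 chunks and a power-of-two `pad_to >= max(len(chunks), 1)`:

```python
from hashlib import sha256


def hash(x: bytes) -> bytes:
    return sha256(x).digest()


# zerohashes[i] is the root of a depth-i subtree whose leaves are all zero chunks.
zerohashes = [b'\x00' * 32]
for layer in range(1, 32):
    zerohashes.append(hash(zerohashes[layer - 1] + zerohashes[layer - 1]))


def naive_merkle_root(chunks: list, pad_to: int) -> bytes:
    # Pad to the full power-of-two width, then fold pairwise until one root remains.
    layer = list(chunks) + [zerohashes[0]] * (pad_to - len(chunks))
    while len(layer) > 1:
        layer = [hash(layer[i] + layer[i + 1]) for i in range(0, len(layer), 2)]
    return layer[0]
```

The patched implementation instead merges each chunk into at most `max_depth` cached subtree roots and finishes with precomputed zero-hashes, so the virtual padding costs O(log pad_to) rather than O(pad_to).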
From 65b031158297e7ed938af1f73f3919100c3189d6 Mon Sep 17 00:00:00 2001
From: protolambda
Date: Fri, 12 Jul 2019 20:39:55 +0200
Subject: [PATCH 2/5] more explicit about merkleization limit/pad

---
 test_libs/pyspec/eth2spec/utils/merkle_minimal.py | 13 +++++++++----
 test_libs/pyspec/eth2spec/utils/ssz/ssz_impl.py   |  3 ++-
 .../pyspec/eth2spec/utils/test_merkle_minimal.py  |  8 ++++----
 3 files changed, 15 insertions(+), 9 deletions(-)

diff --git a/test_libs/pyspec/eth2spec/utils/merkle_minimal.py b/test_libs/pyspec/eth2spec/utils/merkle_minimal.py
index 972b32d40..503926517 100644
--- a/test_libs/pyspec/eth2spec/utils/merkle_minimal.py
+++ b/test_libs/pyspec/eth2spec/utils/merkle_minimal.py
@@ -37,12 +37,17 @@ def get_merkle_proof(tree, item_index):
     return proof
 
 
-def merkleize_chunks(chunks, pad_to: int=1):
-    if pad_to == 0:
+def merkleize_chunks(chunks, limit=None):
+    # If no limit is defined, we are just merkleizing chunks (e.g. SSZ container).
+    if limit is None:
+        limit = len(chunks)
+    if limit == 0:
         return zerohashes[0]
-    count = min(len(chunks), pad_to)
+    # Limit strictly: it makes no sense to merkleize objects above the intended padding,
+    # and it is illegal to exceed list limits, just as with serialization.
+    count = min(len(chunks), limit)
     depth = max(count - 1, 0).bit_length()
-    max_depth = (pad_to - 1).bit_length()
+    max_depth = (limit - 1).bit_length()
     tmp = [None for _ in range(max_depth + 1)]
 
     def merge(h, i):
diff --git a/test_libs/pyspec/eth2spec/utils/ssz/ssz_impl.py b/test_libs/pyspec/eth2spec/utils/ssz/ssz_impl.py
index d5855a755..5b37a2bb7 100644
--- a/test_libs/pyspec/eth2spec/utils/ssz/ssz_impl.py
+++ b/test_libs/pyspec/eth2spec/utils/ssz/ssz_impl.py
@@ -126,6 +126,7 @@ def item_length(typ: SSZType) -> int:
 
 
 def chunk_count(typ: SSZType) -> int:
+    # Note that for lists, .length *on the type* describes the list limit.
     if isinstance(typ, BasicType):
         return 1
     elif issubclass(typ, Bits):
@@ -150,7 +151,7 @@ def hash_tree_root(obj: SSZValue):
         raise Exception(f"Type not supported: {type(obj)}")
 
     if isinstance(obj, (List, Bytes, Bitlist)):
-        return mix_in_length(merkleize_chunks(leaves, pad_to=chunk_count(obj.type())), len(obj))
+        return mix_in_length(merkleize_chunks(leaves, limit=chunk_count(obj.type())), len(obj))
     else:
         return merkleize_chunks(leaves)
diff --git a/test_libs/pyspec/eth2spec/utils/test_merkle_minimal.py b/test_libs/pyspec/eth2spec/utils/test_merkle_minimal.py
index 52e50d57a..a40ec05cf 100644
--- a/test_libs/pyspec/eth2spec/utils/test_merkle_minimal.py
+++ b/test_libs/pyspec/eth2spec/utils/test_merkle_minimal.py
@@ -61,10 +61,10 @@ cases = [
 
 
 @pytest.mark.parametrize(
-    'count,pad_to,value',
+    'count,limit,value',
     cases,
 )
-def test_merkleize_chunks_and_get_merkle_root(count, pad_to, value):
+def test_merkleize_chunks_and_get_merkle_root(count, limit, value):
     chunks = [e(i) for i in range(count)]
-    assert merkleize_chunks(chunks, pad_to=pad_to) == value
-    assert get_merkle_root(chunks, pad_to=pad_to) == value
+    assert merkleize_chunks(chunks, limit=limit) == value
+    assert get_merkle_root(chunks, pad_to=limit) == value
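To illustrate the new keyword argument in `hash_tree_root`: for a `List[uint64, 1000]` holding `[1, 2, 3]`, `chunk_count` of the type is `(1000 * 8 + 31) // 32 == 250`, independent of the actual length. A sketch using the patched helpers, with illustrative values, not part of the patch:

```python
from eth2spec.utils.hash_function import hash
from eth2spec.utils.merkle_minimal import merkleize_chunks

# Three uint64 values pack into a single 32-byte chunk (zero-padded on the right).
serialized = b''.join(v.to_bytes(8, 'little') for v in (1, 2, 3))
chunks = [serialized.ljust(32, b'\x00')]
root = merkleize_chunks(chunks, limit=250)           # virtually padded to 256 leaves
list_root = hash(root + (3).to_bytes(32, 'little'))  # mix_in_length with the real length
```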
From a8dc9157b8c288a8f2491370762cde89a05dedac Mon Sep 17 00:00:00 2001
From: protolambda
Date: Fri, 12 Jul 2019 21:15:28 +0200
Subject: [PATCH 3/5] clean up merkleization text in SSZ spec

---
 specs/simple-serialize.md | 40 ++++++++++++++++++----------------------
 1 file changed, 18 insertions(+), 22 deletions(-)

diff --git a/specs/simple-serialize.md b/specs/simple-serialize.md
index 8efd08c0a..6c6377843 100644
--- a/specs/simple-serialize.md
+++ b/specs/simple-serialize.md
@@ -25,8 +25,6 @@
     - [Vectors, containers, lists, unions](#vectors-containers-lists-unions)
 - [Deserialization](#deserialization)
 - [Merkleization](#merkleization)
-    - [`Bitvector[N]`](#bitvectorn-1)
-    - [`Bitlist[N]`](#bitlistn-1)
 - [Self-signed containers](#self-signed-containers)
 - [Implementations](#implementations)
 
@@ -177,38 +175,36 @@ Note that deserialization requires hardening against invalid inputs. A non-exhau
 
 We first define helper functions:
 
+* `chunk_count(type)`: calculate the number of leaves for merkleization of the type.
+  * all basic types: `1`
+  * bitlists and bitvectors: `(N + 255) // 256` (dividing by chunk size, rounding up)
+  * lists and vectors of basic types: `(N * item_length(elem_type) + 31) // 32` (dividing by chunk size, rounding up)
+  * lists and vectors of composite types: `N`
+  * containers: `len(fields)`
+* `bitfield_bytes(bits)`: return the bits of the bitlist or bitvector, packed in bytes, aligned to the start, excluding the length-delimiting bit of bitlists.
 * `pack`: Given ordered objects of the same basic type, serialize them, pack them into `BYTES_PER_CHUNK`-byte chunks, right-pad the last chunk with zero bytes, and return the chunks.
 * `next_pow_of_two(i)`: get the next power of 2 of `i`, if not already a power of 2, with 0 mapping to 1. Examples: `0->1, 1->1, 2->2, 3->4, 4->4, 6->8, 9->16`
-* `merkleize(data, pad_for=1)`: Given ordered `BYTES_PER_CHUNK`-byte chunks, if necessary append zero chunks so that the number of chunks is a power of two, Merkleize the chunks, and return the root.
-  * The merkleization depends on the effective input, which can be padded: if `pad_for=L`, then pad the `data` with zeroed chunks to `next_pow_of_two(L)` (virtually for memory efficiency).
+* `merkleize(chunks, limit=None)`: Given ordered `BYTES_PER_CHUNK`-byte chunks, merkleize the chunks, and return the root:
+  * The merkleization depends on the effective input, which can be padded/limited:
+    - if no limit: pad the `chunks` with zeroed chunks to `next_pow_of_two(len(chunks))` (virtually for memory efficiency).
+    - if `limit > len(chunks)`: pad the `chunks` with zeroed chunks to `next_pow_of_two(limit)` (virtually for memory efficiency).
+    - if `limit < len(chunks)`: do not merkleize; the input exceeds the limit, so raise an error instead.
   * Then, merkleize the chunks (empty input is padded to 1 zero chunk):
-    - If `1` chunk: A single chunk is simply that chunk, i.e. the identity when the number of chunks is one.
-    - If `> 1` chunks: pad to `next_pow_of_two(len(chunks))`, merkleize as binary tree.
+    - If `1` chunk: the root is the chunk itself.
+    - If `> 1` chunks: merkleize as binary tree.
 * `mix_in_length`: Given a Merkle root `root` and a length `length` (`"uint256"` little-endian serialization) return `hash(root + length)`.
 * `mix_in_type`: Given a Merkle root `root` and a type_index `type_index` (`"uint256"` little-endian serialization) return `hash(root + type_index)`.
 
 We now define Merkleization `hash_tree_root(value)` of an object `value` recursively:
 
 * `merkleize(pack(value))` if `value` is a basic object or a vector of basic objects.
-* `mix_in_length(merkleize(pack(value), pad_for=(N * elem_size / BYTES_PER_CHUNK)), len(value))` if `value` is a list of basic objects.
+* `merkleize(bitfield_bytes(value), limit=chunk_count(type))` if `value` is a bitvector.
+* `mix_in_length(merkleize(pack(value), limit=chunk_count(type)), len(value))` if `value` is a list of basic objects.
+* `mix_in_length(merkleize(bitfield_bytes(value), limit=chunk_count(type)), len(value))` if `value` is a bitlist.
 * `merkleize([hash_tree_root(element) for element in value])` if `value` is a vector of composite objects or a container.
-* `mix_in_length(merkleize([hash_tree_root(element) for element in value], pad_for=N), len(value))` if `value` is a list of composite objects.
+* `mix_in_length(merkleize([hash_tree_root(element) for element in value], limit=chunk_count(type)), len(value))` if `value` is a list of composite objects.
 * `mix_in_type(merkleize(value.value), value.type_index)` if `value` is of union type.
 
-### `Bitvector[N]`
-
-```python
-as_integer = sum([value[i] << i for i in range(len(value))])
-return merkleize(pack(as_integer.to_bytes((N + 7) // 8, "little")))
-```
-
-### `Bitlist[N]`
-
-```python
-as_integer = sum([value[i] << i for i in range(len(value))])
-return mix_in_length(merkleize(pack(as_integer.to_bytes((N + 7) // 8, "little"))), len(value))
-```
-
 ## Self-signed containers
 
 Let `value` be a self-signed container object. The convention is that the signature (e.g. a `"bytes96"` BLS12-381 signature) be the last field of `value`. Further, the signed message for `value` is `signing_root(value) = hash_tree_root(truncate_last(value))` where `truncate_last` truncates the last element of `value`.
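The spec now names a `bitfield_bytes` helper in place of the removed per-type code blocks. One way to realize it, consistent with the `as_integer` formulas removed above (a sketch, not normative spec text; for bitlists the caller is expected to strip the length-delimiting bit first):

```python
from typing import Sequence


def bitfield_bytes(bits: Sequence[bool]) -> bytes:
    # Pack bits little-endian within each byte, aligned to the start of the byte string.
    as_integer = sum(bit << i for i, bit in enumerate(bits))
    return as_integer.to_bytes((len(bits) + 7) // 8, 'little')
```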
From 5a13684c7f2a9b274d1772ce6aa2db03cb0112fb Mon Sep 17 00:00:00 2001
From: protolambda
Date: Fri, 12 Jul 2019 21:23:45 +0200
Subject: [PATCH 4/5] make exceeding limit raise an error

---
 .../pyspec/eth2spec/utils/merkle_minimal.py   | 10 +++++--
 .../eth2spec/utils/test_merkle_minimal.py     | 23 ++++++++++++-------
 2 files changed, 21 insertions(+), 12 deletions(-)

diff --git a/test_libs/pyspec/eth2spec/utils/merkle_minimal.py b/test_libs/pyspec/eth2spec/utils/merkle_minimal.py
index 503926517..9d7138d7d 100644
--- a/test_libs/pyspec/eth2spec/utils/merkle_minimal.py
+++ b/test_libs/pyspec/eth2spec/utils/merkle_minimal.py
@@ -41,11 +41,15 @@ def merkleize_chunks(chunks, limit=None):
     # If no limit is defined, we are just merkleizing chunks (e.g. SSZ container).
     if limit is None:
         limit = len(chunks)
+
+    count = len(chunks)
+    # Check that the input is within the expected size.
+    # If not, the list limit is set incorrectly, or a value is unexpectedly large.
+    assert count <= limit
+
     if limit == 0:
         return zerohashes[0]
-    # Limit strictly: it makes no sense to merkleize objects above the intended padding,
-    # and it is illegal to exceed list limits, just as with serialization.
-    count = min(len(chunks), limit)
+
     depth = max(count - 1, 0).bit_length()
     max_depth = (limit - 1).bit_length()
     tmp = [None for _ in range(max_depth + 1)]
diff --git a/test_libs/pyspec/eth2spec/utils/test_merkle_minimal.py b/test_libs/pyspec/eth2spec/utils/test_merkle_minimal.py
index a40ec05cf..3746ea6ca 100644
--- a/test_libs/pyspec/eth2spec/utils/test_merkle_minimal.py
+++ b/test_libs/pyspec/eth2spec/utils/test_merkle_minimal.py
@@ -19,24 +19,24 @@ def z(i: int) -> bytes:
 
 cases = [
     # limit 0: always zero hash
     (0, 0, z(0)),
-    (1, 0, z(0)),  # cut-off due to limit
-    (2, 0, z(0)),  # cut-off due to limit
+    (1, 0, None),  # cut-off due to limit
+    (2, 0, None),  # cut-off due to limit
     # limit 1: padded to 1 element if shorter; the single chunk is then returned as-is (identity)
     (0, 1, z(0)),
     (1, 1, e(0)),
-    (2, 1, e(0)),  # cut-off due to limit
+    (2, 1, None),  # cut-off due to limit
     (1, 1, e(0)),
     (0, 2, h(z(0), z(0))),
     (1, 2, h(e(0), z(0))),
     (2, 2, h(e(0), e(1))),
-    (3, 2, h(e(0), e(1))),  # cut-off due to limit
-    (16, 2, h(e(0), e(1))),  # bigger cut-off due to limit
+    (3, 2, None),  # cut-off due to limit
+    (16, 2, None),  # bigger cut-off due to limit
     (0, 4, h(h(z(0), z(0)), z(1))),
     (1, 4, h(h(e(0), z(0)), z(1))),
     (2, 4, h(h(e(0), e(1)), z(1))),
     (3, 4, h(h(e(0), e(1)), h(e(2), z(0)))),
     (4, 4, h(h(e(0), e(1)), h(e(2), e(3)))),
-    (5, 4, h(h(e(0), e(1)), h(e(2), e(3)))),  # cut-off due to limit
+    (5, 4, None),  # cut-off due to limit
     (0, 8, h(h(h(z(0), z(0)), z(1)), z(2))),
     (1, 8, h(h(h(e(0), z(0)), z(1)), z(2))),
     (2, 8, h(h(h(e(0), e(1)), z(1)), z(2))),
@@ -46,7 +46,7 @@ cases = [
     (6, 8, h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(z(0), z(0))))),
     (7, 8, h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(e(6), z(0))))),
     (8, 8, h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(e(6), e(7))))),
-    (9, 8, h(h(h(e(0), e(1)), h(e(2), e(3))), h(h(e(4), e(5)), h(e(6), e(7))))),  # cut-off due to limit
+    (9, 8, None),  # cut-off due to limit
     (0, 16, h(h(h(h(z(0), z(0)), z(1)), z(2)), z(3))),
     (1, 16, h(h(h(h(e(0), z(0)), z(1)), z(2)), z(3))),
     (2, 16, h(h(h(h(e(0), e(1)), z(1)), z(2)), z(3))),
     (3, 16, h(h(h(h(e(0), e(1)), h(e(2), z(0))), z(2)), z(3))),
@@ -66,5 +66,10 @@ cases = [
 )
 def test_merkleize_chunks_and_get_merkle_root(count, limit, value):
     chunks = [e(i) for i in range(count)]
-    assert merkleize_chunks(chunks, limit=limit) == value
-    assert get_merkle_root(chunks, pad_to=limit) == value
+    if value is None:
+        # The input exceeds the limit, so merkleization must be rejected.
+        with pytest.raises(AssertionError):
+            merkleize_chunks(chunks, limit=limit)
+    else:
+        assert merkleize_chunks(chunks, limit=limit) == value
+        assert get_merkle_root(chunks, pad_to=limit) == value
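The new behavior in practice (an illustrative snippet assuming an installed pyspec; not part of the patch):

```python
from eth2spec.utils.merkle_minimal import merkleize_chunks

chunk = b'\xff' * 32
merkleize_chunks([chunk], limit=1)      # at the limit: the root is the chunk itself
merkleize_chunks([chunk] * 3, limit=4)  # under the limit: virtually padded to 4 leaves
try:
    merkleize_chunks([chunk] * 5, limit=4)  # over the limit: now rejected
except AssertionError:
    print("input exceeds limit")
```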
From d9fd1d3a2a4c73148757adf92787f5600807a21c Mon Sep 17 00:00:00 2001
From: protolambda
Date: Mon, 15 Jul 2019 00:12:12 +0200
Subject: [PATCH 5/5] improve type wording based on PR 1292 feedback

---
 specs/simple-serialize.md | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/specs/simple-serialize.md b/specs/simple-serialize.md
index 6c6377843..01440c1cd 100644
--- a/specs/simple-serialize.md
+++ b/specs/simple-serialize.md
@@ -175,11 +175,12 @@ Note that deserialization requires hardening against invalid inputs. A non-exhau
 
 We first define helper functions:
 
+* `size_of(B)`, where `B` is a basic type: the length, in bytes, of the serialized form of the basic type.
 * `chunk_count(type)`: calculate the number of leaves for merkleization of the type.
   * all basic types: `1`
-  * bitlists and bitvectors: `(N + 255) // 256` (dividing by chunk size, rounding up)
-  * lists and vectors of basic types: `(N * item_length(elem_type) + 31) // 32` (dividing by chunk size, rounding up)
-  * lists and vectors of composite types: `N`
+  * `Bitlist[N]` and `Bitvector[N]`: `(N + 255) // 256` (dividing by chunk size, rounding up)
+  * `List[B, N]` and `Vector[B, N]`, where `B` is a basic type: `(N * size_of(B) + 31) // 32` (dividing by chunk size, rounding up)
+  * `List[C, N]` and `Vector[C, N]`, where `C` is a composite type: `N`
   * containers: `len(fields)`
 * `bitfield_bytes(bits)`: return the bits of the bitlist or bitvector, packed in bytes, aligned to the start, excluding the length-delimiting bit of bitlists.
* `pack`: Given ordered objects of the same basic type, serialize them, pack them into `BYTES_PER_CHUNK`-byte chunks, right-pad the last chunk with zero bytes, and return the chunks.
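Worked examples of the reworded rules (a sketch; the `size_of` values follow the spec's basic-type byte sizes, and the concrete type parameters are illustrative):

```python
def size_of(B: str) -> int:
    # Serialized byte length of a basic type, e.g. uint64 -> 8 bytes.
    return {'boolean': 1, 'uint8': 1, 'uint16': 2, 'uint32': 4,
            'uint64': 8, 'uint128': 16, 'uint256': 32}[B]


# chunk_count per the rules above:
assert (2048 + 255) // 256 == 8                      # Bitlist[2048] or Bitvector[2048]
assert (1000 * size_of('uint64') + 31) // 32 == 250  # List[uint64, 1000]
# List[C, 64] or Vector[C, 64] of a composite type C: 64 leaves (one root per element),
# and a container has one leaf per field.
```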