Directory Restructure (#1163)

* Move tests -> testing * Directory restructure * Update Cargo.toml during restructure * Update Makefile during restructure * Fix arbitrary path
2026-04-18 21:38:31 +00:00 · 2020-05-18 21:24:23 +10:00
parent c571afb8d8
commit 4331834003
358 changed files with 217 additions and 229 deletions
--- a/consensus/tree_hash/src/impls.rs
+++ b/consensus/tree_hash/src/impls.rs
@@ -0,0 +1,180 @@
+use super::*;
+use ethereum_types::{H256, U128, U256};
+
+fn int_to_hash256(int: u64) -> Hash256 {
+    let mut bytes = [0; HASHSIZE];
+    bytes[0..8].copy_from_slice(&int.to_le_bytes());
+    Hash256::from_slice(&bytes)
+}
+
+macro_rules! impl_for_bitsize {
+    ($type: ident, $bit_size: expr) => {
+        impl TreeHash for $type {
+            fn tree_hash_type() -> TreeHashType {
+                TreeHashType::Basic
+            }
+
+            fn tree_hash_packed_encoding(&self) -> Vec<u8> {
+                self.to_le_bytes().to_vec()
+            }
+
+            fn tree_hash_packing_factor() -> usize {
+                HASHSIZE / ($bit_size / 8)
+            }
+
+            #[allow(clippy::cast_lossless)]
+            fn tree_hash_root(&self) -> Hash256 {
+                int_to_hash256(*self as u64)
+            }
+        }
+    };
+}
+
+impl_for_bitsize!(u8, 8);
+impl_for_bitsize!(u16, 16);
+impl_for_bitsize!(u32, 32);
+impl_for_bitsize!(u64, 64);
+impl_for_bitsize!(usize, 64);
+
+impl TreeHash for bool {
+    fn tree_hash_type() -> TreeHashType {
+        TreeHashType::Basic
+    }
+
+    fn tree_hash_packed_encoding(&self) -> Vec<u8> {
+        (*self as u8).tree_hash_packed_encoding()
+    }
+
+    fn tree_hash_packing_factor() -> usize {
+        u8::tree_hash_packing_factor()
+    }
+
+    fn tree_hash_root(&self) -> Hash256 {
+        int_to_hash256(*self as u64)
+    }
+}
+
+/// Only valid for byte types less than 32 bytes.
+macro_rules! impl_for_lt_32byte_u8_array {
+    ($len: expr) => {
+        impl TreeHash for [u8; $len] {
+            fn tree_hash_type() -> TreeHashType {
+                TreeHashType::Vector
+            }
+
+            fn tree_hash_packed_encoding(&self) -> Vec<u8> {
+                unreachable!("bytesN should never be packed.")
+            }
+
+            fn tree_hash_packing_factor() -> usize {
+                unreachable!("bytesN should never be packed.")
+            }
+
+            fn tree_hash_root(&self) -> Hash256 {
+                let mut result = [0; 32];
+                result[0..$len].copy_from_slice(&self[..]);
+                Hash256::from_slice(&result)
+            }
+        }
+    };
+}
+
+impl_for_lt_32byte_u8_array!(4);
+impl_for_lt_32byte_u8_array!(32);
+
+impl TreeHash for U128 {
+    fn tree_hash_type() -> TreeHashType {
+        TreeHashType::Basic
+    }
+
+    fn tree_hash_packed_encoding(&self) -> Vec<u8> {
+        let mut result = vec![0; 16];
+        self.to_little_endian(&mut result);
+        result
+    }
+
+    fn tree_hash_packing_factor() -> usize {
+        2
+    }
+
+    fn tree_hash_root(&self) -> Hash256 {
+        let mut result = [0; HASHSIZE];
+        self.to_little_endian(&mut result[0..16]);
+        Hash256::from_slice(&result)
+    }
+}
+
+impl TreeHash for U256 {
+    fn tree_hash_type() -> TreeHashType {
+        TreeHashType::Basic
+    }
+
+    fn tree_hash_packed_encoding(&self) -> Vec<u8> {
+        let mut result = vec![0; 32];
+        self.to_little_endian(&mut result);
+        result
+    }
+
+    fn tree_hash_packing_factor() -> usize {
+        1
+    }
+
+    fn tree_hash_root(&self) -> Hash256 {
+        let mut result = [0; 32];
+        self.to_little_endian(&mut result[..]);
+        Hash256::from_slice(&result)
+    }
+}
+
+impl TreeHash for H256 {
+    fn tree_hash_type() -> TreeHashType {
+        TreeHashType::Vector
+    }
+
+    fn tree_hash_packed_encoding(&self) -> Vec<u8> {
+        self.as_bytes().to_vec()
+    }
+
+    fn tree_hash_packing_factor() -> usize {
+        1
+    }
+
+    fn tree_hash_root(&self) -> Hash256 {
+        *self
+    }
+}
+
+#[cfg(test)]
+mod test {
+    use super::*;
+
+    #[test]
+    fn bool() {
+        let mut true_bytes: Vec<u8> = vec![1];
+        true_bytes.append(&mut vec![0; 31]);
+
+        let false_bytes: Vec<u8> = vec![0; 32];
+
+        assert_eq!(true.tree_hash_root().as_bytes(), true_bytes.as_slice());
+        assert_eq!(false.tree_hash_root().as_bytes(), false_bytes.as_slice());
+    }
+
+    #[test]
+    fn int_to_bytes() {
+        assert_eq!(int_to_hash256(0).as_bytes(), &[0; 32]);
+        assert_eq!(
+            int_to_hash256(1).as_bytes(),
+            &[
+                1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
+                0, 0, 0, 0
+            ]
+        );
+        assert_eq!(
+            int_to_hash256(u64::max_value()).as_bytes(),
+            &[
+                255, 255, 255, 255, 255, 255, 255, 255, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
+                0, 0, 0, 0, 0, 0, 0, 0, 0, 0
+            ]
+        );
+    }
+}
--- a/consensus/tree_hash/src/lib.rs
+++ b/consensus/tree_hash/src/lib.rs
@@ -0,0 +1,162 @@
+pub mod impls;
+mod merkle_hasher;
+mod merkleize_padded;
+mod merkleize_standard;
+
+pub use merkle_hasher::{Error, MerkleHasher};
+pub use merkleize_padded::merkleize_padded;
+pub use merkleize_standard::merkleize_standard;
+
+use eth2_hashing::{Context, SHA256};
+use eth2_hashing::{ZERO_HASHES, ZERO_HASHES_MAX_INDEX};
+
+pub const BYTES_PER_CHUNK: usize = 32;
+pub const HASHSIZE: usize = 32;
+pub const MERKLE_HASH_CHUNK: usize = 2 * BYTES_PER_CHUNK;
+
+pub type Hash256 = ethereum_types::H256;
+
+/// Convenience method for `MerkleHasher` which also provides some fast-paths for small trees.
+///
+/// `minimum_leaf_count` will only be used if it is greater than or equal to the minimum number of leaves that can be created from `bytes`.
+pub fn merkle_root(bytes: &[u8], minimum_leaf_count: usize) -> Hash256 {
+    let leaves = std::cmp::max(
+        (bytes.len() + (HASHSIZE - 1)) / HASHSIZE,
+        minimum_leaf_count,
+    );
+
+    if leaves == 0 {
+        // If there are no bytes then the hash is always zero.
+        Hash256::zero()
+    } else if leaves == 1 {
+        // If there is only one leaf, the hash is always those leaf bytes padded out to 32-bytes.
+        let mut hash = [0; HASHSIZE];
+        hash[0..bytes.len()].copy_from_slice(bytes);
+        Hash256::from_slice(&hash)
+    } else if leaves == 2 {
+        // If there are only two leaves (this is common with BLS pubkeys), we can avoid some
+        // overhead with `MerkleHasher` and just do a simple 3-node tree here.
+        let mut leaves = [0; HASHSIZE * 2];
+        leaves[0..bytes.len()].copy_from_slice(bytes);
+
+        let mut context = Context::new(&SHA256);
+        context.update(&leaves);
+        let digest = context.finish();
+
+        Hash256::from_slice(digest.as_ref())
+    } else {
+        // If there are 3 or more leaves, use `MerkleHasher`.
+        let mut hasher = MerkleHasher::with_leaves(leaves);
+        hasher
+            .write(bytes)
+            .expect("the number of leaves is adequate for the number of bytes");
+        hasher
+            .finish()
+            .expect("the number of leaves is adequate for the number of bytes")
+    }
+}
+
+/// Returns the node created by hashing `root` and `length`.
+///
+/// Used in `TreeHash` for inserting the length of a list above it's root.
+pub fn mix_in_length(root: &Hash256, length: usize) -> Hash256 {
+    let usize_len = std::mem::size_of::<usize>();
+
+    let mut length_bytes = [0; BYTES_PER_CHUNK];
+    length_bytes[0..usize_len].copy_from_slice(&length.to_le_bytes());
+
+    Hash256::from_slice(&eth2_hashing::hash32_concat(root.as_bytes(), &length_bytes)[..])
+}
+
+/// Returns a cached padding node for a given height.
+fn get_zero_hash(height: usize) -> &'static [u8] {
+    if height <= ZERO_HASHES_MAX_INDEX {
+        &ZERO_HASHES[height]
+    } else {
+        panic!("Tree exceeds MAX_TREE_DEPTH of {}", ZERO_HASHES_MAX_INDEX)
+    }
+}
+
+#[derive(Debug, PartialEq, Clone)]
+pub enum TreeHashType {
+    Basic,
+    Vector,
+    List,
+    Container,
+}
+
+pub trait TreeHash {
+    fn tree_hash_type() -> TreeHashType;
+
+    fn tree_hash_packed_encoding(&self) -> Vec<u8>;
+
+    fn tree_hash_packing_factor() -> usize;
+
+    fn tree_hash_root(&self) -> Hash256;
+}
+
+#[macro_export]
+macro_rules! tree_hash_ssz_encoding_as_vector {
+    ($type: ident) => {
+        impl tree_hash::TreeHash for $type {
+            fn tree_hash_type() -> tree_hash::TreeHashType {
+                tree_hash::TreeHashType::Vector
+            }
+
+            fn tree_hash_packed_encoding(&self) -> Vec<u8> {
+                unreachable!("Vector should never be packed.")
+            }
+
+            fn tree_hash_packing_factor() -> usize {
+                unreachable!("Vector should never be packed.")
+            }
+
+            fn tree_hash_root(&self) -> Vec<u8> {
+                tree_hash::merkle_root(&ssz::ssz_encode(self))
+            }
+        }
+    };
+}
+
+#[macro_export]
+macro_rules! tree_hash_ssz_encoding_as_list {
+    ($type: ident) => {
+        impl tree_hash::TreeHash for $type {
+            fn tree_hash_type() -> tree_hash::TreeHashType {
+                tree_hash::TreeHashType::List
+            }
+
+            fn tree_hash_packed_encoding(&self) -> Vec<u8> {
+                unreachable!("List should never be packed.")
+            }
+
+            fn tree_hash_packing_factor() -> usize {
+                unreachable!("List should never be packed.")
+            }
+
+            fn tree_hash_root(&self) -> Vec<u8> {
+                ssz::ssz_encode(self).tree_hash_root()
+            }
+        }
+    };
+}
+
+#[cfg(test)]
+mod test {
+    use super::*;
+
+    #[test]
+    fn mix_length() {
+        let hash = {
+            let mut preimage = vec![42; BYTES_PER_CHUNK];
+            preimage.append(&mut vec![42]);
+            preimage.append(&mut vec![0; BYTES_PER_CHUNK - 1]);
+            eth2_hashing::hash(&preimage)
+        };
+
+        assert_eq!(
+            mix_in_length(&Hash256::from_slice(&[42; BYTES_PER_CHUNK]), 42).as_bytes(),
+            &hash[..]
+        );
+    }
+}
--- a/consensus/tree_hash/src/merkle_hasher.rs
+++ b/consensus/tree_hash/src/merkle_hasher.rs
@@ -0,0 +1,573 @@
+use crate::{get_zero_hash, Hash256, HASHSIZE};
+use eth2_hashing::{Context, Digest, SHA256};
+use smallvec::{smallvec, SmallVec};
+use std::mem;
+
+type SmallVec8<T> = SmallVec<[T; 8]>;
+
+#[derive(Clone, Debug, PartialEq)]
+pub enum Error {
+    /// The maximum number of leaves defined by the initialization `depth` has been exceed.
+    MaximumLeavesExceeded { max_leaves: usize },
+}
+
+/// Helper struct to store either a hash digest or a slice.
+///
+/// Should be used as a left or right value for some node.
+enum Preimage<'a> {
+    Digest(Digest),
+    Slice(&'a [u8]),
+}
+
+impl<'a> Preimage<'a> {
+    /// Returns a 32-byte slice.
+    fn as_bytes(&self) -> &[u8] {
+        match self {
+            Preimage::Digest(digest) => digest.as_ref(),
+            Preimage::Slice(slice) => slice,
+        }
+    }
+}
+
+/// A node that has had a left child supplied, but not a right child.
+struct HalfNode {
+    /// The hasher context.
+    context: Context,
+    /// The tree id of the node. The root node has in id of `1` and ids increase moving down the
+    /// tree from left to right.
+    id: usize,
+}
+
+impl HalfNode {
+    /// Create a new half-node from the given `left` value.
+    fn new(id: usize, left: Preimage) -> Self {
+        let mut context = Context::new(&SHA256);
+        context.update(left.as_bytes());
+
+        Self { context, id }
+    }
+
+    /// Complete the half-node by providing a `right` value. Returns a digest of the left and right
+    /// nodes.
+    fn finish(mut self, right: Preimage) -> Digest {
+        self.context.update(right.as_bytes());
+        self.context.finish()
+    }
+}
+
+/// Provides a Merkle-root hasher that allows for streaming bytes (i.e., providing any-length byte
+/// slices without need to separate into leaves). Efficiently handles cases where not all leaves
+/// have been provided by assuming all non-provided leaves are `[0; 32]` and pre-computing the
+/// zero-value hashes at all depths of the tree.
+///
+/// This algorithm aims to allocate as little memory as possible and it does this by "folding" up
+/// the tree has each leaf is provided. Consider this step-by-step functional diagram of hashing a
+/// tree with depth three:
+///
+/// ## Functional Diagram
+///
+/// Nodes that are `-` have not been defined and do not occupy memory. Nodes that are `L` are
+/// leaves that are provided but are not stored. Nodes that have integers (`1`, `2`) are stored in
+/// our struct. Finally, nodes that are `X` were stored, but are now removed.
+///
+/// ### Start
+///
+/// ```ignore
+///           -
+///          / \
+///         -   -
+///        / \ / \
+///       -  - -  -
+/// ```
+///
+/// ### Provide first leaf
+///
+/// ```ignore
+///           -
+///          / \
+///         2   -
+///        / \ / \
+///       L  - -  -
+/// ```
+///
+/// ### Provide second leaf
+///
+/// ```ignore
+///           1
+///          / \
+///         X   -
+///        / \ / \
+///       L  L -  -
+/// ```
+///
+/// ### Provide third leaf
+///
+/// ```ignore
+///           1
+///          / \
+///         X   3
+///        / \ / \
+///       L  L L  -
+/// ```
+///
+/// ### Provide fourth and final leaf
+///
+/// ```ignore
+///           1
+///          / \
+///         X   X
+///        / \ / \
+///       L  L L  L
+/// ```
+///
+pub struct MerkleHasher {
+    /// Stores the nodes that are half-complete and awaiting a right node.
+    ///
+    /// A smallvec of size 8 means we can hash a tree with 256 leaves without allocating on the
+    /// heap. Each half-node is 224 bytes, so this smallvec may store 1,792 bytes on the stack.
+    half_nodes: SmallVec8<HalfNode>,
+    /// The depth of the tree that will be produced.
+    ///
+    /// Depth is counted top-down (i.e., the root node is at depth 0). A tree with 1 leaf has a
+    /// depth of 1, a tree with 4 leaves has a depth of 3.
+    depth: usize,
+    /// The next leaf that we are expecting to process.
+    next_leaf: usize,
+    /// A buffer of bytes that are waiting to be written to a leaf.
+    buffer: SmallVec<[u8; 32]>,
+    /// Set to Some(root) when the root of the tree is known.
+    root: Option<Hash256>,
+}
+
+/// Returns the parent of node with id `i`.
+fn get_parent(i: usize) -> usize {
+    i / 2
+}
+
+/// Gets the depth of a node with an id of `i`.
+///
+/// It is a logic error to provide `i == 0`.
+///
+/// E.g., if `i` is 1, depth is 0. If `i` is is 1, depth is 1.
+fn get_depth(i: usize) -> usize {
+    let total_bits = mem::size_of::<usize>() * 8;
+    total_bits - i.leading_zeros() as usize - 1
+}
+
+impl MerkleHasher {
+    /// Instantiate a hasher for a tree with a given number of leaves.
+    ///
+    /// `num_leaves` will be rounded to the next power of two. E.g., if `num_leaves == 6`, then the
+    /// tree will _actually_ be able to accomodate 8 leaves and the resulting hasher is exactly the
+    /// same as one that was instantiated with `Self::with_leaves(8)`.
+    ///
+    /// ## Notes
+    ///
+    /// If `num_leaves == 0`, a tree of depth 1 will be created. If no leaves are provided it will
+    /// return a root of `[0; 32]`.
+    pub fn with_leaves(num_leaves: usize) -> Self {
+        let depth = get_depth(num_leaves.next_power_of_two()) + 1;
+        Self::with_depth(depth)
+    }
+
+    /// Instantiates a new, empty hasher for a tree with `depth` layers which will have capacity
+    /// for `1 << (depth - 1)` leaf nodes.
+    ///
+    /// It is not possible to grow the depth of the tree after instantiation.
+    ///
+    /// ## Panics
+    ///
+    /// Panics if `depth == 0`.
+    fn with_depth(depth: usize) -> Self {
+        assert!(depth > 0, "merkle tree cannot have a depth of zero");
+
+        Self {
+            half_nodes: SmallVec::with_capacity(depth - 1),
+            depth,
+            next_leaf: 1 << (depth - 1),
+            buffer: SmallVec::with_capacity(32),
+            root: None,
+        }
+    }
+
+    /// Write some bytes to the hasher.
+    ///
+    /// ## Errors
+    ///
+    /// Returns an error if the given bytes would create a leaf that would exceed the maximum
+    /// permissible number of leaves defined by the initialization `depth`. E.g., a tree of `depth
+    /// == 2` can only accept 2 leaves. A tree of `depth == 14` can only accept 8,192 leaves.
+    pub fn write(&mut self, bytes: &[u8]) -> Result<(), Error> {
+        let mut ptr = 0;
+        while ptr <= bytes.len() {
+            let slice = &bytes[ptr..std::cmp::min(bytes.len(), ptr + HASHSIZE)];
+
+            if self.buffer.is_empty() && slice.len() == HASHSIZE {
+                self.process_leaf(slice)?;
+                ptr += HASHSIZE
+            } else if self.buffer.len() + slice.len() < HASHSIZE {
+                self.buffer.extend_from_slice(slice);
+                ptr += HASHSIZE
+            } else {
+                let buf_len = self.buffer.len();
+                let required = HASHSIZE - buf_len;
+
+                let mut leaf = [0; HASHSIZE];
+                leaf[..buf_len].copy_from_slice(&self.buffer);
+                leaf[buf_len..].copy_from_slice(&slice[0..required]);
+
+                self.process_leaf(&leaf)?;
+                self.buffer = smallvec![];
+
+                ptr += required
+            }
+        }
+
+        Ok(())
+    }
+
+    /// Process the next leaf in the tree.
+    ///
+    /// ## Errors
+    ///
+    /// Returns an error if the given leaf would exceed the maximum permissible number of leaves
+    /// defined by the initialization `depth`. E.g., a tree of `depth == 2` can only accept 2
+    /// leaves. A tree of `depth == 14` can only accept 8,192 leaves.
+    fn process_leaf(&mut self, leaf: &[u8]) -> Result<(), Error> {
+        assert_eq!(leaf.len(), HASHSIZE, "a leaf must be 32 bytes");
+
+        let max_leaves = 1 << (self.depth + 1);
+
+        if self.next_leaf > max_leaves {
+            return Err(Error::MaximumLeavesExceeded { max_leaves });
+        } else if self.next_leaf == 1 {
+            // A tree of depth one has a root that is equal to the first given leaf.
+            self.root = Some(Hash256::from_slice(leaf))
+        } else if self.next_leaf % 2 == 0 {
+            self.process_left_node(self.next_leaf, Preimage::Slice(leaf))
+        } else {
+            self.process_right_node(self.next_leaf, Preimage::Slice(leaf))
+        }
+
+        self.next_leaf += 1;
+
+        Ok(())
+    }
+
+    /// Returns the root of the Merkle tree.
+    ///
+    /// If not all leaves have been provided, the tree will be efficiently completed under the
+    /// assumption that all not-yet-provided leaves are equal to `[0; 32]`.
+    ///
+    /// ## Errors
+    ///
+    /// Returns an error if the bytes remaining in the buffer would create a leaf that would exceed
+    /// the maximum permissible number of leaves defined by the initialization `depth`.
+    pub fn finish(mut self) -> Result<Hash256, Error> {
+        if !self.buffer.is_empty() {
+            let mut leaf = [0; HASHSIZE];
+            leaf[..self.buffer.len()].copy_from_slice(&self.buffer);
+            self.process_leaf(&leaf)?
+        }
+
+        // If the tree is incomplete, we must complete it by providing zero-hashes.
+        loop {
+            if let Some(root) = self.root {
+                break Ok(root);
+            } else if let Some(node) = self.half_nodes.last() {
+                let right_child = node.id * 2 + 1;
+                self.process_right_node(right_child, self.zero_hash(right_child));
+            } else if self.next_leaf == 1 {
+                // The next_leaf can only be 1 if the tree has a depth of one. If have been no
+                // leaves supplied, assume a root of zero.
+                break Ok(Hash256::zero());
+            } else {
+                // The only scenario where there are (a) no half nodes and (b) a tree of depth
+                // two or more is where no leaves have been supplied at all.
+                //
+                // Once we supply this first zero-hash leaf then all future operations will be
+                // triggered via the `process_right_node` branch.
+                self.process_left_node(self.next_leaf, self.zero_hash(self.next_leaf))
+            }
+        }
+    }
+
+    /// Process a node that will become the left-hand node of some parent. The supplied `id` is
+    /// that of the node (not the parent). The `preimage` is the value of the node (i.e., if this
+    /// is a leaf node it will be the value of that leaf).
+    ///
+    /// In this scenario, the only option is to push a new half-node.
+    fn process_left_node(&mut self, id: usize, preimage: Preimage) {
+        self.half_nodes
+            .push(HalfNode::new(get_parent(id), preimage))
+    }
+
+    /// Process a node that will become the right-hand node of some parent. The supplied `id` is
+    /// that of the node (not the parent). The `preimage` is the value of the node (i.e., if this
+    /// is a leaf node it will be the value of that leaf).
+    ///
+    /// This operation will always complete one node, then it will attempt to crawl up the tree and
+    /// collapse and other viable nodes. For example, consider a tree of depth 3 (see diagram
+    /// below). When providing the node with id `7`, the node with id `3` will be completed which
+    /// will also provide the right-node for the `1` node. This function will complete both of
+    /// those nodes and ultimately find the root of the tree.
+    ///
+    /// ```ignore
+    ///           1 <-- completed
+    ///          / \
+    ///         2   3  <-- completed
+    ///        / \ / \
+    ///       4  5 6  7 <-- supplied right node
+    /// ```
+    fn process_right_node(&mut self, id: usize, mut preimage: Preimage) {
+        let mut parent = get_parent(id);
+
+        loop {
+            match self.half_nodes.last() {
+                Some(node) if node.id == parent => {
+                    preimage = Preimage::Digest(
+                        self.half_nodes
+                            .pop()
+                            .expect("if .last() is Some then .pop() must succeed")
+                            .finish(preimage),
+                    );
+                    if parent == 1 {
+                        self.root = Some(Hash256::from_slice(preimage.as_bytes()));
+                        break;
+                    } else {
+                        parent = get_parent(parent);
+                    }
+                }
+                _ => {
+                    self.half_nodes.push(HalfNode::new(parent, preimage));
+                    break;
+                }
+            }
+        }
+    }
+
+    /// Returns a "zero hash" from a pre-computed set for the given node.
+    ///
+    /// Note: this node is not always zero, instead it is the result of hashing up a tree where the
+    /// leaves are all zeros.  E.g., in a tree of depth 2, the `zero_hash` of a node at depth 1
+    /// will be `[0; 32]`.  However, the `zero_hash` for a node at depth 0 will be
+    /// `hash(concat([0; 32], [0; 32])))`.
+    fn zero_hash(&self, id: usize) -> Preimage<'static> {
+        Preimage::Slice(get_zero_hash(self.depth - (get_depth(id) + 1)))
+    }
+}
+
+#[cfg(test)]
+mod test {
+    use super::*;
+    use crate::merkleize_padded;
+
+    /// This test is just to ensure that the stack size of the `Context` remains the same. We choose
+    /// our smallvec size based upon this, so it's good to know if it suddenly changes in size.
+    #[test]
+    fn context_size() {
+        assert_eq!(
+            mem::size_of::<HalfNode>(),
+            216 + 8,
+            "Halfnode size should be as expected"
+        );
+    }
+
+    fn compare_with_reference(leaves: &[Hash256], depth: usize) {
+        let reference_bytes = leaves
+            .iter()
+            .map(|hash| hash.as_bytes().to_vec())
+            .flatten()
+            .collect::<Vec<_>>();
+
+        let reference_root = merkleize_padded(&reference_bytes, 1 << (depth - 1));
+
+        let merklizer_root_32_bytes = {
+            let mut m = MerkleHasher::with_depth(depth);
+            for leaf in leaves.iter() {
+                m.write(leaf.as_bytes()).expect("should process leaf");
+            }
+            m.finish().expect("should finish")
+        };
+
+        assert_eq!(
+            reference_root, merklizer_root_32_bytes,
+            "32 bytes should match reference root"
+        );
+
+        let merklizer_root_individual_3_bytes = {
+            let mut m = MerkleHasher::with_depth(depth);
+            for bytes in reference_bytes.clone().chunks(3) {
+                m.write(bytes).expect("should process byte");
+            }
+            m.finish().expect("should finish")
+        };
+
+        assert_eq!(
+            reference_root, merklizer_root_individual_3_bytes,
+            "3 bytes should match reference root"
+        );
+
+        let merklizer_root_individual_single_bytes = {
+            let mut m = MerkleHasher::with_depth(depth);
+            for byte in reference_bytes.iter() {
+                m.write(&[*byte]).expect("should process byte");
+            }
+            m.finish().expect("should finish")
+        };
+
+        assert_eq!(
+            reference_root, merklizer_root_individual_single_bytes,
+            "single bytes should match reference root"
+        );
+    }
+
+    /// A simple wrapper to compare MerkleHasher to the reference function by just giving a number
+    /// of leaves and a depth.
+    fn compare_reference_with_len(leaves: u64, depth: usize) {
+        let leaves = (0..leaves)
+            .map(|i| Hash256::from_low_u64_be(i))
+            .collect::<Vec<_>>();
+        compare_with_reference(&leaves, depth)
+    }
+
+    /// Compares the `MerkleHasher::with_depth` and `MerkleHasher::with_leaves` generate consistent
+    /// results.
+    fn compare_new_with_leaf_count(num_leaves: u64, depth: usize) {
+        let leaves = (0..num_leaves)
+            .map(|i| Hash256::from_low_u64_be(i))
+            .collect::<Vec<_>>();
+
+        let from_depth = {
+            let mut m = MerkleHasher::with_depth(depth);
+            for leaf in leaves.iter() {
+                m.write(leaf.as_bytes()).expect("should process leaf");
+            }
+            m.finish()
+        };
+
+        let from_num_leaves = {
+            let mut m = MerkleHasher::with_leaves(num_leaves as usize);
+            for leaf in leaves.iter() {
+                m.process_leaf(leaf.as_bytes())
+                    .expect("should process leaf");
+            }
+            m.finish()
+        };
+
+        assert_eq!(
+            from_depth, from_num_leaves,
+            "hash generated by depth should match that from num leaves"
+        );
+    }
+
+    #[test]
+    fn with_leaves() {
+        compare_new_with_leaf_count(1, 1);
+        compare_new_with_leaf_count(2, 2);
+        compare_new_with_leaf_count(3, 3);
+        compare_new_with_leaf_count(4, 3);
+        compare_new_with_leaf_count(5, 4);
+        compare_new_with_leaf_count(6, 4);
+        compare_new_with_leaf_count(7, 4);
+        compare_new_with_leaf_count(8, 4);
+        compare_new_with_leaf_count(9, 5);
+        compare_new_with_leaf_count(10, 5);
+        compare_new_with_leaf_count(11, 5);
+        compare_new_with_leaf_count(12, 5);
+        compare_new_with_leaf_count(13, 5);
+        compare_new_with_leaf_count(14, 5);
+        compare_new_with_leaf_count(15, 5);
+    }
+
+    #[test]
+    fn depth() {
+        assert_eq!(get_depth(1), 0);
+        assert_eq!(get_depth(2), 1);
+        assert_eq!(get_depth(3), 1);
+        assert_eq!(get_depth(4), 2);
+        assert_eq!(get_depth(5), 2);
+        assert_eq!(get_depth(6), 2);
+        assert_eq!(get_depth(7), 2);
+        assert_eq!(get_depth(8), 3);
+    }
+
+    #[test]
+    fn with_0_leaves() {
+        let hasher = MerkleHasher::with_leaves(0);
+        assert_eq!(hasher.finish().unwrap(), Hash256::zero());
+    }
+
+    #[test]
+    #[should_panic]
+    fn too_many_leaves() {
+        compare_reference_with_len(2, 1);
+    }
+
+    #[test]
+    fn full_trees() {
+        compare_reference_with_len(1, 1);
+        compare_reference_with_len(2, 2);
+        compare_reference_with_len(4, 3);
+        compare_reference_with_len(8, 4);
+        compare_reference_with_len(16, 5);
+        compare_reference_with_len(32, 6);
+        compare_reference_with_len(64, 7);
+        compare_reference_with_len(128, 8);
+        compare_reference_with_len(256, 9);
+        compare_reference_with_len(256, 9);
+        compare_reference_with_len(8192, 14);
+    }
+
+    #[test]
+    fn incomplete_trees() {
+        compare_reference_with_len(0, 1);
+
+        compare_reference_with_len(0, 2);
+        compare_reference_with_len(1, 2);
+
+        for i in 0..=4 {
+            compare_reference_with_len(i, 3);
+        }
+
+        for i in 0..=7 {
+            compare_reference_with_len(i, 4);
+        }
+
+        for i in 0..=15 {
+            compare_reference_with_len(i, 5);
+        }
+
+        for i in 0..=32 {
+            compare_reference_with_len(i, 6);
+        }
+
+        for i in 0..=64 {
+            compare_reference_with_len(i, 7);
+        }
+
+        compare_reference_with_len(0, 14);
+        compare_reference_with_len(13, 14);
+        compare_reference_with_len(8191, 14);
+    }
+
+    #[test]
+    fn remaining_buffer() {
+        let a = {
+            let mut m = MerkleHasher::with_leaves(2);
+            m.write(&[1]).expect("should write");
+            m.finish().expect("should finish")
+        };
+
+        let b = {
+            let mut m = MerkleHasher::with_leaves(2);
+            let mut leaf = vec![1];
+            leaf.extend_from_slice(&[0; 31]);
+            m.write(&leaf).expect("should write");
+            m.write(&[0; 32]).expect("should write");
+            m.finish().expect("should finish")
+        };
+
+        assert_eq!(a, b, "should complete buffer");
+    }
+}
--- a/consensus/tree_hash/src/merkleize_padded.rs
+++ b/consensus/tree_hash/src/merkleize_padded.rs
@@ -0,0 +1,330 @@
+use super::{get_zero_hash, Hash256, BYTES_PER_CHUNK};
+use eth2_hashing::{hash, hash32_concat};
+
+/// Merkleize `bytes` and return the root, optionally padding the tree out to `min_leaves` number of
+/// leaves.
+///
+/// **Note**: This function is generally worse than using the `crate::merkle_root` which uses
+/// `MerkleHasher`. We only keep this function around for reference testing.
+///
+/// First all nodes are extracted from `bytes` and then a padding node is added until the number of
+/// leaf chunks is greater than or equal to `min_leaves`. Callers may set `min_leaves` to `0` if no
+/// adding additional chunks should be added to the given `bytes`.
+///
+/// If `bytes.len() <= BYTES_PER_CHUNK`, no hashing is done and `bytes` is returned, potentially
+/// padded out to `BYTES_PER_CHUNK` length with `0`.
+///
+/// ## CPU Performance
+///
+/// A cache of `MAX_TREE_DEPTH` hashes are stored to avoid re-computing the hashes of padding nodes
+/// (or their parents). Therefore, adding padding nodes only incurs one more hash per additional
+/// height of the tree.
+///
+/// ## Memory Performance
+///
+/// This algorithm has two interesting memory usage properties:
+///
+/// 1. The maximum memory footprint is roughly `O(V / 2)` memory, where `V` is the number of leaf
+///    chunks with values (i.e., leaves that are not padding). The means adding padding nodes to
+///    the tree does not increase the memory footprint.
+/// 2. At each height of the tree half of the memory is freed until only a single chunk is stored.
+/// 3. The input `bytes` are not copied into another list before processing.
+///
+/// _Note: there are some minor memory overheads, including a handful of usizes and a list of
+/// `MAX_TREE_DEPTH` hashes as `lazy_static` constants._
+pub fn merkleize_padded(bytes: &[u8], min_leaves: usize) -> Hash256 {
+    // If the bytes are just one chunk or less, pad to one chunk and return without hashing.
+    if bytes.len() <= BYTES_PER_CHUNK && min_leaves <= 1 {
+        let mut o = bytes.to_vec();
+        o.resize(BYTES_PER_CHUNK, 0);
+        return Hash256::from_slice(&o);
+    }
+
+    assert!(
+        bytes.len() > BYTES_PER_CHUNK || min_leaves > 1,
+        "Merkle hashing only needs to happen if there is more than one chunk"
+    );
+
+    // The number of leaves that can be made directly from `bytes`.
+    let leaves_with_values = (bytes.len() + (BYTES_PER_CHUNK - 1)) / BYTES_PER_CHUNK;
+
+    // The number of parents that have at least one non-padding leaf.
+    //
+    // Since there is more than one node in this tree (see prior assertion), there should always be
+    // one or more initial parent nodes.
+    let initial_parents_with_values = std::cmp::max(1, next_even_number(leaves_with_values) / 2);
+
+    // The number of leaves in the full tree (including padding nodes).
+    let num_leaves = std::cmp::max(leaves_with_values, min_leaves).next_power_of_two();
+
+    // The number of levels in the tree.
+    //
+    // A tree with a single node has `height == 1`.
+    let height = num_leaves.trailing_zeros() as usize + 1;
+
+    assert!(height >= 2, "The tree should have two or more heights");
+
+    // A buffer/scratch-space used for storing each round of hashes at each height.
+    //
+    // This buffer is kept as small as possible; it will shrink so it never stores a padding node.
+    let mut chunks = ChunkStore::with_capacity(initial_parents_with_values);
+
+    // Create a parent in the `chunks` buffer for every two chunks in `bytes`.
+    //
+    // I.e., do the first round of hashing, hashing from the `bytes` slice and filling the `chunks`
+    // struct.
+    for i in 0..initial_parents_with_values {
+        let start = i * BYTES_PER_CHUNK * 2;
+
+        // Hash two chunks, creating a parent chunk.
+        let hash = match bytes.get(start..start + BYTES_PER_CHUNK * 2) {
+            // All bytes are available, hash as usual.
+            Some(slice) => hash(slice),
+            // Unable to get all the bytes, get a small slice and pad it out.
+            None => {
+                let mut preimage = bytes
+                    .get(start..)
+                    .expect("`i` can only be larger than zero if there are bytes to read")
+                    .to_vec();
+                preimage.resize(BYTES_PER_CHUNK * 2, 0);
+                hash(&preimage)
+            }
+        };
+
+        assert_eq!(
+            hash.len(),
+            BYTES_PER_CHUNK,
+            "Hashes should be exactly one chunk"
+        );
+
+        // Store the parent node.
+        chunks
+            .set(i, &hash)
+            .expect("Buffer should always have capacity for parent nodes")
+    }
+
+    // Iterate through all heights above the leaf nodes and either (a) hash two children or, (b)
+    // hash a left child and a right padding node.
+    //
+    // Skip the 0'th height because the leaves have already been processed. Skip the highest-height
+    // in the tree as it is the root does not require hashing.
+    //
+    // The padding nodes for each height are cached via `lazy static` to simulate non-adjacent
+    // padding nodes (i.e., avoid doing unnecessary hashing).
+    for height in 1..height - 1 {
+        let child_nodes = chunks.len();
+        let parent_nodes = next_even_number(child_nodes) / 2;
+
+        // For each pair of nodes stored in `chunks`:
+        //
+        // - If two nodes are available, hash them to form a parent.
+        // - If one node is available, hash it and a cached padding node to form a parent.
+        for i in 0..parent_nodes {
+            let (left, right) = match (chunks.get(i * 2), chunks.get(i * 2 + 1)) {
+                (Ok(left), Ok(right)) => (left, right),
+                (Ok(left), Err(_)) => (left, get_zero_hash(height)),
+                // Deriving `parent_nodes` from `chunks.len()` has ensured that we never encounter the
+                // scenario where we expect two nodes but there are none.
+                (Err(_), Err(_)) => unreachable!("Parent must have one child"),
+                // `chunks` is a contiguous array so it is impossible for an index to be missing
+                // when a higher index is present.
+                (Err(_), Ok(_)) => unreachable!("Parent must have a left child"),
+            };
+
+            assert!(
+                left.len() == right.len() && right.len() == BYTES_PER_CHUNK,
+                "Both children should be `BYTES_PER_CHUNK` bytes."
+            );
+
+            let hash = hash32_concat(left, right);
+
+            // Store a parent node.
+            chunks
+                .set(i, &hash)
+                .expect("Buf is adequate size for parent");
+        }
+
+        // Shrink the buffer so it neatly fits the number of new nodes created in this round.
+        //
+        // The number of `parent_nodes` is either decreasing or stable. It never increases.
+        chunks.truncate(parent_nodes);
+    }
+
+    // There should be a single chunk left in the buffer and it is the Merkle root.
+    let root = chunks.into_vec();
+
+    assert_eq!(root.len(), BYTES_PER_CHUNK, "Only one chunk should remain");
+
+    Hash256::from_slice(&root)
+}
+
+/// A helper struct for storing words of `BYTES_PER_CHUNK` size in a flat byte array.
+#[derive(Debug)]
+struct ChunkStore(Vec<u8>);
+
+impl ChunkStore {
+    /// Creates a new instance with `chunks` padding nodes.
+    fn with_capacity(chunks: usize) -> Self {
+        Self(vec![0; chunks * BYTES_PER_CHUNK])
+    }
+
+    /// Set the `i`th chunk to `value`.
+    ///
+    /// Returns `Err` if `value.len() != BYTES_PER_CHUNK` or `i` is out-of-bounds.
+    fn set(&mut self, i: usize, value: &[u8]) -> Result<(), ()> {
+        if i < self.len() && value.len() == BYTES_PER_CHUNK {
+            let slice = &mut self.0[i * BYTES_PER_CHUNK..i * BYTES_PER_CHUNK + BYTES_PER_CHUNK];
+            slice.copy_from_slice(value);
+            Ok(())
+        } else {
+            Err(())
+        }
+    }
+
+    /// Gets the `i`th chunk.
+    ///
+    /// Returns `Err` if `i` is out-of-bounds.
+    fn get(&self, i: usize) -> Result<&[u8], ()> {
+        if i < self.len() {
+            Ok(&self.0[i * BYTES_PER_CHUNK..i * BYTES_PER_CHUNK + BYTES_PER_CHUNK])
+        } else {
+            Err(())
+        }
+    }
+
+    /// Returns the number of chunks presently stored in `self`.
+    fn len(&self) -> usize {
+        self.0.len() / BYTES_PER_CHUNK
+    }
+
+    /// Truncates 'self' to `num_chunks` chunks.
+    ///
+    /// Functionally identical to `Vec::truncate`.
+    fn truncate(&mut self, num_chunks: usize) {
+        self.0.truncate(num_chunks * BYTES_PER_CHUNK)
+    }
+
+    /// Consumes `self`, returning the underlying byte array.
+    fn into_vec(self) -> Vec<u8> {
+        self.0
+    }
+}
+
+/// Returns the next even number following `n`. If `n` is even, `n` is returned.
+fn next_even_number(n: usize) -> usize {
+    n + n % 2
+}
+
+#[cfg(test)]
+mod test {
+    use super::*;
+    use crate::ZERO_HASHES_MAX_INDEX;
+
+    pub fn reference_root(bytes: &[u8]) -> Hash256 {
+        crate::merkleize_standard(&bytes)
+    }
+
+    macro_rules! common_tests {
+        ($get_bytes: ident) => {
+            #[test]
+            fn zero_value_0_nodes() {
+                test_against_reference(&$get_bytes(0 * BYTES_PER_CHUNK), 0);
+            }
+
+            #[test]
+            fn zero_value_1_nodes() {
+                test_against_reference(&$get_bytes(1 * BYTES_PER_CHUNK), 0);
+            }
+
+            #[test]
+            fn zero_value_2_nodes() {
+                test_against_reference(&$get_bytes(2 * BYTES_PER_CHUNK), 0);
+            }
+
+            #[test]
+            fn zero_value_3_nodes() {
+                test_against_reference(&$get_bytes(3 * BYTES_PER_CHUNK), 0);
+            }
+
+            #[test]
+            fn zero_value_4_nodes() {
+                test_against_reference(&$get_bytes(4 * BYTES_PER_CHUNK), 0);
+            }
+
+            #[test]
+            fn zero_value_8_nodes() {
+                test_against_reference(&$get_bytes(8 * BYTES_PER_CHUNK), 0);
+            }
+
+            #[test]
+            fn zero_value_9_nodes() {
+                test_against_reference(&$get_bytes(9 * BYTES_PER_CHUNK), 0);
+            }
+
+            #[test]
+            fn zero_value_8_nodes_varying_min_length() {
+                for i in 0..64 {
+                    test_against_reference(&$get_bytes(8 * BYTES_PER_CHUNK), i);
+                }
+            }
+
+            #[test]
+            fn zero_value_range_of_nodes() {
+                for i in 0..32 * BYTES_PER_CHUNK {
+                    test_against_reference(&$get_bytes(i), 0);
+                }
+            }
+
+            #[test]
+            fn max_tree_depth_min_nodes() {
+                let input = vec![0; 10 * BYTES_PER_CHUNK];
+                let min_nodes = 2usize.pow(ZERO_HASHES_MAX_INDEX as u32);
+                assert_eq!(
+                    merkleize_padded(&input, min_nodes).as_bytes(),
+                    get_zero_hash(ZERO_HASHES_MAX_INDEX)
+                );
+            }
+        };
+    }
+
+    mod zero_value {
+        use super::*;
+
+        fn zero_bytes(bytes: usize) -> Vec<u8> {
+            vec![0; bytes]
+        }
+
+        common_tests!(zero_bytes);
+    }
+
+    mod random_value {
+        use super::*;
+        use rand::RngCore;
+
+        fn random_bytes(bytes: usize) -> Vec<u8> {
+            let mut bytes = Vec::with_capacity(bytes);
+            rand::thread_rng().fill_bytes(&mut bytes);
+            bytes
+        }
+
+        common_tests!(random_bytes);
+    }
+
+    fn test_against_reference(input: &[u8], min_nodes: usize) {
+        let mut reference_input = input.to_vec();
+        reference_input.resize(
+            std::cmp::max(
+                reference_input.len(),
+                min_nodes.next_power_of_two() * BYTES_PER_CHUNK,
+            ),
+            0,
+        );
+
+        assert_eq!(
+            reference_root(&reference_input),
+            merkleize_padded(&input, min_nodes),
+            "input.len(): {:?}",
+            input.len()
+        );
+    }
+}
--- a/consensus/tree_hash/src/merkleize_standard.rs
+++ b/consensus/tree_hash/src/merkleize_standard.rs
@@ -0,0 +1,81 @@
+use super::*;
+use eth2_hashing::hash;
+
+/// Merkleizes bytes and returns the root, using a simple algorithm that does not optimize to avoid
+/// processing or storing padding bytes.
+///
+/// **Note**: This function is generally worse than using the `crate::merkle_root` which uses
+/// `MerkleHasher`. We only keep this function around for reference testing.
+///
+/// The input `bytes` will be padded to ensure that the number of leaves is a power-of-two.
+///
+/// ## CPU Performance
+///
+/// Will hash all nodes in the tree, even if they are padding and pre-determined.
+///
+/// ## Memory Performance
+///
+///  - Duplicates the input `bytes`.
+///  - Stores all internal nodes, even if they are padding.
+///  - Does not free up unused memory during operation.
+pub fn merkleize_standard(bytes: &[u8]) -> Hash256 {
+    // If the bytes are just one chunk (or less than one chunk) just return them.
+    if bytes.len() <= HASHSIZE {
+        let mut o = bytes.to_vec();
+        o.resize(HASHSIZE, 0);
+        return Hash256::from_slice(&o[0..HASHSIZE]);
+    }
+
+    let leaves = num_sanitized_leaves(bytes.len());
+    let nodes = num_nodes(leaves);
+    let internal_nodes = nodes - leaves;
+
+    let num_bytes = std::cmp::max(internal_nodes, 1) * HASHSIZE + bytes.len();
+
+    let mut o: Vec<u8> = vec![0; internal_nodes * HASHSIZE];
+
+    o.append(&mut bytes.to_vec());
+
+    assert_eq!(o.len(), num_bytes);
+
+    let empty_chunk_hash = hash(&[0; MERKLE_HASH_CHUNK]);
+
+    let mut i = nodes * HASHSIZE;
+    let mut j = internal_nodes * HASHSIZE;
+
+    while i >= MERKLE_HASH_CHUNK {
+        i -= MERKLE_HASH_CHUNK;
+
+        j -= HASHSIZE;
+        let hash = match o.get(i..i + MERKLE_HASH_CHUNK) {
+            // All bytes are available, hash as usual.
+            Some(slice) => hash(slice),
+            // Unable to get all the bytes.
+            None => {
+                match o.get(i..) {
+                    // Able to get some of the bytes, pad them out.
+                    Some(slice) => {
+                        let mut bytes = slice.to_vec();
+                        bytes.resize(MERKLE_HASH_CHUNK, 0);
+                        hash(&bytes)
+                    }
+                    // Unable to get any bytes, use the empty-chunk hash.
+                    None => empty_chunk_hash.clone(),
+                }
+            }
+        };
+
+        o[j..j + HASHSIZE].copy_from_slice(&hash);
+    }
+
+    Hash256::from_slice(&o[0..HASHSIZE])
+}
+
+fn num_sanitized_leaves(num_bytes: usize) -> usize {
+    let leaves = (num_bytes + HASHSIZE - 1) / HASHSIZE;
+    leaves.next_power_of_two()
+}
+
+fn num_nodes(num_leaves: usize) -> usize {
+    2 * num_leaves - 1
+}