add proof_size_to_hashes
shawntabrizi committed Sep 21, 2024
1 parent 3ab4d94 commit 0c8d189
Showing 3 changed files with 76 additions and 1 deletion.
9 changes: 9 additions & 0 deletions substrate/primitives/runtime/src/proving_trie/base16.rs
@@ -26,6 +26,7 @@

use super::{ProvingTrie, TrieError};
use crate::{Decode, DispatchError, Encode};
use codec::MaxEncodedLen;
use sp_std::vec::Vec;
use sp_trie::{
trie_types::{TrieDBBuilder, TrieDBMutBuilderV1},
@@ -72,6 +73,7 @@ where
impl<Hashing, Key, Value> ProvingTrie<Hashing, Key, Value> for BasicProvingTrie<Hashing, Key, Value>
where
Hashing: sp_core::Hasher,
Hashing::Out: MaxEncodedLen,
Key: Encode,
Value: Encode + Decode,
{
@@ -133,6 +135,13 @@ where
) -> Result<(), DispatchError> {
verify_proof::<Hashing, Key, Value>(root, proof, key, value)
}

/// A base-16 trie is expected to include the data for 15 hashes per layer.
fn proof_size_to_hashes(proof_size: &u32) -> u32 {
let hash_len = Hashing::Out::max_encoded_len() as u32;
let layer_len = 15 * hash_len;
(proof_size + layer_len - 1) / layer_len
}
}

/// Verify the existence of `key` and `value` in a given trie root and proof.
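
For illustration only, and not part of this commit: a minimal standalone sketch of the base-16 estimate above, assuming a 32-byte hash output such as BlakeTwo256. Fifteen sibling hashes per layer give 15 * 32 = 480 bytes of proof data per layer, so the estimate is a ceiling division of the proof size by that layer size.

fn base16_proof_size_to_hashes(proof_size: u32) -> u32 {
    // Assumption for this sketch: a 32-byte hash output (e.g. BlakeTwo256).
    let hash_len: u32 = 32;
    // A base-16 trie proof carries up to 15 sibling hashes per layer.
    let layer_len = 15 * hash_len;
    // Ceiling division, so a benchmark based on this assumes the worst case.
    (proof_size + layer_len - 1) / layer_len
}

fn main() {
    // A ~1,500-byte proof corresponds to roughly 4 layers, i.e. 4 hashes.
    assert_eq!(base16_proof_size_to_hashes(1_500), 4);
}
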
13 changes: 12 additions & 1 deletion substrate/primitives/runtime/src/proving_trie/base2.rs
@@ -23,6 +23,7 @@
use super::{ProvingTrie, TrieError};
use crate::{Decode, DispatchError, Encode};
use binary_merkle_tree::{merkle_proof, merkle_root, MerkleProof};
use codec::MaxEncodedLen;
use sp_std::{collections::btree_map::BTreeMap, vec::Vec};

/// A helper structure for building a basic base-2 merkle trie and creating compact proofs for that
@@ -40,7 +41,7 @@ where
impl<Hashing, Key, Value> ProvingTrie<Hashing, Key, Value> for BasicProvingTrie<Hashing, Key, Value>
where
Hashing: sp_core::Hasher,
- Hashing::Out: Encode + Decode,
+ Hashing::Out: Encode + Decode + MaxEncodedLen,
Key: Encode + Decode + Ord,
Value: Encode + Decode + Clone,
{
@@ -99,6 +100,16 @@ where
) -> Result<(), DispatchError> {
verify_proof::<Hashing, Key, Value>(root, proof, key, value)
}

/// A base-2 trie is expected to include the data for 1 hash per layer.
fn proof_size_to_hashes(proof_size: &u32) -> u32 {
let hash_len = Hashing::Out::max_encoded_len() as u32;
let layer_len = 1 * hash_len;
// The implementation of this trie also includes the `key` and `value` encoded within the
// proof, but since we cannot know the "minimum" size of those items, we count them toward
// the number of hashes for a worst-case scenario.
(proof_size + layer_len - 1) / layer_len
}
}

/// Verify the existence of `key` and `value` in a given trie root and proof.
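
Likewise, a minimal sketch of the base-2 estimate above, under the same 32-byte hash assumption and not part of this commit: each layer contributes a single sibling hash, so the estimate is roughly `proof_size / 32`, rounded up, and any key or value bytes inside the proof only push the count higher, which suits a worst-case benchmark.

fn base2_proof_size_to_hashes(proof_size: u32) -> u32 {
    // Assumption for this sketch: a 32-byte hash output (e.g. BlakeTwo256).
    let hash_len: u32 = 32;
    // A base-2 merkle proof carries one sibling hash per layer.
    let layer_len = hash_len;
    // Encoded key/value bytes in the proof simply inflate the count (worst case).
    (proof_size + layer_len - 1) / layer_len
}

fn main() {
    // A 300-byte proof is treated as roughly 10 hashes.
    assert_eq!(base2_proof_size_to_hashes(300), 10);
}
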
55 changes: 55 additions & 0 deletions substrate/primitives/runtime/src/proving_trie/mod.rs
@@ -137,6 +137,15 @@
key: &Key,
value: &Value,
) -> Result<(), DispatchError>;
/// Returns the number of hashes we expect to compute based on the size of the proof.
/// This is used for benchmarking, so for the worst-case scenario we should round up.
///
/// The major cost of `verify_proof` is computing the hashes needed to calculate the
/// merkle root. For tries, the depth of the trie (which is equal to the number of hashes)
/// can be predicted from the size of the proof. A rough estimate is:
/// `proof_size` / (`hash_size` * `num_hashes_per_layer`).
fn proof_size_to_hashes(proof_size: &u32) -> u32;
}

#[cfg(test)]
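
The rough estimate described in the documentation above can be written out generically; the sketch below is illustrative only, and `estimate_hashes` is a hypothetical helper rather than an API introduced by this commit.

fn estimate_hashes(proof_size: u32, hash_size: u32, hashes_per_layer: u32) -> u32 {
    // Generic form of the estimate: proof_size / (hash_size * hashes_per_layer),
    // rounded up to cover the worst case.
    let layer_len = hash_size * hashes_per_layer;
    (proof_size + layer_len - 1) / layer_len
}

fn main() {
    // A 960-byte base-16 proof with 32-byte hashes is about 2 layers deep.
    assert_eq!(estimate_hashes(960, 32, 15), 2);
    // The same proof size over a base-2 tree is counted as 30 hashes.
    assert_eq!(estimate_hashes(960, 32, 1), 30);
}
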
@@ -169,4 +178,50 @@ mod tests {
let proof = balance_trie.create_proof(&69u32).unwrap();
assert_eq!(BalanceTrie16::verify_proof(&root, &proof, &69u32, &69u128), Ok(()));
}

#[test]
fn proof_size_to_hashes() {
use crate::{testing::H256, traits::BlakeTwo256};
use codec::MaxEncodedLen;

// We can be off by up to 2 hashes... should be trivial.
let tolerance = 2;

let abs_dif = |x, y| {
if x > y {
x - y
} else {
y - x
}
};

let mut i: u32 = 1;
while i < 10_000_000 {
let trie = BalanceTrie2::generate_for((0..i).map(|i| (i, u128::from(i)))).unwrap();
let proof = trie.create_proof(&(i / 2)).unwrap();
let hashes = BalanceTrie2::proof_size_to_hashes(&(proof.len() as u32));
let log2 = (i as f64).log2().ceil() as u32;

assert!(abs_dif(hashes, log2) <= tolerance);
i = i * 10;
}

// Compute log base 16 and round up
let log16 = |x: u32| -> u32 {
let x_f64 = x as f64;
let log16_x = (x_f64.ln() / 16_f64.ln()).ceil();
log16_x as u32
};

let mut i: u32 = 1;
while i < 10_000_000 {
let trie = BalanceTrie16::generate_for((0..i).map(|i| (i, u128::from(i)))).unwrap();
let proof = trie.create_proof(&(i / 2)).unwrap();
let hashes = BalanceTrie16::proof_size_to_hashes(&(proof.len() as u32));
let log16 = log16(i);

assert!(abs_dif(hashes, log16) <= tolerance);
i = i * 10;
}
}
}
