paradigmxyz · joshieDo · Jul 31, 2023 · Jul 11, 2023 · Jul 11, 2023 · Jul 11, 2023
@@ -760,12 +760,17 @@ impl Command {
                 .set(AccountHashingStage::new(
                     stage_config.account_hashing.clean_threshold,
                     stage_config.account_hashing.commit_threshold,
+                    config.prune.map(|prune| prune.parts).unwrap_or_default(),
                 ))
                 .set(StorageHashingStage::new(
                     stage_config.storage_hashing.clean_threshold,
                     stage_config.storage_hashing.commit_threshold,
+                    config.prune.map(|prune| prune.parts).unwrap_or_default(),
+                ))
+                .set(MerkleStage::new_execution(
+                    stage_config.merkle.clean_threshold,
+                    config.prune.map(|prune| prune.parts).unwrap_or_default(),
                 ))
-                .set(MerkleStage::new_execution(stage_config.merkle.clean_threshold))
                 .set(TransactionLookupStage::new(stage_config.transaction_lookup.commit_threshold))
                 .set(IndexAccountHistoryStage::new(
                     stage_config.index_account_history.commit_threshold,

@@ -86,14 +86,22 @@ async fn unwind_and_copy<DB: Database>(
 
     // Bring hashes to TO
 
-    AccountHashingStage { clean_threshold: u64::MAX, commit_threshold: u64::MAX }
-        .execute(&provider, execute_input)
-        .await
-        .unwrap();
-    StorageHashingStage { clean_threshold: u64::MAX, commit_threshold: u64::MAX }
-        .execute(&provider, execute_input)
-        .await
-        .unwrap();
+    AccountHashingStage {
+        clean_threshold: u64::MAX,
+        commit_threshold: u64::MAX,
+        prune_modes: PruneModes::none(),
+    }
+    .execute(&provider, execute_input)
+    .await
+    .unwrap();
+    StorageHashingStage {
+        clean_threshold: u64::MAX,
+        commit_threshold: u64::MAX,
+        prune_modes: PruneModes::none(),
+    }
+    .execute(&provider, execute_input)
+    .await
+    .unwrap();
 
     let unwind_inner_tx = provider.into_tx();
 
@@ -124,6 +132,7 @@ async fn dry_run<DB: Database>(
             clean_threshold: u64::MAX, /* Forces updating the root instead of calculating
                                         * from
                                         * scratch */
+            prune_modes: Default::default(),
         }
         .execute(
             &provider,

@@ -208,12 +208,22 @@ impl Command {
                     )
                 }
                 StageEnum::TxLookup => (Box::new(TransactionLookupStage::new(batch_size)), None),
-                StageEnum::AccountHashing => {
-                    (Box::new(AccountHashingStage::new(1, batch_size)), None)
-                }
-                StageEnum::StorageHashing => {
-                    (Box::new(StorageHashingStage::new(1, batch_size)), None)
-                }
+                StageEnum::AccountHashing => (
+                    Box::new(AccountHashingStage::new(
+                        1,
+                        batch_size,
+                        config.prune.map(|prune| prune.parts).unwrap_or_default(),
+                    )),
+                    None,
+                ),
+                StageEnum::StorageHashing => (
+                    Box::new(StorageHashingStage::new(
+                        1,
+                        batch_size,
+                        config.prune.map(|prune| prune.parts).unwrap_or_default(),
+                    )),
+                    None,
+                ),
                 StageEnum::Merkle => (
                     Box::new(MerkleStage::default_execution()),
                     Some(Box::new(MerkleStage::default_unwind())),

@@ -79,7 +79,7 @@ pub use net::{
     SEPOLIA_BOOTNODES,
 };
 pub use peer::{PeerId, WithPeerId};
-pub use prune::{PruneCheckpoint, PruneMode, PruneModes, PrunePart};
+pub use prune::{PruneCheckpoint, PruneMode, PruneModes, PrunePart, PrunePartError};
 pub use receipt::{Receipt, ReceiptWithBloom, ReceiptWithBloomRef};
 pub use revm_primitives::JumpMap;
 pub use serde_helper::JsonU256;

@@ -5,5 +5,5 @@ mod target;
 
 pub use checkpoint::PruneCheckpoint;
 pub use mode::PruneMode;
-pub use part::PrunePart;
+pub use part::{PrunePart, PrunePartError};
 pub use target::PruneModes;
@@ -1,8 +1,10 @@
+use derive_more::Display;
 use reth_codecs::{main_codec, Compact};
+use thiserror::Error;
 
 /// Part of the data that can be pruned.
 #[main_codec]
-#[derive(Debug, Clone, Copy, Eq, PartialEq, Ord, PartialOrd, Hash)]
+#[derive(Debug, Display, Clone, Copy, Eq, PartialEq, Ord, PartialOrd, Hash)]
 pub enum PrunePart {
     /// Prune part responsible for the `TxSenders` table.
     SenderRecovery,
@@ -16,6 +18,14 @@ pub enum PrunePart {
     StorageHistory,
 }
 
+/// Errors related to the configuration of a [`PrunePart`].
+#[derive(Debug, Error)]
+pub enum PrunePartError {
+    /// The configuration provided for the contained [`PrunePart`] is invalid.
+    #[error("The configuration provided for {0} is invalid.")]
+    Configuration(PrunePart),
+}
+
 #[cfg(test)]
 impl Default for PrunePart {
     fn default() -> Self {

@@ -1,4 +1,7 @@
-use crate::{serde_helper::deserialize_opt_prune_mode_with_min_blocks, BlockNumber, PruneMode};
+use crate::{
+    prune::PrunePartError, serde_helper::deserialize_opt_prune_mode_with_min_blocks, BlockNumber,
+    PruneMode, PrunePart,
+};
 use paste::paste;
 use serde::{Deserialize, Serialize};
 
@@ -19,10 +22,16 @@ pub struct PruneModes {
     )]
     pub receipts: Option<PruneMode>,
     /// Account History pruning configuration.
-    #[serde(skip_serializing_if = "Option::is_none")]
+    #[serde(
+        skip_serializing_if = "Option::is_none",
+        deserialize_with = "deserialize_opt_prune_mode_with_min_blocks::<64, _>"
+    )]
     pub account_history: Option<PruneMode>,
     /// Storage History pruning configuration.
-    #[serde(skip_serializing_if = "Option::is_none")]
+    #[serde(
+        skip_serializing_if = "Option::is_none",
+        deserialize_with = "deserialize_opt_prune_mode_with_min_blocks::<64, _>"
+    )]
     pub storage_history: Option<PruneMode>,
 }
 
@@ -51,12 +60,15 @@ macro_rules! impl_prune_parts {
                     $human_part,
                     " pruning needs to be done, inclusive, according to the provided tip."
                 )]
-                pub fn [<prune_target_block_ $part>](&self, tip: BlockNumber) -> Option<(BlockNumber, PruneMode)> {
-                    self.$part.as_ref().and_then(|mode| {
-                        self.prune_target_block(mode, tip, $min_blocks).map(|block| {
-                            (block, *mode)
-                        })
-                    })
+                pub fn [<prune_target_block_ $part>](&self, tip: BlockNumber) -> Result<Option<(BlockNumber, PruneMode)>, PrunePartError> {
+                    match &self.$part {
+                        Some(mode) =>
+                            match self.prune_target_block(mode, tip, $min_blocks) {
+                                Some(block) => Ok(Some((block, *mode))),
+                                None => Err(PrunePartError::Configuration(PrunePart::[<$human_part>]))
+                            }
+                        None => Ok(None)
+                    }
                 }
             }
         )+
@@ -107,17 +119,17 @@ impl PruneModes {
                 Some(tip.saturating_sub(*distance))
             }
             PruneMode::Before(n) if tip.saturating_sub(*n) >= min_blocks.unwrap_or_default() => {
-                Some(*n)
+                Some(n.saturating_sub(1))
             }
             _ => None,
         }
     }
 
     impl_prune_parts!(
-        (sender_recovery, "Sender Recovery", None),
-        (transaction_lookup, "Transaction Lookup", None),
+        (sender_recovery, "SenderRecovery", None),
+        (transaction_lookup, "TransactionLookup", None),
         (receipts, "Receipts", Some(64)),
-        (account_history, "Account History", None),
-        (storage_history, "Storage History", None)
+        (account_history, "AccountHistory", Some(64)),
+        (storage_history, "StorageHistory", Some(64))
     );
 }
@@ -4,6 +4,9 @@ use thiserror::Error;
 
 #[derive(Error, Debug)]
 pub enum PrunerError {
+    #[error(transparent)]
+    PrunePart(#[from] reth_primitives::PrunePartError),
+
     #[error("Inconsistent data: {0}")]
     InconsistentData(&'static str),
 

@@ -72,13 +72,13 @@ impl<DB: Database> Pruner<DB> {
         let provider = self.provider_factory.provider_rw()?;
 
         if let Some((to_block, prune_mode)) =
-            self.modes.prune_target_block_receipts(tip_block_number)
+            self.modes.prune_target_block_receipts(tip_block_number)?
         {
             self.prune_receipts(&provider, to_block, prune_mode)?;
         }
 
         if let Some((to_block, prune_mode)) =
-            self.modes.prune_target_block_transaction_lookup(tip_block_number)
+            self.modes.prune_target_block_transaction_lookup(tip_block_number)?
         {
             self.prune_transaction_lookup(&provider, to_block, prune_mode)?;
         }

@@ -95,7 +95,7 @@ fn merkle(c: &mut Criterion) {
     // don't need to run each stage for that many times
     group.sample_size(10);
 
-    let stage = MerkleStage::Both { clean_threshold: u64::MAX };
+    let stage = MerkleStage::Both { clean_threshold: u64::MAX, prune_modes: Default::default() };
     measure_stage(
         &mut group,
         setup::unwind_hashes,
@@ -104,7 +104,7 @@ fn merkle(c: &mut Criterion) {
         "Merkle-incremental".to_string(),
     );
 
-    let stage = MerkleStage::Both { clean_threshold: 0 };
+    let stage = MerkleStage::Both { clean_threshold: 0, prune_modes: Default::default() };
     measure_stage(
         &mut group,
         setup::unwind_hashes,

@@ -49,6 +49,9 @@ pub enum StageError {
         #[source]
         error: executor::BlockExecutionError,
     },
+    /// Invalid pruning configuration
+    #[error(transparent)]
+    PruningConfiguration(#[from] reth_primitives::PrunePartError),
     /// Invalid checkpoint passed to the stage
     #[error("Invalid stage checkpoint: {0}")]
     StageCheckpoint(u64),

@@ -60,17 +60,17 @@ pub struct ExecutionStage<EF: ExecutorFactory> {
     /// The commit thresholds of the execution stage.
     thresholds: ExecutionStageThresholds,
     /// Pruning configuration.
-    prune_targets: PruneModes,
+    prune_modes: PruneModes,
 }
 
 impl<EF: ExecutorFactory> ExecutionStage<EF> {
     /// Create new execution stage with specified config.
     pub fn new(
         executor_factory: EF,
         thresholds: ExecutionStageThresholds,
-        prune_targets: PruneModes,
+        prune_modes: PruneModes,
     ) -> Self {
-        Self { metrics_tx: None, executor_factory, thresholds, prune_targets }
+        Self { metrics_tx: None, executor_factory, thresholds, prune_modes }
     }
 
     /// Create an execution stage with the provided  executor factory.
@@ -110,7 +110,7 @@ impl<EF: ExecutorFactory> ExecutionStage<EF> {
 
         // Execute block range
         let mut state = PostState::default();
-        state.add_prune_targets(self.prune_targets);
+        state.add_prune_modes(self.prune_modes);
 
         for block_number in start_block..=max_block {
             let td = provider
@@ -425,8 +425,7 @@ mod tests {
     use reth_db::{models::AccountBeforeTx, test_utils::create_test_rw_db};
     use reth_primitives::{
         hex_literal::hex, keccak256, stage::StageUnitCheckpoint, Account, Bytecode,
-        ChainSpecBuilder, PruneMode, PruneModes, SealedBlock, StorageEntry, H160, H256, MAINNET,
-        U256,
+        ChainSpecBuilder, PruneModes, SealedBlock, StorageEntry, H160, H256, MAINNET, U256,
     };
     use reth_provider::{AccountReader, BlockWriter, ProviderFactory, ReceiptProvider};
     use reth_revm::Factory;
@@ -894,86 +893,4 @@ mod tests {
             ]
         );
     }
-
-    #[tokio::test]
-    async fn test_prune() {
-        let test_tx = TestTransaction::default();
-        let factory = Arc::new(ProviderFactory::new(test_tx.tx.as_ref(), MAINNET.clone()));
-
-        let provider = factory.provider_rw().unwrap();
-        let input = ExecInput {
-            target: Some(1),
-            /// The progress of this stage the last time it was executed.
-            checkpoint: None,
-        };
-        let mut genesis_rlp = hex!("f901faf901f5a00000000000000000000000000000000000000000000000000000000000000000a01dcc4de8dec75d7aab85b567b6ccd41ad312451b948a7413f0a142fd40d49347942adc25665018aa1fe0e6bc666dac8fc2697ff9baa045571b40ae66ca7480791bbb2887286e4e4c4b1b298b191c889d6959023a32eda056e81f171bcc55a6ff8345e692c0f86e5b48e01b996cadc001622fb5e363b421a056e81f171bcc55a6ff8345e692c0f86e5b48e01b996cadc001622fb5e363b421b901000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000083020000808502540be400808000a00000000000000000000000000000000000000000000000000000000000000000880000000000000000c0c0").as_slice();
-        let genesis = SealedBlock::decode(&mut genesis_rlp).unwrap();
-        let mut block_rlp = hex!("f90262f901f9a075c371ba45999d87f4542326910a11af515897aebce5265d3f6acd1f1161f82fa01dcc4de8dec75d7aab85b567b6ccd41ad312451b948a7413f0a142fd40d49347942adc25665018aa1fe0e6bc666dac8fc2697ff9baa098f2dcd87c8ae4083e7017a05456c14eea4b1db2032126e27b3b1563d57d7cc0a08151d548273f6683169524b66ca9fe338b9ce42bc3540046c828fd939ae23bcba03f4e5c2ec5b2170b711d97ee755c160457bb58d8daa338e835ec02ae6860bbabb901000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000083020000018502540be40082a8798203e800a00000000000000000000000000000000000000000000000000000000000000000880000000000000000f863f861800a8405f5e10094100000000000000000000000000000000000000080801ba07e09e26678ed4fac08a249ebe8ed680bf9051a5e14ad223e4b2b9d26e0208f37a05f6e3f188e3e6eab7d7d3b6568f5eac7d687b08d307d3154ccd8c87b4630509bc0").as_slice();
-        let block = SealedBlock::decode(&mut block_rlp).unwrap();
-        provider.insert_block(genesis, None).unwrap();
-        provider.insert_block(block.clone(), None).unwrap();
-        provider.commit().unwrap();
-
-        // insert pre state
-        let provider = factory.provider_rw().unwrap();
-        let code = hex!("5a465a905090036002900360015500");
-        let code_hash = keccak256(hex!("5a465a905090036002900360015500"));
-        provider
-            .tx_ref()
-            .put::<tables::PlainAccountState>(
-                H160(hex!("1000000000000000000000000000000000000000")),
-                Account { nonce: 0, balance: U256::ZERO, bytecode_hash: Some(code_hash) },
-            )
-            .unwrap();
-        provider
-            .tx_ref()
-            .put::<tables::PlainAccountState>(
-                H160(hex!("a94f5374fce5edbc8e2a8697c15331677e6ebf0b")),
-                Account {
-                    nonce: 0,
-                    balance: U256::from(0x3635c9adc5dea00000u128),
-                    bytecode_hash: None,
-                },
-            )
-            .unwrap();
-        provider
-            .tx_ref()
-            .put::<tables::Bytecodes>(code_hash, Bytecode::new_raw(code.to_vec().into()))
-            .unwrap();
-        provider.commit().unwrap();
-
-        let check_pruning = |factory: Arc<ProviderFactory<_>>,
-                             prune_targets: PruneModes,
-                             expect_num_receipts: usize| async move {
-            let provider = factory.provider_rw().unwrap();
-
-            let mut execution_stage = ExecutionStage::new(
-                Factory::new(Arc::new(ChainSpecBuilder::mainnet().berlin_activated().build())),
-                ExecutionStageThresholds { max_blocks: Some(100), max_changes: None },
-                prune_targets,
-            );
-
-            execution_stage.execute(&provider, input).await.unwrap();
-            assert_eq!(
-                provider.receipts_by_block(1.into()).unwrap().unwrap().len(),
-                expect_num_receipts
-            );
-        };
-
-        let mut prune = PruneModes::none();
-
-        check_pruning(factory.clone(), prune, 1).await;
-
-        prune.receipts = Some(PruneMode::Full);
-        check_pruning(factory.clone(), prune, 0).await;
-
-        prune.receipts = Some(PruneMode::Before(1));
-        check_pruning(factory.clone(), prune, 1).await;
-
-        prune.receipts = Some(PruneMode::Before(2));
-        check_pruning(factory.clone(), prune, 0).await;
-
-        prune.receipts = Some(PruneMode::Distance(0));
-        check_pruning(factory.clone(), prune, 1).await;
-    }
 }