Core Benchmarking Infra (#175)

* Implement a solution for the pre-fund account limit * Update the account pre-funding handling * Fix the lighthouse node tracing issue * refactor existing dt infra * Implement the platform driver * Wire up the cleaned up driver implementation * Implement the core benchmarking components * Remove some debug logging * Fix issues in the benchmarks driver * Implement a global concurrency limit on provider requests * Update the concurrency limit * Update the concurrency limit * Cleanups * Update the lighthouse ports * Ignore certain tests * Update the new geth test
2026-07-27 12:45:52 +00:00 · 2025-10-05 18:09:01 +03:00
parent f9dc362c03
commit 74fdeb4a2e
51 changed files with 4308 additions and 1990 deletions
@@ -0,0 +1,770 @@
+use std::{
+    collections::HashMap,
+    ops::ControlFlow,
+    sync::{
+        Arc,
+        atomic::{AtomicUsize, Ordering},
+    },
+    time::Duration,
+};
+
+use alloy::{
+    hex,
+    json_abi::JsonAbi,
+    network::{Ethereum, TransactionBuilder},
+    primitives::{Address, TxHash, U256},
+    rpc::types::{
+        TransactionReceipt, TransactionRequest,
+        trace::geth::{
+            CallFrame, GethDebugBuiltInTracerType, GethDebugTracerConfig, GethDebugTracerType,
+            GethDebugTracingOptions,
+        },
+    },
+};
+use anyhow::{Context as _, Result, bail};
+use indexmap::IndexMap;
+use revive_dt_common::{
+    futures::{PollingWaitBehavior, poll},
+    types::PrivateKeyAllocator,
+};
+use revive_dt_format::{
+    metadata::{ContractInstance, ContractPathAndIdent},
+    steps::{
+        AllocateAccountStep, BalanceAssertionStep, Calldata, EtherValue, FunctionCallStep, Method,
+        RepeatStep, Step, StepAddress, StepIdx, StepPath, StorageEmptyAssertionStep,
+    },
+    traits::{ResolutionContext, ResolverApi},
+};
+use tokio::sync::{Mutex, mpsc::UnboundedSender};
+use tracing::{Instrument, Span, debug, error, field::display, info, info_span, instrument};
+
+use crate::{
+    differential_benchmarks::{ExecutionState, WatcherEvent},
+    helpers::{CachedCompiler, TestDefinition, TestPlatformInformation},
+};
+
+/// Process-wide counter from which every newly constructed [`Driver`] takes its `driver_id`
+/// (via `fetch_add(1, Ordering::SeqCst)` at each construction site).
+static DRIVER_COUNT: AtomicUsize = AtomicUsize::new(0);
+
+/// The differential benchmarks driver for a single platform.
+///
+/// A driver pulls `(StepPath, Step)` pairs from `steps_iterator` and executes them against the
+/// node found in `platform_information`, notifying the watcher through `watcher_tx` about every
+/// transaction it submits.
+pub struct Driver<'a, I> {
+    /// The id of the driver, taken from the global `DRIVER_COUNT` counter when the driver is
+    /// constructed. It is attached to the tracing spans of the driver's methods.
+    driver_id: usize,
+
+    /// The information of the platform that this driver is for.
+    platform_information: &'a TestPlatformInformation<'a>,
+
+    /// The resolver of the platform, obtained from the platform's node.
+    resolver: Arc<dyn ResolverApi + 'a>,
+
+    /// The definition of the test that the driver is instructed to execute.
+    test_definition: &'a TestDefinition<'a>,
+
+    /// The private key allocator used by this driver and other drivers when account allocations are
+    /// needed.
+    private_key_allocator: Arc<Mutex<PrivateKeyAllocator>>,
+
+    /// The execution state associated with the platform: the compiled contracts, the deployed
+    /// contracts, and the variables assigned so far.
+    execution_state: ExecutionState,
+
+    /// The send side of the watcher's unbounded channel associated with this driver.
+    watcher_tx: UnboundedSender<WatcherEvent>,
+
+    /// The number of steps that were executed on the driver.
+    steps_executed: usize,
+
+    /// This is the queue of steps that are to be executed by the driver for this test case. Each
+    /// time `execute_next_step` is called the next step is taken from it and executed.
+    steps_iterator: I,
+}
+
+impl<'a, I> Driver<'a, I>
+where
+    I: Iterator<Item = (StepPath, Step)>,
+{
+    // region:Constructors & Initialization
+    /// Creates a driver for the given platform and test definition and prepares its execution
+    /// state (contract compilation and library deployment) so that it is ready to execute steps.
+    ///
+    /// # Errors
+    ///
+    /// Fails if the node's resolver can't be created or if the execution state can't be
+    /// initialized.
+    pub async fn new(
+        platform_information: &'a TestPlatformInformation<'a>,
+        test_definition: &'a TestDefinition<'a>,
+        private_key_allocator: Arc<Mutex<PrivateKeyAllocator>>,
+        cached_compiler: &CachedCompiler<'a>,
+        watcher_tx: UnboundedSender<WatcherEvent>,
+        steps: I,
+    ) -> Result<Self> {
+        // The id is claimed before the resolver is requested, therefore an id is consumed even if
+        // the resolver creation fails.
+        let driver_id = DRIVER_COUNT.fetch_add(1, Ordering::SeqCst);
+        let resolver = platform_information
+            .node
+            .resolver()
+            .await
+            .context("Failed to create resolver")?;
+
+        let mut driver = Self {
+            driver_id,
+            platform_information,
+            resolver,
+            test_definition,
+            private_key_allocator,
+            execution_state: ExecutionState::empty(),
+            watcher_tx,
+            steps_executed: 0,
+            steps_iterator: steps,
+        };
+        driver
+            .init_execution_state(cached_compiler)
+            .await
+            .context("Failed to initialize the execution state of the platform")?;
+
+        Ok(driver)
+    }
+
+    /// Initializes `self.execution_state` for the test.
+    ///
+    /// This is done in three phases:
+    /// 1. The contracts are compiled without any library addresses (pre-linking).
+    /// 2. Every library instance listed in the metadata is deployed through a transaction.
+    /// 3. The contracts are compiled again, this time with the deployed libraries (post-linking).
+    ///
+    /// On success the execution state holds the post-linking contracts and the deployed libraries.
+    ///
+    /// # Errors
+    ///
+    /// Fails if either compilation fails, if the contract sources can't be read from the metadata,
+    /// if the code of a library can't be found or hex-decoded, if a library deployment transaction
+    /// fails, or if a library deployment receipt carries no contract address.
+    async fn init_execution_state(&mut self, cached_compiler: &CachedCompiler<'a>) -> Result<()> {
+        let compiler_output = cached_compiler
+            .compile_contracts(
+                self.test_definition.metadata,
+                self.test_definition.metadata_file_path,
+                self.test_definition.mode.clone(),
+                None,
+                self.platform_information.compiler.as_ref(),
+                self.platform_information.platform,
+                &self.platform_information.reporter,
+            )
+            .await
+            .inspect_err(|err| {
+                error!(
+                    ?err,
+                    platform_identifier = %self.platform_information.platform.platform_identifier(),
+                    "Pre-linking compilation failed"
+                )
+            })
+            .context("Failed to produce the pre-linking compiled contracts")?;
+
+        let mut deployed_libraries = None::<HashMap<_, _>>;
+        let mut contract_sources = self
+            .test_definition
+            .metadata
+            .contract_sources()
+            .inspect_err(|err| {
+                error!(
+                    ?err,
+                    platform_identifier = %self.platform_information.platform.platform_identifier(),
+                    "Failed to retrieve contract sources from metadata"
+                )
+            })
+            .context("Failed to get the contract instances from the metadata file")?;
+
+        // Getting the deployer address from the cases themselves. This is to ensure
+        // that we're doing the deployments from different accounts and therefore we're
+        // not slowed down by the nonce. The address only depends on the steps of the case, so
+        // it's computed once rather than once per library.
+        let deployer_address = self
+            .test_definition
+            .case
+            .steps
+            .iter()
+            .find_map(|step| match step {
+                Step::FunctionCall(input) => input.caller.as_address().copied(),
+                Step::BalanceAssertion(..)
+                | Step::StorageEmptyAssertion(..)
+                | Step::Repeat(..)
+                | Step::AllocateAccount(..) => None,
+            })
+            .unwrap_or_else(FunctionCallStep::default_caller_address);
+
+        for library_instance in self
+            .test_definition
+            .metadata
+            .libraries
+            .iter()
+            .flatten()
+            .flat_map(|(_, map)| map.values())
+        {
+            debug!(%library_instance, "Deploying Library Instance");
+
+            let ContractPathAndIdent {
+                contract_source_path: library_source_path,
+                contract_ident: library_ident,
+            } = contract_sources
+                .remove(library_instance)
+                .context("Failed to get the contract sources of the contract instance")?;
+
+            let (code, abi) = compiler_output
+                .contracts
+                .get(&library_source_path)
+                .and_then(|contracts| contracts.get(library_ident.as_str()))
+                .context("Failed to get the code and abi for the instance")?;
+
+            let code = alloy::hex::decode(code)
+                .context("Failed to hex-decode the byte code of the library")?;
+
+            let tx = TransactionBuilder::<Ethereum>::with_deploy_code(
+                TransactionRequest::default().from(deployer_address),
+                code,
+            );
+            let receipt = self.execute_transaction(tx).await.inspect_err(|err| {
+                error!(
+                    ?err,
+                    %library_instance,
+                    platform_identifier = %self.platform_information.platform.platform_identifier(),
+                    "Failed to deploy the library"
+                )
+            })?;
+
+            debug!(
+                ?library_instance,
+                platform_identifier = %self.platform_information.platform.platform_identifier(),
+                "Deployed library"
+            );
+
+            // A receipt without a contract address is reported as an error instead of a panic so
+            // that a misbehaving node fails this test rather than aborting the whole process.
+            let library_address = receipt
+                .contract_address
+                .context("Failed to deploy the library: the receipt has no contract address")?;
+
+            deployed_libraries.get_or_insert_default().insert(
+                library_instance.clone(),
+                (library_ident.clone(), library_address, abi.clone()),
+            );
+        }
+
+        let compiler_output = cached_compiler
+            .compile_contracts(
+                self.test_definition.metadata,
+                self.test_definition.metadata_file_path,
+                self.test_definition.mode.clone(),
+                deployed_libraries.as_ref(),
+                self.platform_information.compiler.as_ref(),
+                self.platform_information.platform,
+                &self.platform_information.reporter,
+            )
+            .await
+            .inspect_err(|err| {
+                error!(
+                    ?err,
+                    platform_identifier = %self.platform_information.platform.platform_identifier(),
+                    "Post-linking compilation failed"
+                )
+            })
+            .context("Failed to compile the post-link contracts")?;
+
+        self.execution_state = ExecutionState::new(
+            compiler_output.contracts,
+            deployed_libraries.unwrap_or_default(),
+        );
+
+        Ok(())
+    }
+    // endregion:Constructors & Initialization
+
+    // region:Step Handling
+    /// Consumes the driver and executes its steps one after the other until the steps iterator is
+    /// exhausted, stopping at the first step that fails.
+    ///
+    /// Returns the number of steps counted in `steps_executed`.
+    pub async fn execute_all(mut self) -> Result<usize> {
+        loop {
+            match self.execute_next_step().await {
+                Some(outcome) => outcome?,
+                None => break,
+            }
+        }
+        Ok(self.steps_executed)
+    }
+
+    /// Takes the next step off the steps iterator and executes it, logging the outcome.
+    ///
+    /// Returns `None` when there are no more steps, otherwise the result of the executed step.
+    pub async fn execute_next_step(&mut self) -> Option<Result<()>> {
+        let (step_path, step) = self.steps_iterator.next()?;
+        info!(%step_path, "Executing Step");
+
+        let outcome = self.execute_step(&step_path, &step).await;
+        match &outcome {
+            Ok(()) => info!(%step_path, "Step execution succeeded"),
+            Err(err) => error!(%step_path, ?err, "Step execution failed"),
+        }
+        Some(outcome)
+    }
+
+    /// Dispatches a single step to its handler and adds the number of steps the handler reports to
+    /// `steps_executed`.
+    ///
+    /// Balance and storage-empty assertions are not executed by this driver and count as zero
+    /// steps.
+    #[instrument(
+        level = "info",
+        skip_all,
+        fields(
+            driver_id = self.driver_id,
+            platform_identifier = %self.platform_information.platform.platform_identifier(),
+            %step_path,
+        ),
+        err(Debug),
+    )]
+    async fn execute_step(&mut self, step_path: &StepPath, step: &Step) -> Result<()> {
+        let executed = match step {
+            // The following steps are disabled in the benchmarking driver.
+            Step::BalanceAssertion(..) | Step::StorageEmptyAssertion(..) => 0,
+            Step::FunctionCall(call) => self
+                .execute_function_call(step_path, call.as_ref())
+                .await
+                .context("Function call step Failed")?,
+            Step::Repeat(repeat) => self
+                .execute_repeat_step(step_path, repeat.as_ref())
+                .await
+                .context("Repetition Step Failed")?,
+            Step::AllocateAccount(allocation) => self
+                .execute_account_allocation(step_path, allocation.as_ref())
+                .await
+                .context("Account Allocation Step Failed")?,
+        };
+        self.steps_executed += executed;
+        Ok(())
+    }
+
+    /// Executes a function call step in four phases: deploying the contracts the step refers to,
+    /// executing the call itself, tracing the resulting transaction, and finally assigning the
+    /// variables the step asks for from the traced output.
+    ///
+    /// Returns `1` as the number of steps executed.
+    #[instrument(level = "info", skip_all, fields(driver_id = self.driver_id))]
+    pub async fn execute_function_call(
+        &mut self,
+        _: &StepPath,
+        step: &FunctionCallStep,
+    ) -> Result<usize> {
+        let receipts_of_deployments = self
+            .handle_function_call_contract_deployment(step)
+            .await
+            .context("Failed to deploy contracts for the function call step")?;
+
+        let receipt = self
+            .handle_function_call_execution(step, receipts_of_deployments)
+            .await
+            .context("Failed to handle the function call execution")?;
+
+        let call_frame = self
+            .handle_function_call_call_frame_tracing(receipt.transaction_hash)
+            .await
+            .context("Failed to handle the function call call frame tracing")?;
+
+        self.handle_function_call_variable_assignment(step, &call_frame)
+            .await
+            .context("Failed to handle function call variable assignment")?;
+
+        Ok(1)
+    }
+
+    /// Deploys every contract instance referenced by the step that isn't deployed yet.
+    ///
+    /// When the step's method is `Method::Deployer` the step's own instance is always deployed,
+    /// and it's the only instance that is deployed with the step's calldata and value.
+    ///
+    /// Returns the receipts of the deployments that were performed, keyed by contract instance.
+    async fn handle_function_call_contract_deployment(
+        &mut self,
+        step: &FunctionCallStep,
+    ) -> Result<HashMap<ContractInstance, TransactionReceipt>> {
+        // Maps each instance to deploy to whether it's deployed with the constructor arguments.
+        let mut pending = IndexMap::<ContractInstance, bool>::new();
+        for instance in step.find_all_contract_instances().into_iter() {
+            let already_deployed = self
+                .execution_state
+                .deployed_contracts
+                .contains_key(&instance);
+            if already_deployed {
+                continue;
+            }
+            pending.entry(instance).or_insert(false);
+        }
+        if let Method::Deployer = step.method {
+            pending.swap_remove(&step.instance);
+            pending.insert(step.instance.clone(), true);
+        }
+
+        let mut receipts = HashMap::new();
+        for (instance, with_constructor_arguments) in pending.into_iter() {
+            let (calldata, value) = if with_constructor_arguments {
+                (Some(&step.calldata), step.value)
+            } else {
+                (None, None)
+            };
+
+            let context = self.default_resolution_context();
+            let caller = step
+                .caller
+                .resolve_address(self.resolver.as_ref(), context)
+                .await?;
+
+            let (_, _, receipt) = self
+                .get_or_deploy_contract_instance(&instance, caller, calldata, value)
+                .await
+                .context("Failed to get or deploy contract instance during input execution")?;
+            if let Some(receipt) = receipt {
+                receipts.insert(instance, receipt);
+            }
+        }
+
+        Ok(receipts)
+    }
+
+    /// Produces the receipt of the step's transaction.
+    ///
+    /// For `Method::Deployer` no new transaction is submitted: the receipt of the deployment that
+    /// was done in the contract deployment phase is taken out of `deployment_receipts`. For all
+    /// other methods the step is turned into a transaction which is then executed.
+    async fn handle_function_call_execution(
+        &mut self,
+        step: &FunctionCallStep,
+        mut deployment_receipts: HashMap<ContractInstance, TransactionReceipt>,
+    ) -> Result<TransactionReceipt> {
+        match step.method {
+            Method::Fallback | Method::FunctionName(_) => {
+                let context = self.default_resolution_context();
+                let transaction = step
+                    .as_transaction(self.resolver.as_ref(), context)
+                    .await?;
+                self.execute_transaction(transaction).await
+            }
+            // The constructor call already happened when the contracts of this step were
+            // deployed. We just need to lookup the transaction receipt in this case.
+            Method::Deployer => {
+                let receipt = deployment_receipts.remove(&step.instance);
+                receipt.context("Failed to find deployment receipt for constructor call")
+            }
+        }
+    }
+
+    /// Asks the node for a call-tracer trace of the transaction and returns its call frame.
+    ///
+    /// # Panics
+    ///
+    /// Panics if the node returns a trace that can't be converted into a call frame.
+    async fn handle_function_call_call_frame_tracing(
+        &mut self,
+        tx_hash: TxHash,
+    ) -> Result<CallFrame> {
+        let tracer = GethDebugTracerType::BuiltInTracer(GethDebugBuiltInTracerType::CallTracer);
+        let tracer_config = GethDebugTracerConfig(serde_json::json!({
+            "onlyTopCall": true,
+            "withLog": false,
+            "withStorage": false,
+            "withMemory": false,
+            "withStack": false,
+            "withReturnData": true
+        }));
+        let options = GethDebugTracingOptions {
+            tracer: Some(tracer),
+            tracer_config,
+            ..Default::default()
+        };
+
+        let trace = self
+            .platform_information
+            .node
+            .trace_transaction(tx_hash, options)
+            .await?;
+        Ok(trace
+            .try_into_call_frame()
+            .expect("Impossible - we requested a callframe trace so we must get it back"))
+    }
+
+    /// Stores the return data of the traced call into the variables named by the step.
+    ///
+    /// The output of the call frame is split into 32-byte words and the i-th word is assigned to
+    /// the i-th name in `return_data`. Names without a matching word (and words without a matching
+    /// name) are skipped. A step with no variable assignments is a no-op.
+    async fn handle_function_call_variable_assignment(
+        &mut self,
+        step: &FunctionCallStep,
+        tracing_result: &CallFrame,
+    ) -> Result<()> {
+        let assignments = match step.variable_assignments {
+            Some(ref assignments) => assignments,
+            None => return Ok(()),
+        };
+
+        // Handling the return data variable assignments.
+        let output_bytes = tracing_result
+            .output
+            .as_ref()
+            .unwrap_or_default()
+            .to_vec();
+        let output_words = output_bytes.chunks(32);
+        for (variable_name, output_word) in assignments.return_data.iter().zip(output_words) {
+            let value = U256::from_be_slice(output_word);
+            self.execution_state
+                .variables
+                .insert(variable_name.clone(), value);
+            tracing::info!(
+                variable_name,
+                variable_value = hex::encode(value.to_be_bytes::<32>()),
+                "Assigned variable"
+            );
+        }
+
+        Ok(())
+    }
+
+    /// Balance assertion handler of the benchmark driver, which performs no assertion at all and
+    /// always reports one executed step.
+    ///
+    /// Note that `execute_step` doesn't dispatch to this method: it counts balance assertion
+    /// steps as zero executed steps.
+    #[instrument(level = "info", skip_all, fields(driver_id = self.driver_id))]
+    pub async fn execute_balance_assertion(
+        &mut self,
+        _: &StepPath,
+        _: &BalanceAssertionStep,
+    ) -> anyhow::Result<usize> {
+        // Kept empty intentionally for the benchmark driver.
+        Ok(1)
+    }
+
+    /// Storage-empty assertion handler of the benchmark driver, which performs no assertion at
+    /// all and always reports one executed step.
+    ///
+    /// Note that `execute_step` doesn't dispatch to this method: it counts storage-empty
+    /// assertion steps as zero executed steps.
+    #[instrument(level = "info", skip_all, fields(driver_id = self.driver_id), err(Debug))]
+    async fn execute_storage_empty_assertion_step(
+        &mut self,
+        _: &StepPath,
+        _: &StorageEmptyAssertionStep,
+    ) -> Result<usize> {
+        // Kept empty intentionally for the benchmark driver.
+        Ok(1)
+    }
+
+    /// Executes a repeat step by creating `step.repeat` child drivers, each of which runs all of
+    /// the sub-steps of the repeat step, and driving them together through `try_join_all`.
+    ///
+    /// Every child driver gets its own `driver_id`, a clone of this driver's execution state, and
+    /// its own copy of the sub-steps whose paths are `step_path` with the sub-step index appended.
+    /// Nothing from the children's execution state is written back to `self` here.
+    ///
+    /// Returns the sum of the steps executed by all of the child drivers.
+    ///
+    /// # Errors
+    ///
+    /// Fails if the repetition start event can't be sent to the watcher or if any of the child
+    /// drivers fails.
+    #[instrument(level = "info", skip_all, fields(driver_id = self.driver_id), err(Debug))]
+    async fn execute_repeat_step(
+        &mut self,
+        step_path: &StepPath,
+        step: &RepeatStep,
+    ) -> Result<usize> {
+        // This iterator is lazy: the child drivers (and their futures) only get created when
+        // `try_join_all` consumes it below, which is after the watcher has been notified.
+        let tasks = (0..step.repeat)
+            .map(|_| Driver {
+                driver_id: DRIVER_COUNT.fetch_add(1, Ordering::SeqCst),
+                platform_information: self.platform_information,
+                resolver: self.resolver.clone(),
+                test_definition: self.test_definition,
+                private_key_allocator: self.private_key_allocator.clone(),
+                execution_state: self.execution_state.clone(),
+                steps_executed: 0,
+                steps_iterator: {
+                    // The sub-steps are collected into an owned vector so that each child driver
+                    // has its own iterator over them.
+                    let steps = step
+                        .steps
+                        .iter()
+                        .cloned()
+                        .enumerate()
+                        .map(|(step_idx, step)| {
+                            let step_idx = StepIdx::new(step_idx);
+                            let step_path = step_path.append(step_idx);
+                            (step_path, step)
+                        })
+                        .collect::<Vec<_>>();
+                    steps.into_iter()
+                },
+                watcher_tx: self.watcher_tx.clone(),
+            })
+            .map(|driver| driver.execute_all());
+
+        // TODO: Determine how we want to know the `ignore_block_before` and if it's through the
+        // receipt and how this would impact the architecture and the possibility of us not waiting
+        // for receipts in the future.
+        self.watcher_tx
+            .send(WatcherEvent::RepetitionStartEvent {
+                ignore_block_before: 0,
+            })
+            .context("Failed to send message on the watcher's tx")?;
+
+        // Resolves to an error as soon as one of the child drivers fails.
+        let res = futures::future::try_join_all(tasks)
+            .await
+            .context("Repetition execution failed")?;
+        Ok(res.into_iter().sum())
+    }
+
+    /// Allocates a new account through the shared private key allocator and stores its address in
+    /// the variable named by the step.
+    ///
+    /// The step's variable name must start with `$VARIABLE:`; the remainder is used as the key
+    /// under which the address is stored. Returns `1` as the number of steps executed.
+    #[instrument(level = "info", fields(driver_id = self.driver_id), skip_all, err(Debug))]
+    pub async fn execute_account_allocation(
+        &mut self,
+        _: &StepPath,
+        step: &AllocateAccountStep,
+    ) -> Result<usize> {
+        let variable_name = match step.variable_name.strip_prefix("$VARIABLE:") {
+            Some(name) => name,
+            None => bail!("Account allocation must start with $VARIABLE:"),
+        };
+
+        let private_key = self
+            .private_key_allocator
+            .lock()
+            .await
+            .allocate()
+            .context("Account allocation through the private key allocator failed")?;
+        let address_as_word = U256::from_be_slice(private_key.address().0.as_slice());
+
+        self.execution_state
+            .variables
+            .insert(variable_name.to_string(), address_as_word);
+
+        Ok(1)
+    }
+    // endregion:Step Handling
+
+    // region:Contract Deployment
+    /// Returns the address and ABI of the contract instance, deploying it first if it hasn't been
+    /// deployed yet.
+    ///
+    /// The third element of the returned tuple is the deployment receipt, which is only `Some`
+    /// when this call performed the deployment.
+    #[instrument(
+        level = "info",
+        skip_all,
+        fields(
+            driver_id = self.driver_id,
+            platform_identifier = %self.platform_information.platform.platform_identifier(),
+            %contract_instance,
+            %deployer
+        ),
+        err(Debug),
+    )]
+    async fn get_or_deploy_contract_instance(
+        &mut self,
+        contract_instance: &ContractInstance,
+        deployer: Address,
+        calldata: Option<&Calldata>,
+        value: Option<EtherValue>,
+    ) -> Result<(Address, JsonAbi, Option<TransactionReceipt>)> {
+        let existing = self
+            .execution_state
+            .deployed_contracts
+            .get(contract_instance)
+            .map(|(_, address, abi)| (*address, abi.clone()));
+
+        match existing {
+            Some((address, abi)) => {
+                info!(%address, "Contract instance already deployed.");
+                Ok((address, abi, None))
+            }
+            None => {
+                info!("Contract instance requires deployment.");
+                let (address, abi, receipt) = self
+                    .deploy_contract(contract_instance, deployer, calldata, value)
+                    .await
+                    .context("Failed to deploy contract")?;
+                info!(%address, "Contract instance has been deployed.");
+                Ok((address, abi, Some(receipt)))
+            }
+        }
+    }
+
+    /// Deploys the contract instance from the `deployer` account and records it in the execution
+    /// state.
+    ///
+    /// The deployment code is the hex-decoded compiled code of the contract followed by the
+    /// encoded `calldata` (if any). `value`, if given, is attached to the deployment transaction.
+    /// The deployment is also reported through the platform's reporter.
+    ///
+    /// Returns the address of the deployed contract, its ABI, and the deployment receipt.
+    ///
+    /// # Errors
+    ///
+    /// Fails if the contract's source or compiled code can't be found, if the code isn't valid
+    /// hex, if the calldata can't be encoded, if the transaction fails, if the receipt has no
+    /// contract address, or if the deployment can't be reported.
+    #[instrument(
+        level = "info",
+        skip_all,
+        fields(
+            driver_id = self.driver_id,
+            platform_identifier = %self.platform_information.platform.platform_identifier(),
+            %contract_instance,
+            %deployer
+        ),
+        err(Debug),
+    )]
+    async fn deploy_contract(
+        &mut self,
+        contract_instance: &ContractInstance,
+        deployer: Address,
+        calldata: Option<&Calldata>,
+        value: Option<EtherValue>,
+    ) -> Result<(Address, JsonAbi, TransactionReceipt)> {
+        let mut contract_sources = self.test_definition.metadata.contract_sources()?;
+        let Some(ContractPathAndIdent {
+            contract_source_path,
+            contract_ident,
+        }) = contract_sources.remove(contract_instance)
+        else {
+            bail!(
+                "Contract source not found for instance {:?}",
+                contract_instance
+            )
+        };
+
+        let compiled = self
+            .execution_state
+            .compiled_contracts
+            .get(&contract_source_path)
+            .and_then(|source_file_contracts| source_file_contracts.get(contract_ident.as_ref()))
+            .cloned();
+        let Some((code, abi)) = compiled else {
+            bail!(
+                "Failed to find information for contract {:?}",
+                contract_instance
+            )
+        };
+
+        let mut code = match alloy::hex::decode(&code) {
+            Err(error) => {
+                tracing::error!(
+                    ?error,
+                    contract_source_path = contract_source_path.display().to_string(),
+                    contract_ident = contract_ident.as_ref(),
+                    "Failed to hex-decode byte code - This could possibly mean that the bytecode requires linking"
+                );
+                bail!("Failed to hex-decode the byte code {}", error)
+            }
+            Ok(decoded) => decoded,
+        };
+
+        // The constructor arguments are appended to the deployment code.
+        if let Some(calldata) = calldata {
+            let context = self.default_resolution_context();
+            let encoded_arguments = calldata.calldata(self.resolver.as_ref(), context).await?;
+            code.extend(encoded_arguments);
+        }
+
+        let mut request = TransactionRequest::default().from(deployer);
+        if let Some(value) = value {
+            request = request.value(value.into_inner());
+        }
+        let tx = TransactionBuilder::<Ethereum>::with_deploy_code(request, code);
+
+        let receipt = self.execute_transaction(tx).await.inspect_err(|error| {
+            tracing::error!(?error, "Contract deployment transaction failed.")
+        })?;
+
+        let address = match receipt.contract_address {
+            Some(address) => address,
+            None => bail!("Contract deployment didn't return an address"),
+        };
+        tracing::info!(
+            instance_name = ?contract_instance,
+            instance_address = ?address,
+            "Deployed contract"
+        );
+        self.platform_information
+            .reporter
+            .report_contract_deployed_event(contract_instance.clone(), address)?;
+
+        let deployed_entry = (contract_ident, address, abi.clone());
+        self.execution_state
+            .deployed_contracts
+            .insert(contract_instance.clone(), deployed_entry);
+
+        Ok((address, abi, receipt))
+    }
+
+    /// Turns a step address into a concrete address.
+    ///
+    /// A literal address is returned as is. A resolvable address must be of the form
+    /// `<instance>.address`; the instance is deployed from the default caller address, without
+    /// calldata or value, if it isn't deployed already, and its address is returned.
+    #[instrument(level = "info", fields(driver_id = self.driver_id), skip_all)]
+    async fn step_address_auto_deployment(
+        &mut self,
+        step_address: &StepAddress,
+    ) -> Result<Address> {
+        let resolvable = match step_address {
+            StepAddress::Address(address) => return Ok(*address),
+            StepAddress::ResolvableAddress(resolvable) => resolvable,
+        };
+
+        let Some(instance_name) = resolvable.strip_suffix(".address") else {
+            bail!("Not an address variable");
+        };
+        let instance = ContractInstance::new(instance_name);
+
+        let (address, _, _) = self
+            .get_or_deploy_contract_instance(
+                &instance,
+                FunctionCallStep::default_caller_address(),
+                None,
+                None,
+            )
+            .await?;
+        Ok(address)
+    }
+    // endregion:Contract Deployment
+
+    // region:Resolution & Resolver
+    /// Builds the resolution context used throughout the driver: the default context extended
+    /// with the deployed contracts and the variables of the current execution state.
+    fn default_resolution_context(&self) -> ResolutionContext<'_> {
+        let state = &self.execution_state;
+        let context = ResolutionContext::default();
+        let context = context.with_deployed_contracts(&state.deployed_contracts);
+        context.with_variables(&state.variables)
+    }
+    // endregion:Resolution & Resolver
+
+    // region:Transaction Execution
+    /// Submits the transaction to the driver's node, tells the watcher about the submitted
+    /// transaction hash, and then polls the node for the receipt.
+    ///
+    /// The receipt is polled for once per second for up to 30 minutes. Any error from fetching the
+    /// receipt is treated as "no receipt yet" and leads to another polling attempt.
+    #[instrument(
+        level = "info",
+        skip_all,
+        fields(driver_id = self.driver_id, transaction_hash = tracing::field::Empty)
+    )]
+    async fn execute_transaction(
+        &self,
+        transaction: TransactionRequest,
+    ) -> anyhow::Result<TransactionReceipt> {
+        let node = self.platform_information.node;
+
+        let transaction_hash = node
+            .submit_transaction(transaction)
+            .await
+            .context("Failed to submit transaction")?;
+        Span::current().record("transaction_hash", display(transaction_hash));
+        info!("Submitted transaction");
+
+        let submitted_event = WatcherEvent::SubmittedTransaction { transaction_hash };
+        self.watcher_tx
+            .send(submitted_event)
+            .context("Failed to send the transaction hash to the watcher")?;
+
+        info!("Starting to poll for transaction receipt");
+        let timeout = Duration::from_secs(30 * 60);
+        let wait_behavior = PollingWaitBehavior::Constant(Duration::from_secs(1));
+        poll(timeout, wait_behavior, || {
+            async move {
+                match node.get_receipt(transaction_hash).await {
+                    Err(_) => Ok(ControlFlow::Continue(())),
+                    Ok(receipt) => {
+                        info!("Polling succeeded, receipt found");
+                        Ok(ControlFlow::Break(receipt))
+                    }
+                }
+            }
+            .instrument(info_span!("Polling for receipt"))
+        })
+        .await
+    }
+    // endregion:Transaction Execution
+}
@@ -0,0 +1,177 @@
+//! The main entry point for differential benchmarking.
+
+use std::{collections::BTreeMap, sync::Arc};
+
+use anyhow::Context as _;
+use futures::{FutureExt, StreamExt};
+use revive_dt_common::types::PrivateKeyAllocator;
+use revive_dt_core::Platform;
+use revive_dt_format::steps::{Step, StepIdx, StepPath};
+use tokio::sync::Mutex;
+use tracing::{error, info, info_span, instrument, warn};
+
+use revive_dt_config::{BenchmarkingContext, Context};
+use revive_dt_report::Reporter;
+
+use crate::{
+    differential_benchmarks::{Driver, Watcher, WatcherEvent},
+    helpers::{CachedCompiler, NodePool, collect_metadata_files, create_test_definitions_stream},
+};
+
+/// Handles the differential benchmarks, executing them according to the information defined in the
+/// context.
+///
+/// The number of nodes in the context is forced to one, the nodes of every platform of the context
+/// are started, and the workloads are then executed one at a time, platform by platform, with a
+/// new [`Watcher`] and a new [`Driver`] for each workload.
+///
+/// # Errors
+///
+/// Returns an error if the metadata files can't be collected, if a node pool or the cached
+/// compiler can't be initialized, or as soon as one of the workloads fails, in which case the
+/// remaining workloads are not executed.
+#[instrument(level = "info", err(Debug), skip_all)]
+pub async fn handle_differential_benchmarks(
+    mut context: BenchmarkingContext,
+    reporter: Reporter,
+) -> anyhow::Result<()> {
+    // Needed for attaching spans to futures through `.instrument(..)` further down.
+    use tracing::Instrument as _;
+
+    // A bit of a hack but we need to override the number of nodes specified through the CLI since
+    // benchmarks can only be run on a single node. Perhaps in the future we'd have a cleaner way to
+    // do this. But, for the time being, we need to override the cli arguments.
+    if context.concurrency_configuration.number_of_nodes != 1 {
+        warn!(
+            specified_number_of_nodes = context.concurrency_configuration.number_of_nodes,
+            updated_number_of_nodes = 1,
+            "Invalid number of nodes specified through the CLI. Benchmarks can only be run on a single node. Updated the arguments."
+        );
+        context.concurrency_configuration.number_of_nodes = 1;
+    };
+    let full_context = Context::Benchmark(Box::new(context.clone()));
+
+    // Discover all of the metadata files that are defined in the context.
+    let metadata_files = collect_metadata_files(&context)
+        .context("Failed to collect metadata files for differential benchmarks")?;
+    info!(len = metadata_files.len(), "Discovered metadata files");
+
+    // Discover the list of platforms that the tests should run on based on the context.
+    let platforms = context
+        .platforms
+        .iter()
+        .copied()
+        .map(Into::<&dyn Platform>::into)
+        .collect::<Vec<_>>();
+
+    // Starting the nodes of the various platforms specified in the context. Note that we use the
+    // node pool since it contains all of the code needed to spawn nodes from A to Z and therefore
+    // it's the preferred way for us to start nodes even when we're starting just a single node. The
+    // added overhead from it is quite small (performance wise) since it's involved only when we're
+    // creating the test definitions, but it might have other maintenance overhead as it obscures
+    // the fact that only a single node is spawned.
+    let platforms_and_nodes = {
+        let mut map = BTreeMap::new();
+
+        for platform in platforms.iter() {
+            let platform_identifier = platform.platform_identifier();
+
+            let node_pool = NodePool::new(full_context.clone(), *platform)
+                .await
+                .inspect_err(|err| {
+                    error!(
+                        ?err,
+                        %platform_identifier,
+                        "Failed to initialize the node pool for the platform."
+                    )
+                })
+                .context("Failed to initialize the node pool")?;
+
+            map.insert(platform_identifier, (*platform, node_pool));
+        }
+
+        map
+    };
+    info!("Spawned the platform nodes");
+
+    // Preparing test definitions for the execution.
+    let test_definitions = create_test_definitions_stream(
+        &full_context,
+        metadata_files.iter(),
+        &platforms_and_nodes,
+        reporter.clone(),
+    )
+    .await
+    .collect::<Vec<_>>()
+    .await;
+    info!(len = test_definitions.len(), "Created test definitions");
+
+    // Creating the objects that will be shared between the various runs. The cached compiler is the
+    // only one at the current moment of time that's safe to share between runs.
+    let cached_compiler = CachedCompiler::new(
+        context
+            .working_directory
+            .as_path()
+            .join("compilation_cache"),
+        context
+            .compilation_configuration
+            .invalidate_compilation_cache,
+    )
+    .await
+    .map(Arc::new)
+    .context("Failed to initialize cached compiler")?;
+
+    // Note: we do not want to run all of the workloads concurrently on all platforms. Rather, we'd
+    // like to run all of the workloads for one platform, and then the next sequentially as we'd
+    // like for the effect of concurrency to be minimized when we're doing the benchmarking.
+    for platform in platforms.iter() {
+        let platform_identifier = platform.platform_identifier();
+        let platform_span = info_span!("Benchmarking for the platform", %platform_identifier);
+
+        // The spans are attached to the futures instead of being entered through a guard: a guard
+        // that is held across an `.await` keeps the span entered while the future is suspended,
+        // which the `tracing` documentation warns produces incorrect traces.
+        async {
+            for test_definition in test_definitions.iter() {
+                // Created while the platform future is being polled so that the platform span
+                // is the parent of the workload span.
+                let workload_span = info_span!(
+                    "Executing workload",
+                    metadata_file_path = %test_definition.metadata_file_path.display(),
+                    case_idx = %test_definition.case_idx,
+                    mode = %test_definition.mode,
+                );
+
+                async {
+                    let platform_information = &test_definition.platforms[&platform_identifier];
+
+                    // Initializing all of the components required to execute this particular
+                    // workload.
+                    let private_key_allocator = Arc::new(Mutex::new(PrivateKeyAllocator::new(
+                        context.wallet_configuration.highest_private_key_exclusive(),
+                    )));
+                    let (watcher, watcher_tx) = Watcher::new(
+                        platform_identifier,
+                        platform_information
+                            .node
+                            .subscribe_to_full_blocks_information()
+                            .await
+                            .context(
+                                "Failed to subscribe to full blocks information from the node",
+                            )?,
+                    );
+                    let driver = Driver::new(
+                        platform_information,
+                        test_definition,
+                        private_key_allocator,
+                        cached_compiler.as_ref(),
+                        watcher_tx.clone(),
+                        test_definition
+                            .case
+                            .steps_iterator_for_benchmarks(context.default_repetition_count)
+                            .enumerate()
+                            .map(|(step_idx, step)| -> (StepPath, Step) {
+                                (StepPath::new(vec![StepIdx::new(step_idx)]), step)
+                            }),
+                    )
+                    .await
+                    .context("Failed to create the benchmarks driver")?;
+
+                    futures::future::try_join(
+                        watcher.run(),
+                        driver.execute_all().inspect(|_| {
+                            info!("All transactions submitted - driver completed execution");
+                            // The send can only fail if the watcher has already dropped its
+                            // receiver, at which point there's nobody left to notify and
+                            // panicking would only hide the outcome of the driver.
+                            if let Err(error) =
+                                watcher_tx.send(WatcherEvent::AllTransactionsSubmitted)
+                            {
+                                warn!(
+                                    ?error,
+                                    "Failed to inform the watcher that all transactions were submitted"
+                                );
+                            }
+                        }),
+                    )
+                    .await
+                    .context("Failed to run the driver and executor")
+                    .inspect(|(_, steps_executed)| {
+                        info!(steps_executed, "Workload Execution Succeeded")
+                    })
+                    .inspect_err(|err| error!(?err, "Workload Execution Failed"))?;
+
+                    Ok::<(), anyhow::Error>(())
+                }
+                .instrument(workload_span)
+                .await?;
+            }
+
+            Ok::<(), anyhow::Error>(())
+        }
+        .instrument(platform_span)
+        .await?;
+    }
+
+    Ok(())
+}
@@ -0,0 +1,43 @@
+use std::{collections::HashMap, path::PathBuf};
+
+use alloy::{
+    json_abi::JsonAbi,
+    primitives::{Address, U256},
+};
+
+use revive_dt_format::metadata::{ContractIdent, ContractInstance};
+
+#[derive(Clone)]
+/// The state associated with the execution of one of the benchmark workloads.
+pub struct ExecutionState {
+    /// The compiled contracts, these contracts have been compiled and have had the libraries linked
+    /// against them and therefore they're ready to be deployed on-demand. The outer map is keyed by
+    /// a path. NOTE(review): the inner `String` key and the `(String, JsonAbi)` value are
+    /// presumably the contract name and its (code, ABI) pair - confirm against the compiler output.
+    pub compiled_contracts: HashMap<PathBuf, HashMap<String, (String, JsonAbi)>>,
+
+    /// A map of all of the deployed contracts, keyed by contract instance, and the identifier,
+    /// address, and ABI stored for each one of them.
+    pub deployed_contracts: HashMap<ContractInstance, (ContractIdent, Address, JsonAbi)>,
+
+    /// This map stores the variables used for each one of the cases contained in the metadata file.
+    /// The key is a string (presumably the name of the variable) and the value is a `U256`.
+    pub variables: HashMap<String, U256>,
+}
+
+impl ExecutionState {
+    /// Creates an execution state that holds the provided compiled and deployed contracts and that
+    /// starts out with no variables.
+    pub fn new(
+        compiled_contracts: HashMap<PathBuf, HashMap<String, (String, JsonAbi)>>,
+        deployed_contracts: HashMap<ContractInstance, (ContractIdent, Address, JsonAbi)>,
+    ) -> Self {
+        let variables = HashMap::new();
+        Self {
+            compiled_contracts,
+            deployed_contracts,
+            variables,
+        }
+    }
+
+    /// Creates an execution state that has no compiled contracts, no deployed contracts, and no
+    /// variables.
+    pub fn empty() -> Self {
+        Self::new(HashMap::new(), HashMap::new())
+    }
+}
@@ -0,0 +1,9 @@
+mod driver;
+mod entry_point;
+mod execution_state;
+mod watcher;
+
+pub use driver::*;
+pub use entry_point::*;
+pub use execution_state::*;
+pub use watcher::*;
@@ -0,0 +1,207 @@
+use std::{collections::HashSet, pin::Pin, sync::Arc};
+
+use alloy::primitives::{BlockNumber, TxHash};
+use anyhow::Result;
+use futures::{Stream, StreamExt};
+use revive_dt_common::types::PlatformIdentifier;
+use revive_dt_node_interaction::MinedBlockInformation;
+use tokio::sync::{
+    RwLock,
+    mpsc::{UnboundedReceiver, UnboundedSender, unbounded_channel},
+};
+use tracing::{info, instrument};
+
+/// This struct defines the watcher used in the benchmarks. A watcher is only valid for 1 workload
+/// and MUST NOT be re-used between workloads since it holds important internal state for a given
+/// workload and is not designed for reuse. Running the watcher consumes it, and it's driven through
+/// the events sent on the channel whose sender is handed out when the watcher is created.
+pub struct Watcher {
+    /// The identifier of the platform that this watcher is for.
+    platform_identifier: PlatformIdentifier,
+
+    /// The receive side of the channel that all of the drivers and various other parts of the code
+    /// send events to the watcher on.
+    rx: UnboundedReceiver<WatcherEvent>,
+
+    /// This is a stream of the blocks that were mined by the node. This is for a single platform
+    /// and a single node from that platform.
+    blocks_stream: Pin<Box<dyn Stream<Item = MinedBlockInformation>>>,
+}
+
+impl Watcher {
+    /// Creates a new watcher for the platform with the provided identifier that observes the
+    /// provided stream of mined blocks. The returned sender is the send side of the channel that
+    /// the watcher receives its [`WatcherEvent`]s on.
+    pub fn new(
+        platform_identifier: PlatformIdentifier,
+        blocks_stream: Pin<Box<dyn Stream<Item = MinedBlockInformation>>>,
+    ) -> (Self, UnboundedSender<WatcherEvent>) {
+        let (tx, rx) = unbounded_channel::<WatcherEvent>();
+        (
+            Self {
+                platform_identifier,
+                rx,
+                blocks_stream,
+            },
+            tx,
+        )
+    }
+
+    /// Runs the watcher to completion and then writes a CSV summary of the blocks that it has
+    /// observed to stderr.
+    ///
+    /// All of the events received before the first [`WatcherEvent::RepetitionStartEvent`] are
+    /// discarded. After that, the watcher collects the mined blocks until it has been told that
+    /// all of the transactions were submitted and has seen every submitted transaction in a block,
+    /// or until the stream of blocks ends. If [`WatcherEvent::AllTransactionsSubmitted`] is
+    /// received before any repetition has started then there's nothing to measure and the watcher
+    /// returns without writing a summary.
+    ///
+    /// # Errors
+    ///
+    /// Returns an error if the events channel is closed before any repetition has started, or if
+    /// writing the summary to stderr fails.
+    #[instrument(level = "info", skip_all)]
+    pub async fn run(mut self) -> Result<()> {
+        // The first event that the watcher acts on must be a `RepetitionStartEvent` that informs
+        // the watcher of the last block number that it should ignore and what the block number is
+        // for the first important block that it should look for.
+        let ignore_block_before = loop {
+            match self.rx.recv().await {
+                Some(WatcherEvent::RepetitionStartEvent {
+                    ignore_block_before,
+                }) => break ignore_block_before,
+                // Transactions submitted before the first repetition (e.g., contract deployments)
+                // are not part of the measurement and are therefore not tracked.
+                Some(WatcherEvent::SubmittedTransaction { .. }) => continue,
+                // No repetition was ever started. Waiting for one would block forever since no
+                // further events are going to be sent.
+                Some(WatcherEvent::AllTransactionsSubmitted) => {
+                    info!("All transactions were submitted before any repetition started");
+                    return Ok(());
+                }
+                // A closed channel keeps on returning `None` immediately, so looping on it would
+                // spin forever without making any progress.
+                None => {
+                    anyhow::bail!(
+                        "The watcher's events channel was closed before any repetition started"
+                    )
+                }
+            }
+        };
+
+        // This is the set of the transaction hashes that the watcher should be looking for and
+        // watch for them in the blocks. The watcher will keep watching for blocks until it sees
+        // that all of the transactions that it was watching for has been seen in the mined blocks.
+        let watch_for_transaction_hashes = Arc::new(RwLock::new(HashSet::<TxHash>::new()));
+
+        // A boolean that keeps track of whether all of the transactions were submitted or if more
+        // txs are expected to come through the receive side of the channel. We do not want to rely
+        // on the channel closing alone for the watcher to know that all of the transactions were
+        // submitted and for there to be an explicit event sent by the core orchestrator that
+        // informs the watcher that no further transactions are to be expected and that it can
+        // safely ignore the channel.
+        let all_transactions_submitted = Arc::new(RwLock::new(false));
+
+        let watcher_event_watching_task = {
+            let watch_for_transaction_hashes = watch_for_transaction_hashes.clone();
+            let all_transactions_submitted = all_transactions_submitted.clone();
+            async move {
+                while let Some(watcher_event) = self.rx.recv().await {
+                    match watcher_event {
+                        // Subsequent repetition starts are ignored since certain workloads can
+                        // contain nested repetitions and therefore there's no use in doing any
+                        // action if the repetitions are nested.
+                        WatcherEvent::RepetitionStartEvent { .. } => {}
+                        WatcherEvent::SubmittedTransaction { transaction_hash } => {
+                            watch_for_transaction_hashes
+                                .write()
+                                .await
+                                .insert(transaction_hash);
+                        }
+                        WatcherEvent::AllTransactionsSubmitted => {
+                            *all_transactions_submitted.write().await = true;
+                            self.rx.close();
+                            info!("Watcher's Events Watching Task Finished");
+                            break;
+                        }
+                    }
+                }
+            }
+        };
+        let block_information_watching_task = {
+            let watch_for_transaction_hashes = watch_for_transaction_hashes.clone();
+            let all_transactions_submitted = all_transactions_submitted.clone();
+            let mut blocks_information_stream = self.blocks_stream;
+            async move {
+                let mut mined_blocks_information = Vec::new();
+
+                while let Some(block) = blocks_information_stream.next().await {
+                    // If the block number is equal to or less than the last block before the
+                    // repetition then we ignore it and continue on to the next block.
+                    if block.block_number <= ignore_block_before {
+                        continue;
+                    }
+
+                    if *all_transactions_submitted.read().await
+                        && watch_for_transaction_hashes.read().await.is_empty()
+                    {
+                        break;
+                    }
+
+                    info!(
+                        remaining_transactions = watch_for_transaction_hashes.read().await.len(),
+                        block_tx_count = block.transaction_hashes.len(),
+                        "Observed a block"
+                    );
+
+                    // Remove all of the transaction hashes observed in this block from the txs we
+                    // are currently watching for.
+                    let mut pending_transaction_hashes =
+                        watch_for_transaction_hashes.write().await;
+                    for tx_hash in block.transaction_hashes.iter() {
+                        pending_transaction_hashes.remove(tx_hash);
+                    }
+                    let all_transactions_observed = pending_transaction_hashes.is_empty();
+                    drop(pending_transaction_hashes);
+
+                    mined_blocks_information.push(block);
+
+                    // If this block contained the last transactions that we were waiting for and
+                    // no further transactions are expected then we're done. Without this check the
+                    // watcher would have to wait for yet another block to be mined just to
+                    // notice that there's nothing left to watch for.
+                    if all_transactions_observed && *all_transactions_submitted.read().await {
+                        break;
+                    }
+                }
+
+                info!("Watcher's Block Watching Task Finished");
+                mined_blocks_information
+            }
+        };
+
+        let (_, mined_blocks_information) =
+            futures::future::join(watcher_event_watching_task, block_information_watching_task)
+                .await;
+
+        // region:TEMPORARY
+        {
+            // TODO: The following code is TEMPORARY and will be removed once we have proper
+            // reporting in place. This serves as a way of doing some very simple reporting for
+            // the time being.
+            use std::io::Write;
+
+            let mut stderr = std::io::stderr().lock();
+            writeln!(
+                stderr,
+                "Watcher information for {}",
+                self.platform_identifier
+            )?;
+            writeln!(
+                stderr,
+                "block_number,block_timestamp,mined_gas,block_gas_limit,tx_count"
+            )?;
+            for block in mined_blocks_information {
+                writeln!(
+                    stderr,
+                    "{},{},{},{},{}",
+                    block.block_number,
+                    block.block_timestamp,
+                    block.mined_gas,
+                    block.block_gas_limit,
+                    block.transaction_hashes.len()
+                )?
+            }
+        }
+        // endregion:TEMPORARY
+
+        Ok(())
+    }
+}
+
+#[derive(Clone, Copy, Debug, PartialEq, Eq, PartialOrd, Ord, Hash)]
+pub enum WatcherEvent {
+    /// Informs the watcher that it should begin watching for the blocks mined by the platforms.
+    /// Before the watcher receives this event it will not be watching for the mined blocks. The
+    /// reason behind this is that we do not want the initialization transactions (e.g., contract
+    /// deployments) to be included in the overall TPS and GPS measurements since these blocks will
+    /// most likely only contain a single transaction since they're just being used for
+    /// initialization.
+    RepetitionStartEvent {
+        /// This is the block number of the last block seen before the repetition started. This is
+        /// used to instruct the watcher to ignore this block and all of the blocks before it when
+        /// it starts streaming the blocks.
+        ignore_block_before: BlockNumber,
+    },
+
+    /// Informs the watcher that a transaction was submitted and that the watcher should watch for a
+    /// transaction with this hash in the blocks that it watches.
+    SubmittedTransaction {
+        /// The hash of the submitted transaction.
+        transaction_hash: TxHash,
+    },
+
+    /// Informs the watcher that all of the transactions of this benchmark have been submitted and
+    /// that it can expect to receive no further transaction hashes and does not even need to watch
+    /// the channel any longer.
+    AllTransactionsSubmitted,
+}
@@ -0,0 +1,240 @@
+//! The main entry point into differential testing.
+
+use std::{
+    collections::BTreeMap,
+    io::{BufWriter, Write, stderr},
+    sync::Arc,
+    time::Instant,
+};
+
+use anyhow::Context as _;
+use futures::{FutureExt, StreamExt};
+use revive_dt_common::types::PrivateKeyAllocator;
+use revive_dt_core::Platform;
+use tokio::sync::Mutex;
+use tracing::{Instrument, error, info, info_span, instrument};
+
+use revive_dt_config::{Context, TestExecutionContext};
+use revive_dt_report::{Reporter, ReporterEvent, TestCaseStatus};
+
+use crate::{
+    differential_tests::Driver,
+    helpers::{CachedCompiler, NodePool, collect_metadata_files, create_test_definitions_stream},
+};
+
+/// Runs the differential tests described by the context: discovers the metadata files, starts the
+/// nodes of every platform, and then executes all of the test cases while the results are printed
+/// to the CLI. A failing test case is reported through its reporter and does not stop the others.
+#[instrument(level = "info", err(Debug), skip_all)]
+pub async fn handle_differential_tests(
+    context: TestExecutionContext,
+    reporter: Reporter,
+) -> anyhow::Result<()> {
+    let reporter_clone = reporter.clone();
+
+    // Find every metadata file that the context points at.
+    let metadata_files = collect_metadata_files(&context)
+        .context("Failed to collect metadata files for differential testing")?;
+    info!(len = metadata_files.len(), "Discovered metadata files");
+
+    // Resolve the platforms that the tests are going to be executed on.
+    let platforms = context
+        .platforms
+        .iter()
+        .copied()
+        .map(Into::<&dyn Platform>::into)
+        .collect::<Vec<_>>();
+
+    // Start a node pool for each one of the platforms, keyed by the platform's identifier.
+    let mut platforms_and_nodes = BTreeMap::new();
+    for &platform in &platforms {
+        let platform_identifier = platform.platform_identifier();
+
+        let node_pool_context = Context::Test(Box::new(context.clone()));
+        let node_pool = NodePool::new(node_pool_context, platform)
+            .await
+            .inspect_err(|err| {
+                error!(
+                    ?err,
+                    %platform_identifier,
+                    "Failed to initialize the node pool for the platform."
+                )
+            })
+            .context("Failed to initialize the node pool")?;
+
+        platforms_and_nodes.insert(platform_identifier, (platform, node_pool));
+    }
+    info!("Spawned the platform nodes");
+
+    // Turn the metadata files into the concrete test definitions to execute.
+    let full_context = Context::Test(Box::new(context.clone()));
+    let test_definitions = create_test_definitions_stream(
+        &full_context,
+        metadata_files.iter(),
+        &platforms_and_nodes,
+        reporter.clone(),
+    )
+    .await
+    .collect::<Vec<_>>()
+    .await;
+    info!(len = test_definitions.len(), "Created test definitions");
+
+    // The objects shared between all of the drivers: the compiler cache and the key allocator.
+    let compilation_cache_path = context
+        .working_directory
+        .as_path()
+        .join("compilation_cache");
+    let invalidate_compilation_cache = context
+        .compilation_configuration
+        .invalidate_compilation_cache;
+    let cached_compiler = CachedCompiler::new(compilation_cache_path, invalidate_compilation_cache)
+        .await
+        .map(Arc::new)
+        .context("Failed to initialize cached compiler")?;
+    let private_key_allocator = Arc::new(Mutex::new(PrivateKeyAllocator::new(
+        context.wallet_configuration.highest_private_key_exclusive(),
+    )));
+
+    // One future per test definition; each creates its driver and executes all of its steps.
+    let test_case_futures = test_definitions.iter().map(|test_definition| {
+        let private_key_allocator = private_key_allocator.clone();
+        let cached_compiler = cached_compiler.clone();
+        let span = info_span!(
+            "Executing Test Case",
+            metadata_file_path = %test_definition.metadata_file_path.display(),
+            case_idx = %test_definition.case_idx,
+            mode = %test_definition.mode
+        );
+        async move {
+            // Shared by the two failure paths below: report the failure and log it.
+            let report_failure = |reason: String| {
+                test_definition
+                    .reporter
+                    .report_test_failed_event(reason)
+                    .expect("Can't fail");
+                error!("Test Case Failed");
+            };
+
+            let driver_creation_result =
+                Driver::new_root(test_definition, private_key_allocator, &cached_compiler).await;
+            let driver = match driver_creation_result {
+                Ok(driver) => driver,
+                Err(error) => return report_failure(format!("{error:#}")),
+            };
+            info!("Created the driver for the test case");
+
+            match driver.execute_all().await {
+                Ok(steps_executed) => test_definition
+                    .reporter
+                    .report_test_succeeded_event(steps_executed)
+                    .expect("Can't fail"),
+                Err(error) => report_failure(format!("{error:#}")),
+            };
+            info!("Finished the execution of the test case")
+        }
+        .instrument(span)
+    });
+    let driver_task = futures::future::join_all(test_case_futures).inspect(|_| {
+        info!("Finished executing all test cases");
+        reporter_clone
+            .report_completion_event()
+            .expect("Can't fail")
+    });
+    let cli_reporting_task = start_cli_reporting_task(reporter);
+
+    futures::future::join(driver_task, cli_reporting_task).await;
+
+    Ok(())
+}
+
+/// Prints the outcome of the test cases to stderr as the reporter announces them, followed by a
+/// summary line once the events subscription stops yielding events.
+///
+/// Only the `MetadataFileSolcModeCombinationExecutionCompleted` events are printed; every other
+/// event is skipped. The summary counts the succeeded and the failed cases; ignored cases are
+/// printed but are not part of the counts. Write errors are deliberately ignored since the CLI
+/// output is best-effort.
+// NOTE(review): `irrefutable_let_patterns` is presumably allowed in case `ReporterEvent` ends up
+// with a single variant, which would make the `let ... else` below irrefutable - confirm.
+#[allow(irrefutable_let_patterns, clippy::uninlined_format_args)]
+async fn start_cli_reporting_task(reporter: Reporter) {
+    let mut aggregator_events_rx = reporter.subscribe().await.expect("Can't fail");
+    drop(reporter);
+
+    let start = Instant::now();
+
+    const GREEN: &str = "\x1B[32m";
+    const RED: &str = "\x1B[31m";
+    const GREY: &str = "\x1B[90m";
+    const COLOR_RESET: &str = "\x1B[0m";
+    const BOLD: &str = "\x1B[1m";
+    const BOLD_RESET: &str = "\x1B[22m";
+
+    let mut number_of_successes = 0;
+    let mut number_of_failures = 0;
+
+    let mut buf = BufWriter::new(stderr());
+    while let Ok(event) = aggregator_events_rx.recv().await {
+        let ReporterEvent::MetadataFileSolcModeCombinationExecutionCompleted {
+            metadata_file_path,
+            mode,
+            case_status,
+        } = event
+        else {
+            continue;
+        };
+
+        let _ = writeln!(buf, "{} - {}", mode, metadata_file_path.display());
+        for (case_idx, case_status) in case_status.into_iter() {
+            let _ = write!(buf, "\tCase Index {case_idx:>3}: ");
+            let _ = match case_status {
+                TestCaseStatus::Succeeded { steps_executed } => {
+                    number_of_successes += 1;
+                    writeln!(
+                        buf,
+                        "{}{}Case Succeeded{} - Steps Executed: {}{}",
+                        GREEN, BOLD, BOLD_RESET, steps_executed, COLOR_RESET
+                    )
+                }
+                TestCaseStatus::Failed { reason } => {
+                    number_of_failures += 1;
+                    writeln!(
+                        buf,
+                        "{}{}Case Failed{} - Reason: {}{}",
+                        RED,
+                        BOLD,
+                        BOLD_RESET,
+                        reason.trim(),
+                        COLOR_RESET,
+                    )
+                }
+                TestCaseStatus::Ignored { reason, .. } => writeln!(
+                    buf,
+                    "{}{}Case Ignored{} - Reason: {}{}",
+                    GREY,
+                    BOLD,
+                    BOLD_RESET,
+                    reason.trim(),
+                    COLOR_RESET,
+                ),
+            };
+        }
+        let _ = writeln!(buf);
+
+        // Flush after every event so that the results show up while the tests are still running
+        // rather than only once the buffer fills up or the writer is dropped.
+        let _ = buf.flush();
+    }
+
+    // Summary at the end.
+    let _ = writeln!(
+        buf,
+        "{} cases: {}{}{} cases succeeded, {}{}{} cases failed in {} seconds",
+        number_of_successes + number_of_failures,
+        GREEN,
+        number_of_successes,
+        COLOR_RESET,
+        RED,
+        number_of_failures,
+        COLOR_RESET,
+        start.elapsed().as_secs()
+    );
+    let _ = buf.flush();
+}
@@ -0,0 +1,35 @@
+use std::{collections::HashMap, path::PathBuf};
+
+use alloy::{
+    json_abi::JsonAbi,
+    primitives::{Address, U256},
+};
+
+use revive_dt_format::metadata::{ContractIdent, ContractInstance};
+
+#[derive(Clone)]
+/// The state associated with the test execution of one of the tests.
+pub struct ExecutionState {
+    /// The compiled contracts, these contracts have been compiled and have had the libraries linked
+    /// against them and therefore they're ready to be deployed on-demand. The outer map is keyed by
+    /// a path. NOTE(review): the inner `String` key and the `(String, JsonAbi)` value are
+    /// presumably the contract name and its (code, ABI) pair - confirm against the compiler output.
+    pub compiled_contracts: HashMap<PathBuf, HashMap<String, (String, JsonAbi)>>,
+
+    /// A map of all of the deployed contracts, keyed by contract instance, and the identifier,
+    /// address, and ABI stored for each one of them.
+    pub deployed_contracts: HashMap<ContractInstance, (ContractIdent, Address, JsonAbi)>,
+
+    /// This map stores the variables used for each one of the cases contained in the metadata file.
+    /// The key is a string (presumably the name of the variable) and the value is a `U256`.
+    pub variables: HashMap<String, U256>,
+}
+
+impl ExecutionState {
+    /// Creates an execution state that holds the provided compiled and deployed contracts and that
+    /// starts out with no variables.
+    pub fn new(
+        compiled_contracts: HashMap<PathBuf, HashMap<String, (String, JsonAbi)>>,
+        deployed_contracts: HashMap<ContractInstance, (ContractIdent, Address, JsonAbi)>,
+    ) -> Self {
+        let variables = HashMap::new();
+        Self {
+            compiled_contracts,
+            deployed_contracts,
+            variables,
+        }
+    }
+}
@@ -0,0 +1,11 @@
+//! This module contains all of the code responsible for performing differential tests including the
+//! driver implementation, state implementation, and the core logic that allows for tests to be
+//! executed.
+
+mod driver;
+mod entry_point;
+mod execution_state;
+
+pub use driver::*;
+pub use entry_point::*;
+pub use execution_state::*;
@@ -1,900 +0,0 @@
-//! The test driver handles the compilation and execution of the test cases.
-
-use std::collections::HashMap;
-use std::path::PathBuf;
-use std::sync::Arc;
-
-use alloy::consensus::EMPTY_ROOT_HASH;
-use alloy::hex;
-use alloy::json_abi::JsonAbi;
-use alloy::network::{Ethereum, TransactionBuilder};
-use alloy::primitives::{TxHash, U256};
-use alloy::rpc::types::TransactionReceipt;
-use alloy::rpc::types::trace::geth::{
-    CallFrame, GethDebugBuiltInTracerType, GethDebugTracerConfig, GethDebugTracerType,
-    GethDebugTracingOptions, GethTrace, PreStateConfig,
-};
-use alloy::{
-    primitives::Address,
-    rpc::types::{TransactionRequest, trace::geth::DiffMode},
-};
-use anyhow::{Context as _, bail};
-use futures::{TryStreamExt, future::try_join_all};
-use indexmap::IndexMap;
-use revive_dt_common::types::{PlatformIdentifier, PrivateKeyAllocator};
-use revive_dt_format::traits::{ResolutionContext, ResolverApi};
-use revive_dt_report::ExecutionSpecificReporter;
-use semver::Version;
-
-use revive_dt_format::case::Case;
-use revive_dt_format::metadata::{ContractIdent, ContractInstance, ContractPathAndIdent};
-use revive_dt_format::steps::{
-    BalanceAssertionStep, Calldata, EtherValue, Expected, ExpectedOutput, FunctionCallStep, Method,
-    StepIdx, StepPath, StorageEmptyAssertionStep,
-};
-use revive_dt_format::{metadata::Metadata, steps::Step};
-use revive_dt_node_interaction::EthereumNode;
-use tokio::sync::Mutex;
-use tokio::try_join;
-use tracing::{Instrument, info, info_span, instrument};
-
-#[derive(Clone)]
-pub struct CaseState {
-    /// A map of all of the compiled contracts for the given metadata file.
-    compiled_contracts: HashMap<PathBuf, HashMap<String, (String, JsonAbi)>>,
-
-    /// This map stores the contracts deployments for this case.
-    deployed_contracts: HashMap<ContractInstance, (ContractIdent, Address, JsonAbi)>,
-
-    /// This map stores the variables used for each one of the cases contained in the metadata
-    /// file.
-    variables: HashMap<String, U256>,
-
-    /// Stores the version used for the current case.
-    compiler_version: Version,
-
-    /// The execution reporter.
-    execution_reporter: ExecutionSpecificReporter,
-
-    /// The private key allocator used for this case state. This is an Arc Mutex to allow for the
-    /// state to be cloned and for all of the clones to refer to the same allocator.
-    private_key_allocator: Arc<Mutex<PrivateKeyAllocator>>,
-}
-
-impl CaseState {
-    pub fn new(
-        compiler_version: Version,
-        compiled_contracts: HashMap<PathBuf, HashMap<String, (String, JsonAbi)>>,
-        deployed_contracts: HashMap<ContractInstance, (ContractIdent, Address, JsonAbi)>,
-        execution_reporter: ExecutionSpecificReporter,
-        private_key_allocator: Arc<Mutex<PrivateKeyAllocator>>,
-    ) -> Self {
-        Self {
-            compiled_contracts,
-            deployed_contracts,
-            variables: Default::default(),
-            compiler_version,
-            execution_reporter,
-            private_key_allocator,
-        }
-    }
-
-    pub async fn handle_step(
-        &mut self,
-        metadata: &Metadata,
-        step: &Step,
-        step_path: &StepPath,
-        node: &dyn EthereumNode,
-    ) -> anyhow::Result<StepOutput> {
-        match step {
-            Step::FunctionCall(input) => {
-                let (receipt, geth_trace, diff_mode) = self
-                    .handle_input(metadata, input, node)
-                    .await
-                    .context("Failed to handle function call step")?;
-                Ok(StepOutput::FunctionCall(receipt, geth_trace, diff_mode))
-            }
-            Step::BalanceAssertion(balance_assertion) => {
-                self.handle_balance_assertion(metadata, balance_assertion, node)
-                    .await
-                    .context("Failed to handle balance assertion step")?;
-                Ok(StepOutput::BalanceAssertion)
-            }
-            Step::StorageEmptyAssertion(storage_empty) => {
-                self.handle_storage_empty(metadata, storage_empty, node)
-                    .await
-                    .context("Failed to handle storage empty assertion step")?;
-                Ok(StepOutput::StorageEmptyAssertion)
-            }
-            Step::Repeat(repetition_step) => {
-                self.handle_repeat(
-                    metadata,
-                    repetition_step.repeat,
-                    &repetition_step.steps,
-                    step_path,
-                    node,
-                )
-                .await
-                .context("Failed to handle the repetition step")?;
-                Ok(StepOutput::Repetition)
-            }
-            Step::AllocateAccount(account_allocation) => {
-                self.handle_account_allocation(account_allocation.variable_name.as_str())
-                    .await
-                    .context("Failed to allocate account")?;
-                Ok(StepOutput::AccountAllocation)
-            }
-        }
-        .inspect(|_| info!("Step Succeeded"))
-    }
-
-    #[instrument(level = "info", name = "Handling Input", skip_all)]
-    pub async fn handle_input(
-        &mut self,
-        metadata: &Metadata,
-        input: &FunctionCallStep,
-        node: &dyn EthereumNode,
-    ) -> anyhow::Result<(TransactionReceipt, GethTrace, DiffMode)> {
-        let resolver = node.resolver().await?;
-
-        let deployment_receipts = self
-            .handle_input_contract_deployment(metadata, input, node)
-            .await
-            .context("Failed during contract deployment phase of input handling")?;
-        let execution_receipt = self
-            .handle_input_execution(input, deployment_receipts, node)
-            .await
-            .context("Failed during transaction execution phase of input handling")?;
-        let tracing_result = self
-            .handle_input_call_frame_tracing(execution_receipt.transaction_hash, node)
-            .await
-            .context("Failed during callframe tracing phase of input handling")?;
-        self.handle_input_variable_assignment(input, &tracing_result)
-            .context("Failed to assign variables from callframe output")?;
-        let (_, (geth_trace, diff_mode)) = try_join!(
-            self.handle_input_expectations(
-                input,
-                &execution_receipt,
-                resolver.as_ref(),
-                &tracing_result
-            ),
-            self.handle_input_diff(execution_receipt.transaction_hash, node)
-        )
-        .context("Failed while evaluating expectations and diffs in parallel")?;
-        Ok((execution_receipt, geth_trace, diff_mode))
-    }
-
-    #[instrument(level = "info", name = "Handling Balance Assertion", skip_all)]
-    pub async fn handle_balance_assertion(
-        &mut self,
-        metadata: &Metadata,
-        balance_assertion: &BalanceAssertionStep,
-        node: &dyn EthereumNode,
-    ) -> anyhow::Result<()> {
-        self.handle_balance_assertion_contract_deployment(metadata, balance_assertion, node)
-            .await
-            .context("Failed to deploy contract for balance assertion")?;
-        self.handle_balance_assertion_execution(balance_assertion, node)
-            .await
-            .context("Failed to execute balance assertion")?;
-        Ok(())
-    }
-
-    #[instrument(level = "info", name = "Handling Storage Assertion", skip_all)]
-    pub async fn handle_storage_empty(
-        &mut self,
-        metadata: &Metadata,
-        storage_empty: &StorageEmptyAssertionStep,
-        node: &dyn EthereumNode,
-    ) -> anyhow::Result<()> {
-        self.handle_storage_empty_assertion_contract_deployment(metadata, storage_empty, node)
-            .await
-            .context("Failed to deploy contract for storage empty assertion")?;
-        self.handle_storage_empty_assertion_execution(storage_empty, node)
-            .await
-            .context("Failed to execute storage empty assertion")?;
-        Ok(())
-    }
-
-    #[instrument(level = "info", name = "Handling Repetition", skip_all)]
-    pub async fn handle_repeat(
-        &mut self,
-        metadata: &Metadata,
-        repetitions: usize,
-        steps: &[Step],
-        step_path: &StepPath,
-        node: &dyn EthereumNode,
-    ) -> anyhow::Result<()> {
-        let tasks = (0..repetitions).map(|_| {
-            let mut state = self.clone();
-            async move {
-                for (step_idx, step) in steps.iter().enumerate() {
-                    let step_path = step_path.append(step_idx);
-                    state.handle_step(metadata, step, &step_path, node).await?;
-                }
-                Ok::<(), anyhow::Error>(())
-            }
-        });
-        try_join_all(tasks).await?;
-        Ok(())
-    }
-
-    #[instrument(level = "info", name = "Handling Account Allocation", skip_all)]
-    pub async fn handle_account_allocation(&mut self, variable_name: &str) -> anyhow::Result<()> {
-        let Some(variable_name) = variable_name.strip_prefix("$VARIABLE:") else {
-            bail!("Account allocation must start with $VARIABLE:");
-        };
-
-        let private_key = self.private_key_allocator.lock().await.allocate()?;
-        let account = private_key.address();
-        let variable = U256::from_be_slice(account.0.as_slice());
-
-        self.variables.insert(variable_name.to_string(), variable);
-
-        Ok(())
-    }
-
-    /// Handles the contract deployment for a given input performing it if it needs to be performed.
-    #[instrument(level = "info", skip_all)]
-    async fn handle_input_contract_deployment(
-        &mut self,
-        metadata: &Metadata,
-        input: &FunctionCallStep,
-        node: &dyn EthereumNode,
-    ) -> anyhow::Result<HashMap<ContractInstance, TransactionReceipt>> {
-        let mut instances_we_must_deploy = IndexMap::<ContractInstance, bool>::new();
-        for instance in input.find_all_contract_instances().into_iter() {
-            if !self.deployed_contracts.contains_key(&instance) {
-                instances_we_must_deploy.entry(instance).or_insert(false);
-            }
-        }
-        if let Method::Deployer = input.method {
-            instances_we_must_deploy.swap_remove(&input.instance);
-            instances_we_must_deploy.insert(input.instance.clone(), true);
-        }
-
-        let mut receipts = HashMap::new();
-        for (instance, deploy_with_constructor_arguments) in instances_we_must_deploy.into_iter() {
-            let calldata = deploy_with_constructor_arguments.then_some(&input.calldata);
-            let value = deploy_with_constructor_arguments
-                .then_some(input.value)
-                .flatten();
-
-            let caller = {
-                let context = self.default_resolution_context();
-                let resolver = node.resolver().await?;
-                input
-                    .caller
-                    .resolve_address(resolver.as_ref(), context)
-                    .await?
-            };
-            if let (_, _, Some(receipt)) = self
-                .get_or_deploy_contract_instance(&instance, metadata, caller, calldata, value, node)
-                .await
-                .context("Failed to get or deploy contract instance during input execution")?
-            {
-                receipts.insert(instance.clone(), receipt);
-            }
-        }
-
-        Ok(receipts)
-    }
-
-    /// Handles the execution of the input in terms of the calls that need to be made.
-    #[instrument(level = "info", skip_all)]
-    async fn handle_input_execution(
-        &mut self,
-        input: &FunctionCallStep,
-        mut deployment_receipts: HashMap<ContractInstance, TransactionReceipt>,
-        node: &dyn EthereumNode,
-    ) -> anyhow::Result<TransactionReceipt> {
-        match input.method {
-            // This input was already executed when `handle_input` was called. We just need to
-            // lookup the transaction receipt in this case and continue on.
-            Method::Deployer => deployment_receipts
-                .remove(&input.instance)
-                .context("Failed to find deployment receipt for constructor call"),
-            Method::Fallback | Method::FunctionName(_) => {
-                let resolver = node.resolver().await?;
-                let tx = match input
-                    .legacy_transaction(resolver.as_ref(), self.default_resolution_context())
-                    .await
-                {
-                    Ok(tx) => tx,
-                    Err(err) => {
-                        return Err(err);
-                    }
-                };
-
-                match node.execute_transaction(tx).await {
-                    Ok(receipt) => Ok(receipt),
-                    Err(err) => Err(err),
-                }
-            }
-        }
-    }
-
-    #[instrument(level = "info", skip_all)]
-    async fn handle_input_call_frame_tracing(
-        &self,
-        tx_hash: TxHash,
-        node: &dyn EthereumNode,
-    ) -> anyhow::Result<CallFrame> {
-        node.trace_transaction(
-            tx_hash,
-            GethDebugTracingOptions {
-                tracer: Some(GethDebugTracerType::BuiltInTracer(
-                    GethDebugBuiltInTracerType::CallTracer,
-                )),
-                tracer_config: GethDebugTracerConfig(serde_json::json! {{
-                    "onlyTopCall": true,
-                    "withLog": false,
-                    "withStorage": false,
-                    "withMemory": false,
-                    "withStack": false,
-                    "withReturnData": true
-                }}),
-                ..Default::default()
-            },
-        )
-        .await
-        .map(|trace| {
-            trace
-                .try_into_call_frame()
-                .expect("Impossible - we requested a callframe trace so we must get it back")
-        })
-    }
-
-    #[instrument(level = "info", skip_all)]
-    fn handle_input_variable_assignment(
-        &mut self,
-        input: &FunctionCallStep,
-        tracing_result: &CallFrame,
-    ) -> anyhow::Result<()> {
-        let Some(ref assignments) = input.variable_assignments else {
-            return Ok(());
-        };
-
-        // Handling the return data variable assignments.
-        for (variable_name, output_word) in assignments.return_data.iter().zip(
-            tracing_result
-                .output
-                .as_ref()
-                .unwrap_or_default()
-                .to_vec()
-                .chunks(32),
-        ) {
-            let value = U256::from_be_slice(output_word);
-            self.variables.insert(variable_name.clone(), value);
-            tracing::info!(
-                variable_name,
-                variable_value = hex::encode(value.to_be_bytes::<32>()),
-                "Assigned variable"
-            );
-        }
-
-        Ok(())
-    }
-
-    #[instrument(level = "info", skip_all)]
-    async fn handle_input_expectations(
-        &self,
-        input: &FunctionCallStep,
-        execution_receipt: &TransactionReceipt,
-        resolver: &(impl ResolverApi + ?Sized),
-        tracing_result: &CallFrame,
-    ) -> anyhow::Result<()> {
-        // Resolving the `input.expected` into a series of expectations that we can then assert on.
-        let mut expectations = match input {
-            FunctionCallStep {
-                expected: Some(Expected::Calldata(calldata)),
-                ..
-            } => vec![ExpectedOutput::new().with_calldata(calldata.clone())],
-            FunctionCallStep {
-                expected: Some(Expected::Expected(expected)),
-                ..
-            } => vec![expected.clone()],
-            FunctionCallStep {
-                expected: Some(Expected::ExpectedMany(expected)),
-                ..
-            } => expected.clone(),
-            FunctionCallStep { expected: None, .. } => vec![ExpectedOutput::new().with_success()],
-        };
-
-        // This is a bit of a special case and we have to support it separately on it's own. If it's
-        // a call to the deployer method, then the tests will assert that it "returns" the address
-        // of the contract. Deployments do not return the address of the contract but the runtime
-        // code of the contracts. Therefore, this assertion would always fail. So, we replace it
-        // with an assertion of "check if it succeeded"
-        if let Method::Deployer = &input.method {
-            for expectation in expectations.iter_mut() {
-                expectation.return_data = None;
-            }
-        }
-
-        futures::stream::iter(expectations.into_iter().map(Ok))
-            .try_for_each_concurrent(None, |expectation| async move {
-                self.handle_input_expectation_item(
-                    execution_receipt,
-                    resolver,
-                    expectation,
-                    tracing_result,
-                )
-                .await
-            })
-            .await
-    }
-
-    #[instrument(level = "info", skip_all)]
-    async fn handle_input_expectation_item(
-        &self,
-        execution_receipt: &TransactionReceipt,
-        resolver: &(impl ResolverApi + ?Sized),
-        expectation: ExpectedOutput,
-        tracing_result: &CallFrame,
-    ) -> anyhow::Result<()> {
-        if let Some(ref version_requirement) = expectation.compiler_version {
-            if !version_requirement.matches(&self.compiler_version) {
-                return Ok(());
-            }
-        }
-
-        let resolution_context = self
-            .default_resolution_context()
-            .with_block_number(execution_receipt.block_number.as_ref())
-            .with_transaction_hash(&execution_receipt.transaction_hash);
-
-        // Handling the receipt state assertion.
-        let expected = !expectation.exception;
-        let actual = execution_receipt.status();
-        if actual != expected {
-            tracing::error!(
-                expected,
-                actual,
-                ?execution_receipt,
-                ?tracing_result,
-                "Transaction status assertion failed"
-            );
-            anyhow::bail!(
-                "Transaction status assertion failed - Expected {expected} but got {actual}",
-            );
-        }
-
-        // Handling the calldata assertion
-        if let Some(ref expected_calldata) = expectation.return_data {
-            let expected = expected_calldata;
-            let actual = &tracing_result.output.as_ref().unwrap_or_default();
-            if !expected
-                .is_equivalent(actual, resolver, resolution_context)
-                .await
-                .context("Failed to resolve calldata equivalence for return data assertion")?
-            {
-                tracing::error!(
-                    ?execution_receipt,
-                    ?expected,
-                    %actual,
-                    "Calldata assertion failed"
-                );
-                anyhow::bail!("Calldata assertion failed - Expected {expected:?} but got {actual}",);
-            }
-        }
-
-        // Handling the events assertion
-        if let Some(ref expected_events) = expectation.events {
-            // Handling the events length assertion.
-            let expected = expected_events.len();
-            let actual = execution_receipt.logs().len();
-            if actual != expected {
-                tracing::error!(expected, actual, "Event count assertion failed",);
-                anyhow::bail!(
-                    "Event count assertion failed - Expected {expected} but got {actual}",
-                );
-            }
-
-            // Handling the events assertion.
-            for (event_idx, (expected_event, actual_event)) in expected_events
-                .iter()
-                .zip(execution_receipt.logs())
-                .enumerate()
-            {
-                // Handling the emitter assertion.
-                if let Some(ref expected_address) = expected_event.address {
-                    let expected = expected_address
-                        .resolve_address(resolver, resolution_context)
-                        .await?;
-                    let actual = actual_event.address();
-                    if actual != expected {
-                        tracing::error!(
-                            event_idx,
-                            %expected,
-                            %actual,
-                            "Event emitter assertion failed",
-                        );
-                        anyhow::bail!(
-                            "Event emitter assertion failed - Expected {expected} but got {actual}",
-                        );
-                    }
-                }
-
-                // Handling the topics assertion.
-                for (expected, actual) in expected_event
-                    .topics
-                    .as_slice()
-                    .iter()
-                    .zip(actual_event.topics())
-                {
-                    let expected = Calldata::new_compound([expected]);
-                    if !expected
-                        .is_equivalent(&actual.0, resolver, resolution_context)
-                        .await
-                        .context("Failed to resolve event topic equivalence")?
-                    {
-                        tracing::error!(
-                            event_idx,
-                            ?execution_receipt,
-                            ?expected,
-                            ?actual,
-                            "Event topics assertion failed",
-                        );
-                        anyhow::bail!(
-                            "Event topics assertion failed - Expected {expected:?} but got {actual:?}",
-                        );
-                    }
-                }
-
-                // Handling the values assertion.
-                let expected = &expected_event.values;
-                let actual = &actual_event.data().data;
-                if !expected
-                    .is_equivalent(&actual.0, resolver, resolution_context)
-                    .await
-                    .context("Failed to resolve event value equivalence")?
-                {
-                    tracing::error!(
-                        event_idx,
-                        ?execution_receipt,
-                        ?expected,
-                        ?actual,
-                        "Event value assertion failed",
-                    );
-                    anyhow::bail!(
-                        "Event value assertion failed - Expected {expected:?} but got {actual:?}",
-                    );
-                }
-            }
-        }
-
-        Ok(())
-    }
-
-    #[instrument(level = "info", skip_all)]
-    async fn handle_input_diff(
-        &self,
-        tx_hash: TxHash,
-        node: &dyn EthereumNode,
-    ) -> anyhow::Result<(GethTrace, DiffMode)> {
-        let trace_options = GethDebugTracingOptions::prestate_tracer(PreStateConfig {
-            diff_mode: Some(true),
-            disable_code: None,
-            disable_storage: None,
-        });
-
-        let trace = node
-            .trace_transaction(tx_hash, trace_options)
-            .await
-            .context("Failed to obtain geth prestate tracer output")?;
-        let diff = node
-            .state_diff(tx_hash)
-            .await
-            .context("Failed to obtain state diff for transaction")?;
-
-        Ok((trace, diff))
-    }
-
-    #[instrument(level = "info", skip_all)]
-    pub async fn handle_balance_assertion_contract_deployment(
-        &mut self,
-        metadata: &Metadata,
-        balance_assertion: &BalanceAssertionStep,
-        node: &dyn EthereumNode,
-    ) -> anyhow::Result<()> {
-        let Some(address) = balance_assertion.address.as_resolvable_address() else {
-            return Ok(());
-        };
-        let Some(instance) = address.strip_suffix(".address").map(ContractInstance::new) else {
-            return Ok(());
-        };
-
-        self.get_or_deploy_contract_instance(
-            &instance,
-            metadata,
-            FunctionCallStep::default_caller_address(),
-            None,
-            None,
-            node,
-        )
-        .await?;
-        Ok(())
-    }
-
-    #[instrument(level = "info", skip_all)]
-    pub async fn handle_balance_assertion_execution(
-        &mut self,
-        BalanceAssertionStep {
-            address,
-            expected_balance: amount,
-            ..
-        }: &BalanceAssertionStep,
-        node: &dyn EthereumNode,
-    ) -> anyhow::Result<()> {
-        let resolver = node.resolver().await?;
-        let address = address
-            .resolve_address(resolver.as_ref(), self.default_resolution_context())
-            .await?;
-
-        let balance = node.balance_of(address).await?;
-
-        let expected = *amount;
-        let actual = balance;
-        if expected != actual {
-            tracing::error!(%expected, %actual, %address, "Balance assertion failed");
-            anyhow::bail!(
-                "Balance assertion failed - Expected {} but got {} for {} resolved to {}",
-                expected,
-                actual,
-                address,
-                address,
-            )
-        }
-
-        Ok(())
-    }
-
-    #[instrument(level = "info", skip_all)]
-    pub async fn handle_storage_empty_assertion_contract_deployment(
-        &mut self,
-        metadata: &Metadata,
-        storage_empty_assertion: &StorageEmptyAssertionStep,
-        node: &dyn EthereumNode,
-    ) -> anyhow::Result<()> {
-        let Some(address) = storage_empty_assertion.address.as_resolvable_address() else {
-            return Ok(());
-        };
-        let Some(instance) = address.strip_suffix(".address").map(ContractInstance::new) else {
-            return Ok(());
-        };
-
-        self.get_or_deploy_contract_instance(
-            &instance,
-            metadata,
-            FunctionCallStep::default_caller_address(),
-            None,
-            None,
-            node,
-        )
-        .await?;
-        Ok(())
-    }
-
-    #[instrument(level = "info", skip_all)]
-    pub async fn handle_storage_empty_assertion_execution(
-        &mut self,
-        StorageEmptyAssertionStep {
-            address,
-            is_storage_empty,
-            ..
-        }: &StorageEmptyAssertionStep,
-        node: &dyn EthereumNode,
-    ) -> anyhow::Result<()> {
-        let resolver = node.resolver().await?;
-        let address = address
-            .resolve_address(resolver.as_ref(), self.default_resolution_context())
-            .await?;
-
-        let storage = node.latest_state_proof(address, Default::default()).await?;
-        let is_empty = storage.storage_hash == EMPTY_ROOT_HASH;
-
-        let expected = is_storage_empty;
-        let actual = is_empty;
-
-        if *expected != actual {
-            tracing::error!(%expected, %actual, %address, "Storage Empty Assertion failed");
-            anyhow::bail!(
-                "Storage Empty Assertion failed - Expected {} but got {} for {} resolved to {}",
-                expected,
-                actual,
-                address,
-                address,
-            )
-        };
-
-        Ok(())
-    }
-
-    /// Gets the information of a deployed contract or library from the state. If it's found to not
-    /// be deployed then it will be deployed.
-    ///
-    /// If a [`CaseIdx`] is not specified then this contact instance address will be stored in the
-    /// cross-case deployed contracts address mapping.
-    #[allow(clippy::too_many_arguments)]
-    pub async fn get_or_deploy_contract_instance(
-        &mut self,
-        contract_instance: &ContractInstance,
-        metadata: &Metadata,
-        deployer: Address,
-        calldata: Option<&Calldata>,
-        value: Option<EtherValue>,
-        node: &dyn EthereumNode,
-    ) -> anyhow::Result<(Address, JsonAbi, Option<TransactionReceipt>)> {
-        if let Some((_, address, abi)) = self.deployed_contracts.get(contract_instance) {
-            return Ok((*address, abi.clone(), None));
-        }
-
-        let Some(ContractPathAndIdent {
-            contract_source_path,
-            contract_ident,
-        }) = metadata.contract_sources()?.remove(contract_instance)
-        else {
-            anyhow::bail!(
-                "Contract source not found for instance {:?}",
-                contract_instance
-            )
-        };
-
-        let Some((code, abi)) = self
-            .compiled_contracts
-            .get(&contract_source_path)
-            .and_then(|source_file_contracts| source_file_contracts.get(contract_ident.as_ref()))
-            .cloned()
-        else {
-            anyhow::bail!(
-                "Failed to find information for contract {:?}",
-                contract_instance
-            )
-        };
-
-        let mut code = match alloy::hex::decode(&code) {
-            Ok(code) => code,
-            Err(error) => {
-                tracing::error!(
-                    ?error,
-                    contract_source_path = contract_source_path.display().to_string(),
-                    contract_ident = contract_ident.as_ref(),
-                    "Failed to hex-decode byte code - This could possibly mean that the bytecode requires linking"
-                );
-                anyhow::bail!("Failed to hex-decode the byte code {}", error)
-            }
-        };
-
-        if let Some(calldata) = calldata {
-            let resolver = node.resolver().await?;
-            let calldata = calldata
-                .calldata(resolver.as_ref(), self.default_resolution_context())
-                .await?;
-            code.extend(calldata);
-        }
-
-        let tx = {
-            let tx = TransactionRequest::default().from(deployer);
-            let tx = match value {
-                Some(ref value) => tx.value(value.into_inner()),
-                _ => tx,
-            };
-            TransactionBuilder::<Ethereum>::with_deploy_code(tx, code)
-        };
-
-        let receipt = match node.execute_transaction(tx).await {
-            Ok(receipt) => receipt,
-            Err(error) => {
-                tracing::error!(?error, "Contract deployment transaction failed.");
-                return Err(error);
-            }
-        };
-
-        let Some(address) = receipt.contract_address else {
-            anyhow::bail!("Contract deployment didn't return an address");
-        };
-        tracing::info!(
-            instance_name = ?contract_instance,
-            instance_address = ?address,
-            "Deployed contract"
-        );
-        self.execution_reporter
-            .report_contract_deployed_event(contract_instance.clone(), address)?;
-
-        self.deployed_contracts.insert(
-            contract_instance.clone(),
-            (contract_ident, address, abi.clone()),
-        );
-
-        Ok((address, abi, Some(receipt)))
-    }
-
-    fn default_resolution_context(&self) -> ResolutionContext<'_> {
-        ResolutionContext::default()
-            .with_deployed_contracts(&self.deployed_contracts)
-            .with_variables(&self.variables)
-    }
-}
-
-pub struct CaseDriver<'a> {
-    metadata: &'a Metadata,
-    case: &'a Case,
-    platform_state: Vec<(&'a dyn EthereumNode, PlatformIdentifier, CaseState)>,
-}
-
-impl<'a> CaseDriver<'a> {
-    #[allow(clippy::too_many_arguments)]
-    pub fn new(
-        metadata: &'a Metadata,
-        case: &'a Case,
-        platform_state: Vec<(&'a dyn EthereumNode, PlatformIdentifier, CaseState)>,
-    ) -> CaseDriver<'a> {
-        Self {
-            metadata,
-            case,
-            platform_state,
-        }
-    }
-
-    #[instrument(level = "info", name = "Executing Case", skip_all)]
-    pub async fn execute(&mut self) -> anyhow::Result<usize> {
-        let mut steps_executed = 0;
-        for (step_idx, step) in self
-            .case
-            .steps_iterator()
-            .enumerate()
-            .map(|(idx, v)| (StepIdx::new(idx), v))
-        {
-            let metadata = self.metadata;
-            let step_futures =
-                self.platform_state
-                    .iter_mut()
-                    .map(|(node, platform_id, case_state)| {
-                        let platform_id = *platform_id;
-                        let node_ref = *node;
-                        let step = step.clone();
-                        let span = info_span!(
-                            "Handling Step",
-                            %step_idx,
-                            platform = %platform_id,
-                        );
-                        async move {
-                            let step_path = StepPath::from_iterator([step_idx]);
-                            case_state
-                                .handle_step(metadata, &step, &step_path, node_ref)
-                                .await
-                                .map_err(|e| (platform_id, e))
-                        }
-                        .instrument(span)
-                    });
-
-            match try_join_all(step_futures).await {
-                Ok(_outputs) => {
-                    steps_executed += 1;
-                }
-                Err((platform_id, error)) => {
-                    tracing::error!(
-                        %step_idx,
-                        platform = %platform_id,
-                        ?error,
-                        "Step failed on platform",
-                    );
-                    return Err(error);
-                }
-            }
-        }
-
-        Ok(steps_executed)
-    }
-}
-
-#[derive(Clone, Debug)]
-#[allow(clippy::large_enum_variant)]
-pub enum StepOutput {
-    FunctionCall(TransactionReceipt, GethTrace, DiffMode),
-    BalanceAssertion,
-    StorageEmptyAssertion,
-    Repetition,
-    AccountAllocation,
-}
@@ -5,7 +5,7 @@ use std::{
    borrow::Cow,
    collections::HashMap,
    path::{Path, PathBuf},
-    sync::Arc,
+    sync::{Arc, LazyLock},
 };

 use futures::FutureExt;
@@ -19,7 +19,7 @@ use anyhow::{Context as _, Error, Result};
 use revive_dt_report::ExecutionSpecificReporter;
 use semver::Version;
 use serde::{Deserialize, Serialize};
-use tokio::sync::{Mutex, RwLock};
+use tokio::sync::{Mutex, RwLock, Semaphore};
 use tracing::{Instrument, debug, debug_span, instrument};

 pub struct CachedCompiler<'a> {
@@ -165,10 +165,22 @@ impl<'a> CachedCompiler<'a> {
                        cache_value.compiler_output
                    }
                    None => {
-                        compilation_callback()
+                        let compiler_output = compilation_callback()
                            .await
                            .context("Compilation callback failed (cache miss path)")?
-                            .compiler_output
+                            .compiler_output;
+                        self.artifacts_cache
+                            .insert(
+                                &cache_key,
+                                &CacheValue {
+                                    compiler_output: compiler_output.clone(),
+                                },
+                            )
+                            .await
+                            .context(
+                                "Failed to write the cached value of the compilation artifacts",
+                            )?;
+                        compiler_output
                    }
                }
            }
@@ -186,6 +198,12 @@ async fn compile_contracts(
    compiler: &dyn SolidityCompiler,
    reporter: &ExecutionSpecificReporter,
 ) -> Result<CompilerOutput> {
+    // Puts a limit on how many compilations we can perform at any given instant, which helps us
+    // with some of the errors we've been seeing with high concurrency on macOS (we have not tried
+    // it on Linux, so we don't know whether these issues also occur there).
+    static SPAWN_GATE: LazyLock<Semaphore> = LazyLock::new(|| Semaphore::new(100));
+    let _permit = SPAWN_GATE.acquire().await?;
+
    let all_sources_in_dir = FilesWithExtensionIterator::new(metadata_directory.as_ref())
        .with_allowed_extension("sol")
        .with_use_cached_fs(true)
@@ -0,0 +1,33 @@
+use revive_dt_config::CorpusConfiguration;
+use revive_dt_format::{corpus::Corpus, metadata::MetadataFile};
+use tracing::{info, info_span, instrument};
+
+/// Given an object that implements [`AsRef<CorpusConfiguration>`], this function finds all of the
+/// corpus files and returns the [`MetadataFile`]s discovered, sorted and deduplicated by path.
+#[instrument(level = "debug", name = "Collecting Corpora", skip_all)]
+pub fn collect_metadata_files(
+    context: impl AsRef<CorpusConfiguration>,
+) -> anyhow::Result<Vec<MetadataFile>> {
+    let mut metadata_files = Vec::new();
+
+    let corpus_configuration = AsRef::<CorpusConfiguration>::as_ref(&context);
+    for path in &corpus_configuration.paths {
+        let span = info_span!("Processing corpus file", path = %path.display());
+        let _guard = span.enter();
+
+        let corpus = Corpus::try_from_path(path)?;
+        info!(
+            name = corpus.name(),
+            number_of_contained_paths = corpus.path_count(),
+            "Deserialized corpus file"
+        );
+        metadata_files.extend(corpus.enumerate_tests());
+    }
+
+    // Several corpus paths may lead to the same metadata file. Sorting by path first makes the
+    // duplicates adjacent, which is what allows `dedup_by` to remove all of them.
+    metadata_files.sort_by(|a, b| a.metadata_file_path.cmp(&b.metadata_file_path));
+    metadata_files.dedup_by(|a, b| a.metadata_file_path == b.metadata_file_path);
+
+    Ok(metadata_files)
+}
@@ -0,0 +1,9 @@
+mod cached_compiler;
+mod metadata;
+mod pool;
+mod test;
+
+pub use cached_compiler::*;
+pub use metadata::*;
+pub use pool::*;
+pub use test::*;
@@ -16,7 +16,7 @@ pub struct NodePool {

 impl NodePool {
    /// Create a new Pool. This will start as many nodes as there are workers in `config`.
-    pub fn new(context: Context, platform: &dyn Platform) -> anyhow::Result<Self> {
+    pub async fn new(context: Context, platform: &dyn Platform) -> anyhow::Result<Self> {
        let concurrency_configuration = AsRef::<ConcurrencyConfiguration>::as_ref(&context);
        let nodes = concurrency_configuration.number_of_nodes;

@@ -33,11 +33,18 @@ impl NodePool {
                    .join()
                    .map_err(|error| anyhow::anyhow!("failed to spawn node: {:?}", error))
                    .context("Failed to join node spawn thread")?
-                    .map_err(|error| anyhow::anyhow!("node failed to spawn: {error}"))
                    .context("Node failed to spawn")?,
            );
        }

+        let pre_transactions_tasks = nodes
+            .iter_mut()
+            .map(|node| node.pre_transactions())
+            .collect::<Vec<_>>();
+        futures::future::try_join_all(pre_transactions_tasks)
+            .await
+            .context("Failed to run the pre-transactions task")?;
+
        Ok(Self {
            nodes,
            next: Default::default(),
@@ -0,0 +1,325 @@
+use std::collections::BTreeMap;
+use std::sync::Arc;
+use std::{borrow::Cow, path::Path};
+
+use futures::{Stream, StreamExt, stream};
+use indexmap::{IndexMap, indexmap};
+use revive_dt_common::iterators::EitherIter;
+use revive_dt_common::types::PlatformIdentifier;
+use revive_dt_config::Context;
+use revive_dt_format::mode::ParsedMode;
+use serde_json::{Value, json};
+
+use revive_dt_compiler::Mode;
+use revive_dt_compiler::SolidityCompiler;
+use revive_dt_format::{
+    case::{Case, CaseIdx},
+    metadata::MetadataFile,
+};
+use revive_dt_node_interaction::EthereumNode;
+use revive_dt_report::{ExecutionSpecificReporter, Reporter};
+use revive_dt_report::{TestSpecificReporter, TestSpecifier};
+use tracing::{debug, error, info};
+
+use crate::Platform;
+use crate::helpers::NodePool;
+
+pub async fn create_test_definitions_stream<'a>(
+    // This is only required for creating the compiler objects and is not used anywhere else in the
+    // function.
+    context: &Context,
+    metadata_files: impl IntoIterator<Item = &'a MetadataFile>,
+    platforms_and_nodes: &'a BTreeMap<PlatformIdentifier, (&dyn Platform, NodePool)>,
+    reporter: Reporter,
+) -> impl Stream<Item = TestDefinition<'a>> {
+    stream::iter(
+        metadata_files
+            .into_iter()
+            // Flatten over the cases.
+            .flat_map(|metadata_file| {
+                metadata_file
+                    .cases
+                    .iter()
+                    .enumerate()
+                    .map(move |(case_idx, case)| (metadata_file, case_idx, case))
+            })
+            // Flatten over the modes, prefer the case modes over the metadata file modes.
+            .flat_map(move |(metadata_file, case_idx, case)| {
+                let reporter = reporter.clone();
+
+                let modes = case.modes.as_ref().or(metadata_file.modes.as_ref());
+                let modes = match modes {
+                    Some(modes) => EitherIter::A(
+                        ParsedMode::many_to_modes(modes.iter()).map(Cow::<'static, _>::Owned),
+                    ),
+                    None => EitherIter::B(Mode::all().map(Cow::<'static, _>::Borrowed)),
+                };
+
+                modes.into_iter().map(move |mode| {
+                    (
+                        metadata_file,
+                        case_idx,
+                        case,
+                        mode.clone(),
+                        reporter.test_specific_reporter(Arc::new(TestSpecifier {
+                            solc_mode: mode.as_ref().clone(),
+                            metadata_file_path: metadata_file.metadata_file_path.clone(),
+                            case_idx: CaseIdx::new(case_idx),
+                        })),
+                    )
+                })
+            })
+            // Inform the reporter of each one of the test cases that were discovered which we expect to
+            // run.
+            .inspect(|(_, _, _, _, reporter)| {
+                reporter
+                    .report_test_case_discovery_event()
+                    .expect("Can't fail");
+            }),
+    )
+    // Creating the Test Definition objects from all of the various objects we have and creating
+    // their required dependencies (e.g., compiler).
+    .filter_map(
+        move |(metadata_file, case_idx, case, mode, reporter)| async move {
+            let mut platforms = BTreeMap::new();
+            for (platform, node_pool) in platforms_and_nodes.values() {
+                let node = node_pool.round_robbin();
+                let compiler = platform
+                    .new_compiler(context.clone(), mode.version.clone().map(Into::into))
+                    .await
+                    .inspect_err(|err| {
+                        error!(
+                            ?err,
+                            platform_identifier = %platform.platform_identifier(),
+                            "Failed to instantiate the compiler"
+                        )
+                    })
+                    .ok()?;
+
+                reporter
+                    .report_node_assigned_event(
+                        node.id(),
+                        platform.platform_identifier(),
+                        node.connection_string(),
+                    )
+                    .expect("Can't fail");
+
+                let reporter =
+                    reporter.execution_specific_reporter(node.id(), platform.platform_identifier());
+
+                platforms.insert(
+                    platform.platform_identifier(),
+                    TestPlatformInformation {
+                        platform: *platform,
+                        node,
+                        compiler,
+                        reporter,
+                    },
+                );
+            }
+
+            Some(TestDefinition {
+                /* Metadata file information */
+                metadata: metadata_file,
+                metadata_file_path: metadata_file.metadata_file_path.as_path(),
+
+                /* Mode Information */
+                mode: mode.clone(),
+
+                /* Case Information */
+                case_idx: CaseIdx::new(case_idx),
+                case,
+
+                /* Platform and Node Assignment Information */
+                platforms,
+
+                /* Reporter */
+                reporter,
+            })
+        },
+    )
+    // Filter out the test cases which are incompatible or that can't run in the current setup.
+    .filter_map(move |test| async move {
+        match test.check_compatibility() {
+            Ok(()) => Some(test),
+            Err((reason, additional_information)) => {
+                debug!(
+                    metadata_file_path = %test.metadata.metadata_file_path.display(),
+                    case_idx = %test.case_idx,
+                    mode = %test.mode,
+                    reason,
+                    additional_information =
+                        serde_json::to_string(&additional_information).unwrap(),
+                    "Ignoring Test Case"
+                );
+                test.reporter
+                    .report_test_ignored_event(
+                        reason.to_string(),
+                        additional_information
+                            .into_iter()
+                            .map(|(k, v)| (k.into(), v))
+                            .collect::<IndexMap<_, _>>(),
+                    )
+                    .expect("Can't fail");
+                None
+            }
+        }
+    })
+    .inspect(|test| {
+        info!(
+            metadata_file_path = %test.metadata_file_path.display(),
+            case_idx = %test.case_idx,
+            mode = %test.mode,
+            "Created a test case definition"
+        );
+    })
+}
+
+/// A full description of a differential test to run: the full metadata file, the specific case to
+/// be tested, the compilation mode, the platforms that the test should run on, the specific nodes
+/// of these platforms that it should run on, the compilers to use, and the test-specific reporter,
+/// making it a complete description.
+pub struct TestDefinition<'a> {
+    /* Metadata file information */
+    pub metadata: &'a MetadataFile,
+    pub metadata_file_path: &'a Path,
+
+    /* Mode Information */
+    pub mode: Cow<'a, Mode>,
+
+    /* Case Information */
+    pub case_idx: CaseIdx,
+    pub case: &'a Case,
+
+    /* Platform and Node Assignment Information */
+    pub platforms: BTreeMap<PlatformIdentifier, TestPlatformInformation<'a>>,
+
+    /* Reporter */
+    pub reporter: TestSpecificReporter,
+}
+
+impl<'a> TestDefinition<'a> {
+    /// Checks if this test can be run with the current configuration.
+    pub fn check_compatibility(&self) -> TestCheckFunctionResult {
+        self.check_metadata_file_ignored()?;
+        self.check_case_file_ignored()?;
+        self.check_target_compatibility()?;
+        self.check_evm_version_compatibility()?;
+        self.check_compiler_compatibility()?;
+        Ok(())
+    }
+
+    /// Checks if the metadata file is ignored or not.
+    fn check_metadata_file_ignored(&self) -> TestCheckFunctionResult {
+        if self.metadata.ignore.is_some_and(|ignore| ignore) {
+            Err(("Metadata file is ignored.", indexmap! {}))
+        } else {
+            Ok(())
+        }
+    }
+
+    /// Checks if the case file is ignored or not.
+    fn check_case_file_ignored(&self) -> TestCheckFunctionResult {
+        if self.case.ignore.is_some_and(|ignore| ignore) {
+            Err(("Case is ignored.", indexmap! {}))
+        } else {
+            Ok(())
+        }
+    }
+
+    /// Checks if the platforms all support the desired targets in the metadata file.
+    fn check_target_compatibility(&self) -> TestCheckFunctionResult {
+        let mut error_map = indexmap! {
+            "test_desired_targets" => json!(self.metadata.targets.as_ref()),
+        };
+        let mut is_allowed = true;
+        for (_, platform_information) in self.platforms.iter() {
+            let is_allowed_for_platform = match self.metadata.targets.as_ref() {
+                None => true,
+                Some(required_vm_identifiers) => {
+                    required_vm_identifiers.contains(&platform_information.platform.vm_identifier())
+                }
+            };
+            is_allowed &= is_allowed_for_platform;
+            error_map.insert(
+                platform_information.platform.platform_identifier().into(),
+                json!(is_allowed_for_platform),
+            );
+        }
+
+        if is_allowed {
+            Ok(())
+        } else {
+            Err((
+                "One of the platforms does not support the targets allowed by the test.",
+                error_map,
+            ))
+        }
+    }
+
+    /// Checks for the compatibility of the EVM version with the platforms specified.
+    fn check_evm_version_compatibility(&self) -> TestCheckFunctionResult {
+        let Some(evm_version_requirement) = self.metadata.required_evm_version else {
+            return Ok(());
+        };
+
+        let mut error_map = indexmap! {
+            "test_desired_evm_version" => json!(self.metadata.required_evm_version),
+        };
+        let mut is_allowed = true;
+        for (_, platform_information) in self.platforms.iter() {
+            let is_allowed_for_platform =
+                evm_version_requirement.matches(&platform_information.node.evm_version());
+            is_allowed &= is_allowed_for_platform;
+            error_map.insert(
+                platform_information.platform.platform_identifier().into(),
+                json!(is_allowed_for_platform),
+            );
+        }
+
+        if is_allowed {
+            Ok(())
+        } else {
+            Err((
+                "EVM version is incompatible for the platforms specified",
+                error_map,
+            ))
+        }
+    }
+
+    /// Checks if the platforms' compilers support the mode that the test is for.
+    fn check_compiler_compatibility(&self) -> TestCheckFunctionResult {
+        let mut error_map = indexmap! {
+            "test_desired_mode" => json!(self.mode.to_string()),
+        };
+        let mut is_allowed = true;
+        for (_, platform_information) in self.platforms.iter() {
+            let is_allowed_for_platform = platform_information
+                .compiler
+                .supports_mode(self.mode.optimize_setting, self.mode.pipeline);
+            is_allowed &= is_allowed_for_platform;
+            error_map.insert(
+                platform_information.platform.platform_identifier().into(),
+                json!(is_allowed_for_platform),
+            );
+        }
+
+        if is_allowed {
+            Ok(())
+        } else {
+            Err((
+                "Compilers do not support this mode either for the provided platforms.",
+                error_map,
+            ))
+        }
+    }
+}
+
+pub struct TestPlatformInformation<'a> {
+    pub platform: &'a dyn Platform,
+    pub node: &'a dyn EthereumNode,
+    pub compiler: Box<dyn SolidityCompiler>,
+    pub reporter: ExecutionSpecificReporter,
+}
+
+type TestCheckFunctionResult = Result<(), (&'static str, IndexMap<&'static str, Value>)>;
@@ -14,13 +14,13 @@ use revive_dt_common::types::*;
 use revive_dt_compiler::{SolidityCompiler, revive_resolc::Resolc, solc::Solc};
 use revive_dt_config::*;
 use revive_dt_node::{
-    Node, geth::GethNode, lighthouse_geth::LighthouseGethNode, substrate::SubstrateNode,
+    Node, node_implementations::geth::GethNode,
+    node_implementations::lighthouse_geth::LighthouseGethNode,
+    node_implementations::substrate::SubstrateNode,
 };
 use revive_dt_node_interaction::EthereumNode;
 use tracing::info;

-pub mod driver;
-
 /// A trait that describes the interface for the platforms that are supported by the tool.
 #[allow(clippy::type_complexity)]
 pub trait Platform {
@@ -1,55 +1,21 @@
-mod cached_compiler;
-mod pool;
+mod differential_benchmarks;
+mod differential_tests;
+mod helpers;

-use std::{
-    borrow::Cow,
-    collections::{BTreeSet, HashMap},
-    io::{BufWriter, Write, stderr},
-    path::Path,
-    sync::Arc,
-    time::Instant,
-};
-
-use alloy::{
-    network::{Ethereum, TransactionBuilder},
-    rpc::types::TransactionRequest,
-};
-use anyhow::Context as _;
 use clap::Parser;
-use futures::stream;
-use futures::{Stream, StreamExt};
-use indexmap::{IndexMap, indexmap};
-use revive_dt_node_interaction::EthereumNode;
-use revive_dt_report::{
-    ExecutionSpecificReporter, ReportAggregator, Reporter, ReporterEvent, TestCaseStatus,
-    TestSpecificReporter, TestSpecifier,
-};
+use revive_dt_report::ReportAggregator;
 use schemars::schema_for;
-use serde_json::{Value, json};
-use tokio::sync::Mutex;
-use tracing::{debug, error, info, info_span, instrument};
+use tracing::info;
 use tracing_subscriber::{EnvFilter, FmtSubscriber};

-use revive_dt_common::{
-    iterators::EitherIter,
-    types::{Mode, PrivateKeyAllocator},
-};
-use revive_dt_compiler::SolidityCompiler;
-use revive_dt_config::{Context, *};
-use revive_dt_core::{
-    Platform,
-    driver::{CaseDriver, CaseState},
-};
-use revive_dt_format::{
-    case::{Case, CaseIdx},
-    corpus::Corpus,
-    metadata::{ContractPathAndIdent, Metadata, MetadataFile},
-    mode::ParsedMode,
-    steps::{FunctionCallStep, Step},
-};
+use revive_dt_config::Context;
+use revive_dt_core::Platform;
+use revive_dt_format::metadata::Metadata;

-use crate::cached_compiler::CachedCompiler;
-use crate::pool::NodePool;
+use crate::{
+    differential_benchmarks::handle_differential_benchmarks,
+    differential_tests::handle_differential_tests,
+};

 fn main() -> anyhow::Result<()> {
    let (writer, _guard) = tracing_appender::non_blocking::NonBlockingBuilder::default()
@@ -75,37 +41,37 @@ fn main() -> anyhow::Result<()> {
    let (reporter, report_aggregator_task) = ReportAggregator::new(context.clone()).into_task();

    match context {
-        Context::ExecuteTests(context) => {
-            let tests = collect_corpora(&context)
-                .context("Failed to collect corpus files from provided arguments")?
-                .into_iter()
-                .inspect(|(corpus, _)| {
-                    reporter
-                        .report_corpus_file_discovery_event(corpus.clone())
-                        .expect("Can't fail")
-                })
-                .flat_map(|(_, files)| files.into_iter())
-                .inspect(|metadata_file| {
-                    reporter
-                        .report_metadata_file_discovery_event(
-                            metadata_file.metadata_file_path.clone(),
-                            metadata_file.content.clone(),
-                        )
-                        .expect("Can't fail")
-                })
-                .collect::<Vec<_>>();
+        Context::Test(context) => tokio::runtime::Builder::new_multi_thread()
+            .worker_threads(context.concurrency_configuration.number_of_threads)
+            .enable_all()
+            .build()
+            .expect("Failed building the Runtime")
+            .block_on(async move {
+                let differential_tests_handling_task =
+                    handle_differential_tests(*context, reporter);

-            tokio::runtime::Builder::new_multi_thread()
-                .worker_threads(context.concurrency_configuration.number_of_threads)
-                .enable_all()
-                .build()
-                .expect("Failed building the Runtime")
-                .block_on(async move {
-                    execute_corpus(*context, &tests, reporter, report_aggregator_task)
-                        .await
-                        .context("Failed to execute corpus")
-                })
-        }
+                futures::future::try_join(differential_tests_handling_task, report_aggregator_task)
+                    .await?;
+
+                Ok(())
+            }),
+        Context::Benchmark(context) => tokio::runtime::Builder::new_multi_thread()
+            .worker_threads(context.concurrency_configuration.number_of_threads)
+            .enable_all()
+            .build()
+            .expect("Failed building the Runtime")
+            .block_on(async move {
+                let differential_benchmarks_handling_task =
+                    handle_differential_benchmarks(*context, reporter);
+
+                futures::future::try_join(
+                    differential_benchmarks_handling_task,
+                    report_aggregator_task,
+                )
+                .await?;
+
+                Ok(())
+            }),
        Context::ExportJsonSchema => {
            let schema = schema_for!(Metadata);
            println!("{}", serde_json::to_string_pretty(&schema).unwrap());
@@ -113,671 +79,3 @@ fn main() -> anyhow::Result<()> {
        }
    }
 }
-
-#[instrument(level = "debug", name = "Collecting Corpora", skip_all)]
-fn collect_corpora(
-    context: &TestExecutionContext,
-) -> anyhow::Result<HashMap<Corpus, Vec<MetadataFile>>> {
-    let mut corpora = HashMap::new();
-
-    for path in &context.corpus {
-        let span = info_span!("Processing corpus file", path = %path.display());
-        let _guard = span.enter();
-
-        let corpus = Corpus::try_from_path(path)?;
-        info!(
-            name = corpus.name(),
-            number_of_contained_paths = corpus.path_count(),
-            "Deserialized corpus file"
-        );
-        let tests = corpus.enumerate_tests();
-        corpora.insert(corpus, tests);
-    }
-
-    Ok(corpora)
-}
-
-async fn run_driver(
-    context: TestExecutionContext,
-    metadata_files: &[MetadataFile],
-    reporter: Reporter,
-    report_aggregator_task: impl Future<Output = anyhow::Result<()>>,
-    platforms: Vec<&dyn Platform>,
-) -> anyhow::Result<()> {
-    let mut nodes = Vec::<(&dyn Platform, NodePool)>::new();
-    for platform in platforms.into_iter() {
-        let pool = NodePool::new(Context::ExecuteTests(Box::new(context.clone())), platform)
-            .inspect_err(|err| {
-                error!(
-                    ?err,
-                    platform_identifier = %platform.platform_identifier(),
-                    "Failed to initialize the node pool for the platform."
-                )
-            })
-            .context("Failed to initialize the node pool")?;
-        nodes.push((platform, pool));
-    }
-
-    let tests_stream = tests_stream(
-        &context,
-        metadata_files.iter(),
-        nodes.as_slice(),
-        reporter.clone(),
-    )
-    .await;
-    let driver_task = start_driver_task(&context, tests_stream)
-        .await
-        .context("Failed to start driver task")?;
-    let cli_reporting_task = start_cli_reporting_task(reporter);
-
-    let (_, _, rtn) = tokio::join!(cli_reporting_task, driver_task, report_aggregator_task);
-    rtn?;
-
-    Ok(())
-}
-
-async fn tests_stream<'a>(
-    args: &TestExecutionContext,
-    metadata_files: impl IntoIterator<Item = &'a MetadataFile> + Clone,
-    nodes: &'a [(&dyn Platform, NodePool)],
-    reporter: Reporter,
-) -> impl Stream<Item = Test<'a>> {
-    let tests = metadata_files
-        .into_iter()
-        .flat_map(|metadata_file| {
-            metadata_file
-                .cases
-                .iter()
-                .enumerate()
-                .map(move |(case_idx, case)| (metadata_file, case_idx, case))
-        })
-        // Flatten over the modes, prefer the case modes over the metadata file modes.
-        .flat_map(|(metadata_file, case_idx, case)| {
-            let reporter = reporter.clone();
-
-            let modes = case.modes.as_ref().or(metadata_file.modes.as_ref());
-            let modes = match modes {
-                Some(modes) => EitherIter::A(
-                    ParsedMode::many_to_modes(modes.iter()).map(Cow::<'static, _>::Owned),
-                ),
-                None => EitherIter::B(Mode::all().map(Cow::<'static, _>::Borrowed)),
-            };
-
-            modes.into_iter().map(move |mode| {
-                (
-                    metadata_file,
-                    case_idx,
-                    case,
-                    mode.clone(),
-                    reporter.test_specific_reporter(Arc::new(TestSpecifier {
-                        solc_mode: mode.as_ref().clone(),
-                        metadata_file_path: metadata_file.metadata_file_path.clone(),
-                        case_idx: CaseIdx::new(case_idx),
-                    })),
-                )
-            })
-        })
-        .collect::<Vec<_>>();
-
-    // Note: before we do any kind of filtering or process the iterator in any way, we need to
-    // inform the report aggregator of all of the cases that were found as it keeps a state of the
-    // test cases for its internal use.
-    for (_, _, _, _, reporter) in tests.iter() {
-        reporter
-            .report_test_case_discovery_event()
-            .expect("Can't fail")
-    }
-
-    stream::iter(tests.into_iter())
-        .filter_map(
-            move |(metadata_file, case_idx, case, mode, reporter)| async move {
-                let mut platforms = Vec::new();
-                for (platform, node_pool) in nodes.iter() {
-                    let node = node_pool.round_robbin();
-                    let compiler = platform
-                        .new_compiler(
-                            Context::ExecuteTests(Box::new(args.clone())),
-                            mode.version.clone().map(Into::into),
-                        )
-                        .await
-                        .inspect_err(|err| {
-                            error!(
-                                ?err,
-                                platform_identifier = %platform.platform_identifier(),
-                                "Failed to instantiate the compiler"
-                            )
-                        })
-                        .ok()?;
-
-                    let reporter = reporter
-                        .execution_specific_reporter(node.id(), platform.platform_identifier());
-                    platforms.push((*platform, node, compiler, reporter));
-                }
-
-                Some(Test {
-                    metadata: metadata_file,
-                    metadata_file_path: metadata_file.metadata_file_path.as_path(),
-                    mode: mode.clone(),
-                    case_idx: CaseIdx::new(case_idx),
-                    case,
-                    platforms,
-                    reporter,
-                })
-            },
-        )
-        .filter_map(move |test| async move {
-            match test.check_compatibility() {
-                Ok(()) => Some(test),
-                Err((reason, additional_information)) => {
-                    debug!(
-                        metadata_file_path = %test.metadata.metadata_file_path.display(),
-                        case_idx = %test.case_idx,
-                        mode = %test.mode,
-                        reason,
-                        additional_information =
-                            serde_json::to_string(&additional_information).unwrap(),
-
-                        "Ignoring Test Case"
-                    );
-                    test.reporter
-                        .report_test_ignored_event(
-                            reason.to_string(),
-                            additional_information
-                                .into_iter()
-                                .map(|(k, v)| (k.into(), v))
-                                .collect::<IndexMap<_, _>>(),
-                        )
-                        .expect("Can't fail");
-                    None
-                }
-            }
-        })
-}
-
-/// Builds the future that drives every test of `tests` to completion.
-///
-/// The compilation cache shared by all tests is initialized eagerly, before the future is
-/// returned. The returned future runs the tests concurrently, bounded by the configured
-/// concurrency limit, and reports the outcome of each test through the test's own reporter.
-///
-/// # Errors
-///
-/// Fails if the cached compiler can't be initialized.
-async fn start_driver_task<'a>(
-    context: &TestExecutionContext,
-    tests: impl Stream<Item = Test<'a>>,
-) -> anyhow::Result<impl Future<Output = ()>> {
-    info!("Starting driver task");
-
-    let cache_directory = context
-        .working_directory
-        .as_path()
-        .join("compilation_cache");
-    let invalidate_cache = context
-        .compilation_configuration
-        .invalidate_compilation_cache;
-    let cached_compiler = CachedCompiler::new(cache_directory, invalidate_cache)
-        .await
-        .context("Failed to initialize cached compiler")?;
-    let cached_compiler = Arc::new(cached_compiler);
-
-    let concurrency_limit = context.concurrency_configuration.concurrency_limit();
-    let driver = tests.for_each_concurrent(concurrency_limit, move |test| {
-        // Each test gets its own handle to the shared compilation cache.
-        let cached_compiler = Arc::clone(&cached_compiler);
-
-        async move {
-            // Announce which node of which platform this test has been assigned to.
-            for (platform, node, ..) in &test.platforms {
-                test.reporter
-                    .report_node_assigned_event(
-                        node.id(),
-                        platform.platform_identifier(),
-                        node.connection_string(),
-                    )
-                    .expect("Can't fail");
-            }
-
-            // A fresh private key allocator is created for every test.
-            let allocator = PrivateKeyAllocator::new(
-                context.wallet_configuration.highest_private_key_exclusive(),
-            );
-            let private_key_allocator = Arc::new(Mutex::new(allocator));
-
-            let reporter = test.reporter.clone();
-            let outcome = handle_case_driver(&test, cached_compiler, private_key_allocator).await;
-
-            match outcome {
-                Err(error) => reporter
-                    .report_test_failed_event(format!("{error:#}"))
-                    .expect("Can't fail"),
-                Ok(steps_executed) => reporter
-                    .report_test_succeeded_event(steps_executed)
-                    .expect("Can't fail"),
-            }
-        }
-    });
-
-    Ok(driver)
-}
-
-/// Prints the result of every executed case, followed by a final summary, to stderr.
-///
-/// Only `MetadataFileSolcModeCombinationExecutionCompleted` events produce output; all other
-/// events are skipped. The loop ends as soon as receiving from the subscription fails, after
-/// which the summary line is written.
-///
-/// Writing is best-effort: I/O errors are deliberately ignored so that a broken stderr can
-/// never fail the run. The buffer is flushed after every reported event so that progress is
-/// visible while the run is still in flight rather than only once the buffer fills up.
-#[allow(irrefutable_let_patterns, clippy::uninlined_format_args)]
-async fn start_cli_reporting_task(reporter: Reporter) {
-    let mut aggregator_events_rx = reporter.subscribe().await.expect("Can't fail");
-    // NOTE(review): presumably dropped so that this task does not keep the reporter (and with
-    // it the event channel) alive once every other handle is gone - confirm.
-    drop(reporter);
-
-    let start = Instant::now();
-
-    // ANSI escape sequences used to style the output.
-    const GREEN: &str = "\x1B[32m";
-    const RED: &str = "\x1B[31m";
-    const GREY: &str = "\x1B[90m";
-    const COLOR_RESET: &str = "\x1B[0m";
-    const BOLD: &str = "\x1B[1m";
-    const BOLD_RESET: &str = "\x1B[22m";
-
-    let mut number_of_successes = 0;
-    let mut number_of_failures = 0;
-
-    let mut buf = BufWriter::new(stderr());
-    while let Ok(event) = aggregator_events_rx.recv().await {
-        let ReporterEvent::MetadataFileSolcModeCombinationExecutionCompleted {
-            metadata_file_path,
-            mode,
-            case_status,
-        } = event
-        else {
-            continue;
-        };
-
-        let _ = writeln!(buf, "{} - {}", mode, metadata_file_path.display());
-        for (case_idx, case_status) in case_status.into_iter() {
-            let _ = write!(buf, "\tCase Index {case_idx:>3}: ");
-            let _ = match case_status {
-                TestCaseStatus::Succeeded { steps_executed } => {
-                    number_of_successes += 1;
-                    writeln!(
-                        buf,
-                        "{}{}Case Succeeded{} - Steps Executed: {}{}",
-                        GREEN, BOLD, BOLD_RESET, steps_executed, COLOR_RESET
-                    )
-                }
-                TestCaseStatus::Failed { reason } => {
-                    number_of_failures += 1;
-                    writeln!(
-                        buf,
-                        "{}{}Case Failed{} - Reason: {}{}",
-                        RED,
-                        BOLD,
-                        BOLD_RESET,
-                        reason.trim(),
-                        COLOR_RESET,
-                    )
-                }
-                // Ignored cases are printed but count neither as a success nor as a failure.
-                TestCaseStatus::Ignored { reason, .. } => writeln!(
-                    buf,
-                    "{}{}Case Ignored{} - Reason: {}{}",
-                    GREY,
-                    BOLD,
-                    BOLD_RESET,
-                    reason.trim(),
-                    COLOR_RESET,
-                ),
-            };
-        }
-        let _ = writeln!(buf);
-
-        // Push the report out now; otherwise it would sit in the buffer until it fills up.
-        let _ = buf.flush();
-    }
-
-    // Summary at the end.
-    let _ = writeln!(
-        buf,
-        "{} cases: {}{}{} cases succeeded, {}{}{} cases failed in {} seconds",
-        number_of_successes + number_of_failures,
-        GREEN,
-        number_of_successes,
-        COLOR_RESET,
-        RED,
-        number_of_failures,
-        COLOR_RESET,
-        start.elapsed().as_secs()
-    );
-
-    // Flush explicitly instead of relying on the flush performed when the writer is dropped.
-    let _ = buf.flush();
-}
-
-/// Prepares every platform of `test` and then executes the case through a `CaseDriver`.
-///
-/// The preparation of a platform is a three stage pipeline:
-///
-/// 1. compile the contracts without any linked libraries,
-/// 2. deploy the libraries listed in the metadata file and record their addresses,
-/// 3. compile the contracts again with the deployed libraries and build the `CaseState` of
-///    the platform.
-///
-/// A platform for which any of the stages fails is logged and left out of the run; the
-/// remaining platforms are still handed to the driver.
-///
-/// Returns whatever `CaseDriver::execute` returns: the number of executed steps on success.
-// NOTE(review): when preparation fails for every platform the driver is still created, with an
-// empty platform list - confirm that this is the intended behavior.
-#[instrument(
-    level = "info",
-    name = "Handling Case",
-    skip_all,
-    fields(
-        metadata_file_path = %test.metadata.relative_path().display(),
-        mode = %test.mode,
-        case_idx = %test.case_idx,
-        case_name = test.case.name.as_deref().unwrap_or("Unnamed Case"),
-    )
-)]
-async fn handle_case_driver<'a>(
-    test: &Test<'a>,
-    cached_compiler: Arc<CachedCompiler<'a>>,
-    private_key_allocator: Arc<Mutex<PrivateKeyAllocator>>,
-) -> anyhow::Result<usize> {
-    let platform_state = stream::iter(test.platforms.iter())
-        // Compiling the pre-link contracts.
-        .filter_map(|(platform, node, compiler, reporter)| {
-            let cached_compiler = cached_compiler.clone();
-
-            async move {
-                let compiler_output = cached_compiler
-                    .compile_contracts(
-                        test.metadata,
-                        test.metadata_file_path,
-                        test.mode.clone(),
-                        None,
-                        compiler.as_ref(),
-                        *platform,
-                        reporter,
-                    )
-                    .await
-                    .inspect_err(|err| {
-                        error!(
-                            ?err,
-                            platform_identifier = %platform.platform_identifier(),
-                            "Pre-linking compilation failed"
-                        )
-                    })
-                    .ok()?;
-                Some((test, platform, node, compiler, reporter, compiler_output))
-            }
-        })
-        // Deploying the libraries for the platform.
-        .filter_map(
-            |(test, platform, node, compiler, reporter, compiler_output)| async move {
-                // Stays `None` when the metadata file declares no libraries.
-                let mut deployed_libraries = None::<HashMap<_, _>>;
-                let mut contract_sources = test
-                    .metadata
-                    .contract_sources()
-                    .inspect_err(|err| {
-                        error!(
-                            ?err,
-                            platform_identifier = %platform.platform_identifier(),
-                            "Failed to retrieve contract sources from metadata"
-                        )
-                    })
-                    .ok()?;
-                for library_instance in test
-                    .metadata
-                    .libraries
-                    .iter()
-                    .flatten()
-                    .flat_map(|(_, map)| map.values())
-                {
-                    debug!(%library_instance, "Deploying Library Instance");
-
-                    let Some(ContractPathAndIdent {
-                        contract_source_path: library_source_path,
-                        contract_ident: library_ident,
-                    }) = contract_sources.remove(library_instance)
-                    else {
-                        error!(
-                            %library_instance,
-                            platform_identifier = %platform.platform_identifier(),
-                            "Library instance not found in the contract sources"
-                        );
-                        return None;
-                    };
-
-                    let Some((code, abi)) = compiler_output
-                        .contracts
-                        .get(&library_source_path)
-                        .and_then(|contracts| contracts.get(library_ident.as_str()))
-                    else {
-                        error!(
-                            %library_instance,
-                            platform_identifier = %platform.platform_identifier(),
-                            "Library not found in the compiler output"
-                        );
-                        return None;
-                    };
-
-                    let code = alloy::hex::decode(code)
-                        .inspect_err(|err| {
-                            error!(
-                                ?err,
-                                %library_instance,
-                                platform_identifier = %platform.platform_identifier(),
-                                "Failed to hex-decode the library code"
-                            )
-                        })
-                        .ok()?;
-
-                    // Getting the deployer address from the cases themselves. This is to ensure
-                    // that we're doing the deployments from different accounts and therefore we're
-                    // not slowed down by the nonce.
-                    let deployer_address = test
-                        .case
-                        .steps
-                        .iter()
-                        .find_map(|step| match step {
-                            Step::FunctionCall(input) => input.caller.as_address().copied(),
-                            Step::BalanceAssertion(..) => None,
-                            Step::StorageEmptyAssertion(..) => None,
-                            Step::Repeat(..) => None,
-                            Step::AllocateAccount(..) => None,
-                        })
-                        .unwrap_or(FunctionCallStep::default_caller_address());
-                    let tx = TransactionBuilder::<Ethereum>::with_deploy_code(
-                        TransactionRequest::default().from(deployer_address),
-                        code,
-                    );
-                    let receipt = node
-                        .execute_transaction(tx)
-                        .await
-                        .inspect_err(|err| {
-                            error!(
-                                ?err,
-                                %library_instance,
-                                platform_identifier = %platform.platform_identifier(),
-                                "Failed to deploy the library"
-                            )
-                        })
-                        .ok()?;
-
-                    debug!(
-                        ?library_instance,
-                        platform_identifier = %platform.platform_identifier(),
-                        "Deployed library"
-                    );
-
-                    let Some(library_address) = receipt.contract_address else {
-                        error!(
-                            %library_instance,
-                            platform_identifier = %platform.platform_identifier(),
-                            "Library deployment receipt has no contract address"
-                        );
-                        return None;
-                    };
-
-                    deployed_libraries.get_or_insert_default().insert(
-                        library_instance.clone(),
-                        (library_ident.clone(), library_address, abi.clone()),
-                    );
-                }
-
-                Some((
-                    test,
-                    platform,
-                    node,
-                    compiler,
-                    reporter,
-                    compiler_output,
-                    deployed_libraries,
-                ))
-            },
-        )
-        // Compiling the post-link contracts. The pre-link compiler output is no longer needed
-        // at this point and is discarded.
-        .filter_map(
-            |(test, platform, node, compiler, reporter, _, deployed_libraries)| {
-                let cached_compiler = cached_compiler.clone();
-                let private_key_allocator = private_key_allocator.clone();
-
-                async move {
-                    let compiler_output = cached_compiler
-                        .compile_contracts(
-                            test.metadata,
-                            test.metadata_file_path,
-                            test.mode.clone(),
-                            deployed_libraries.as_ref(),
-                            compiler.as_ref(),
-                            *platform,
-                            reporter,
-                        )
-                        .await
-                        .inspect_err(|err| {
-                            error!(
-                                ?err,
-                                platform_identifier = %platform.platform_identifier(),
-                                "Post-linking compilation failed"
-                            )
-                        })
-                        .ok()?;
-
-                    let case_state = CaseState::new(
-                        compiler.version().clone(),
-                        compiler_output.contracts,
-                        deployed_libraries.unwrap_or_default(),
-                        reporter.clone(),
-                        private_key_allocator,
-                    );
-
-                    Some((*node, platform.platform_identifier(), case_state))
-                }
-            },
-        )
-        // Collect
-        .collect::<Vec<_>>()
-        .await;
-
-    let mut driver = CaseDriver::new(test.metadata, test.case, platform_state);
-    driver
-        .execute()
-        .await
-        .inspect(|steps_executed| info!(steps_executed, "Case succeeded"))
-}
-
-/// Runs the driver over `tests` on every distinct platform of `context`.
-///
-/// The configured platforms are de-duplicated (and thereby ordered) through a `BTreeSet`
-/// before they are handed to `run_driver` as `&dyn Platform` objects.
-///
-/// # Errors
-///
-/// Propagates any error returned by `run_driver`.
-async fn execute_corpus(
-    context: TestExecutionContext,
-    tests: &[MetadataFile],
-    reporter: Reporter,
-    report_aggregator_task: impl Future<Output = anyhow::Result<()>>,
-) -> anyhow::Result<()> {
-    let unique_platforms: BTreeSet<_> = context.platforms.iter().copied().collect();
-    let platforms: Vec<_> = unique_platforms
-        .into_iter()
-        .map(Into::<&dyn Platform>::into)
-        .collect();
-
-    run_driver(context, tests, reporter, report_aggregator_task, platforms).await?;
-
-    Ok(())
-}
-
-/// A single "test": one case of a metadata file under one mode, together with everything
-/// needed to run that case on each of the selected platforms.
-#[allow(clippy::type_complexity)]
-struct Test<'a> {
-    /// The metadata file that the case belongs to.
-    metadata: &'a MetadataFile,
-    /// The path of the metadata file; handed to the compiler together with `metadata`.
-    metadata_file_path: &'a Path,
-    /// The mode that the case is compiled with.
-    mode: Cow<'a, Mode>,
-    /// The index of the case.
-    case_idx: CaseIdx,
-    /// The case to execute.
-    case: &'a Case,
-    /// One entry per platform: the platform, the node used for it, the compiler used for it,
-    /// and the reporter used for that platform's execution.
-    platforms: Vec<(
-        &'a dyn Platform,
-        &'a dyn EthereumNode,
-        Box<dyn SolidityCompiler>,
-        ExecutionSpecificReporter,
-    )>,
-    /// The reporter through which events of this test as a whole are reported.
-    reporter: TestSpecificReporter,
-}
-
-impl<'a> Test<'a> {
-    /// Checks if this test can be ran with the current configuration.
-    ///
-    /// The individual checks run in a fixed order and the first one that fails determines the
-    /// returned reason and details.
-    pub fn check_compatibility(&self) -> TestCheckFunctionResult {
-        self.check_metadata_file_ignored()?;
-        self.check_case_file_ignored()?;
-        self.check_target_compatibility()?;
-        self.check_evm_version_compatibility()?;
-        self.check_compiler_compatibility()?;
-        Ok(())
-    }
-
-    /// Checks if the metadata file is ignored or not.
-    fn check_metadata_file_ignored(&self) -> TestCheckFunctionResult {
-        if self.metadata.ignore == Some(true) {
-            Err(("Metadata file is ignored.", indexmap! {}))
-        } else {
-            Ok(())
-        }
-    }
-
-    /// Checks if the case file is ignored or not.
-    fn check_case_file_ignored(&self) -> TestCheckFunctionResult {
-        if self.case.ignore == Some(true) {
-            Err(("Case is ignored.", indexmap! {}))
-        } else {
-            Ok(())
-        }
-    }
-
-    /// Checks if the platforms all support the desired targets in the metadata file.
-    ///
-    /// A metadata file without targets is compatible with every platform. On failure the
-    /// details contain the desired targets plus one boolean verdict per platform.
-    fn check_target_compatibility(&self) -> TestCheckFunctionResult {
-        let mut error_map = indexmap! {
-            "test_desired_targets" => json!(self.metadata.targets.as_ref()),
-        };
-        let mut is_allowed = true;
-        for (platform, ..) in self.platforms.iter() {
-            let is_allowed_for_platform = match self.metadata.targets.as_ref() {
-                None => true,
-                Some(targets) => targets
-                    .iter()
-                    .any(|target| &platform.vm_identifier() == target),
-            };
-            is_allowed &= is_allowed_for_platform;
-            error_map.insert(
-                platform.platform_identifier().into(),
-                json!(is_allowed_for_platform),
-            );
-        }
-
-        if is_allowed {
-            Ok(())
-        } else {
-            Err((
-                "One of the platforms does not support the targets allowed by the test.",
-                error_map,
-            ))
-        }
-    }
-
-    /// Checks for the compatibility of the EVM version with the platforms specified.
-    ///
-    /// A metadata file without an EVM version requirement is compatible with every platform.
-    /// On failure the details contain the requirement plus one boolean verdict per platform.
-    fn check_evm_version_compatibility(&self) -> TestCheckFunctionResult {
-        let Some(evm_version_requirement) = self.metadata.required_evm_version else {
-            return Ok(());
-        };
-
-        let mut error_map = indexmap! {
-            "test_desired_evm_version" => json!(self.metadata.required_evm_version),
-        };
-        let mut is_allowed = true;
-        for (platform, node, ..) in self.platforms.iter() {
-            let is_allowed_for_platform = evm_version_requirement.matches(&node.evm_version());
-            is_allowed &= is_allowed_for_platform;
-            error_map.insert(
-                platform.platform_identifier().into(),
-                json!(is_allowed_for_platform),
-            );
-        }
-
-        if is_allowed {
-            Ok(())
-        } else {
-            Err((
-                "EVM version is incompatible for the platforms specified",
-                error_map,
-            ))
-        }
-    }
-
-    /// Checks if the platforms compilers support the mode that the test is for.
-    ///
-    /// On failure the details contain the mode of the test plus one boolean verdict per
-    /// platform.
-    fn check_compiler_compatibility(&self) -> TestCheckFunctionResult {
-        // Record what this check is actually about: the mode, not the EVM version.
-        let mut error_map = indexmap! {
-            "test_desired_mode" => json!(self.mode.to_string()),
-        };
-        let mut is_allowed = true;
-        for (platform, _, compiler, ..) in self.platforms.iter() {
-            let is_allowed_for_platform =
-                compiler.supports_mode(self.mode.optimize_setting, self.mode.pipeline);
-            is_allowed &= is_allowed_for_platform;
-            error_map.insert(
-                platform.platform_identifier().into(),
-                json!(is_allowed_for_platform),
-            );
-        }
-
-        if is_allowed {
-            Ok(())
-        } else {
-            Err((
-                "Compilers do not support this mode either for the provided platforms.",
-                error_map,
-            ))
-        }
-    }
-}
-
-/// The result of a test compatibility check: `Ok(())` when the check passes, otherwise a static
-/// reason together with a map of additional JSON details about the failure.
-type TestCheckFunctionResult = Result<(), (&'static str, IndexMap<&'static str, Value>)>;