Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

feature(invariant) - persist and replay failure #7899

Merged
merged 6 commits into from
May 21, 2024
Merged
Show file tree
Hide file tree
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
44 changes: 41 additions & 3 deletions crates/config/src/invariant.rs
Original file line number Diff line number Diff line change
Expand Up @@ -8,9 +8,10 @@ use crate::{
},
};
use serde::{Deserialize, Serialize};
use std::path::PathBuf;

/// Contains for invariant testing
#[derive(Clone, Copy, Debug, PartialEq, Eq, Serialize, Deserialize)]
#[derive(Clone, Debug, PartialEq, Eq, Serialize, Deserialize)]
pub struct InvariantConfig {
/// The number of runs that must execute for each invariant test group.
pub runs: u32,
Expand All @@ -31,6 +32,8 @@ pub struct InvariantConfig {
pub max_assume_rejects: u32,
/// Number of runs to execute and include in the gas report.
pub gas_report_samples: u32,
/// Path where invariant failures are recorded and replayed.
pub failure_persist_dir: Option<PathBuf>,
}

impl Default for InvariantConfig {
Expand All @@ -44,10 +47,43 @@ impl Default for InvariantConfig {
shrink_run_limit: 2usize.pow(18_u32),
max_assume_rejects: 65536,
gas_report_samples: 256,
failure_persist_dir: None,
}
}
}

impl InvariantConfig {
/// Creates invariant configuration to write failures in `{PROJECT_ROOT}/cache/fuzz` dir.
pub fn new(cache_dir: PathBuf) -> Self {
InvariantConfig {
runs: 256,
depth: 15,
fail_on_revert: false,
call_override: false,
dictionary: FuzzDictionaryConfig { dictionary_weight: 80, ..Default::default() },
shrink_run_limit: 2usize.pow(18_u32),
max_assume_rejects: 65536,
gas_report_samples: 256,
failure_persist_dir: Some(cache_dir),
}
}

/// Returns path to failure dir of given invariant test contract.
pub fn failure_dir(self, contract_name: &str) -> PathBuf {
self.failure_persist_dir
.unwrap()
.join("failures")
.join(contract_name.split(':').last().unwrap())
}

/// Returns path to persisted failure of current invariant test (if any).
/// The path to failure file is `{failure_dir}/{test_contract_name}/{invariant_name}`,
/// for example: `cache/invariant/failures/InvariantTest/invariant_check`
pub fn failure_file(self, contract_name: &str, test_name: String) -> PathBuf {
self.failure_dir(contract_name).join(test_name)
}
}

impl InlineConfigParser for InvariantConfig {
fn config_key() -> String {
INLINE_CONFIG_INVARIANT_KEY.into()
Expand All @@ -60,8 +96,7 @@ impl InlineConfigParser for InvariantConfig {
return Ok(None)
}

// self is Copy. We clone it with dereference.
let mut conf_clone = *self;
let mut conf_clone = self.clone();

for pair in overrides {
let key = pair.0;
Expand All @@ -71,6 +106,9 @@ impl InlineConfigParser for InvariantConfig {
"depth" => conf_clone.depth = parse_config_u32(key, value)?,
"fail-on-revert" => conf_clone.fail_on_revert = parse_config_bool(key, value)?,
"call-override" => conf_clone.call_override = parse_config_bool(key, value)?,
"failure-persist-dir" => {
conf_clone.failure_persist_dir = Some(PathBuf::from(value))
}
_ => Err(InlineConfigParserError::InvalidConfigProperty(key.to_string()))?,
}
}
Expand Down
28 changes: 20 additions & 8 deletions crates/config/src/lib.rs
Original file line number Diff line number Diff line change
Expand Up @@ -787,13 +787,20 @@ impl Config {
pub fn cleanup(&self, project: &Project) -> Result<(), SolcError> {
project.cleanup()?;

// Remove fuzz cache directory.
if let Some(fuzz_cache) = &self.fuzz.failure_persist_dir {
let path = project.root().join(fuzz_cache);
if path.exists() {
std::fs::remove_dir_all(&path).map_err(|e| SolcIoError::new(e, path))?;
}
macro_rules! remove_test_cache {
($cache_dir:expr) => {
if let Some(test_cache) = $cache_dir {
let path = project.root().join(test_cache);
if path.exists() {
std::fs::remove_dir_all(&path).map_err(|e| SolcIoError::new(e, path))?;
}
}
};
}
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

can we convert this into either a private function or closure instead?

not a fan of using private macros for this

Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

changed in 9b22080 I opted not to throw the SolcIoError anymore (as is not really solc related) and just ignore, can readd it if you think it should be there

// Remove fuzz cache directory.
remove_test_cache!(&self.fuzz.failure_persist_dir);
// Remove invariant cache directory.
remove_test_cache!(&self.invariant.failure_persist_dir);

Ok(())
}
Expand Down Expand Up @@ -1952,7 +1959,7 @@ impl Default for Config {
path_pattern: None,
path_pattern_inverse: None,
fuzz: FuzzConfig::new("cache/fuzz".into()),
invariant: Default::default(),
invariant: InvariantConfig::new("cache/invariant".into()),
always_use_create_2_factory: false,
ffi: false,
prompt_timeout: 120,
Expand Down Expand Up @@ -4454,7 +4461,12 @@ mod tests {
let loaded = Config::load().sanitized();
assert_eq!(
loaded.invariant,
InvariantConfig { runs: 512, depth: 10, ..Default::default() }
InvariantConfig {
runs: 512,
depth: 10,
failure_persist_dir: Some(PathBuf::from("cache/invariant")),
..Default::default()
}
);

Ok(())
Expand Down
13 changes: 4 additions & 9 deletions crates/evm/evm/src/executors/fuzz/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -175,15 +175,10 @@ impl FuzzedExecutor {
} else {
vec![]
};
result.counterexample = Some(CounterExample::Single(BaseCounterExample {
sender: None,
addr: None,
signature: None,
contract_name: None,
traces: call.traces,
calldata,
args,
}));

result.counterexample = Some(CounterExample::Single(
BaseCounterExample::from_fuzz_call(calldata, args, call.traces),
));
}
_ => {}
}
Expand Down
1 change: 1 addition & 0 deletions crates/evm/evm/src/executors/invariant/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -40,6 +40,7 @@ mod result;
pub use result::InvariantFuzzTestResult;

mod shrink;
pub use shrink::check_sequence;

sol! {
interface IInvariantTest {
Expand Down
46 changes: 25 additions & 21 deletions crates/evm/evm/src/executors/invariant/replay.rs
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,7 @@ use foundry_evm_core::constants::CALLER;
use foundry_evm_coverage::HitMaps;
use foundry_evm_fuzz::{
invariant::{BasicTxDetails, InvariantContract},
BaseCounterExample, CounterExample,
BaseCounterExample,
};
use foundry_evm_traces::{load_contracts, TraceKind, Traces};
use parking_lot::RwLock;
Expand All @@ -28,7 +28,7 @@ pub fn replay_run(
traces: &mut Traces,
coverage: &mut Option<HitMaps>,
inputs: Vec<BasicTxDetails>,
) -> Result<Option<CounterExample>> {
) -> Result<Vec<BaseCounterExample>> {
// We want traces for a failed case.
executor.set_tracing(true);

Expand Down Expand Up @@ -56,31 +56,34 @@ pub fn replay_run(
));

// Create counter example to be used in failed case.
counterexample_sequence.push(BaseCounterExample::create(
counterexample_sequence.push(BaseCounterExample::from_invariant_call(
*sender,
*addr,
bytes,
&ided_contracts,
call_result.traces,
));

// Replay invariant to collect logs and traces.
let error_call_result = executor.call_raw(
CALLER,
invariant_contract.address,
invariant_contract
.invariant_function
.abi_encode_input(&[])
.expect("invariant should have no inputs")
.into(),
U256::ZERO,
)?;
traces.push((TraceKind::Execution, error_call_result.traces.clone().unwrap()));
logs.extend(error_call_result.logs);
}

Ok((!counterexample_sequence.is_empty())
.then_some(CounterExample::Sequence(counterexample_sequence)))
// Replay invariant to collect logs and traces.
// We do this only once at the end of the replayed sequence.
// Checking after each call doesn't add valuable info for passing scenario
// (invariant call result is always success) nor for failed scenarios
// (invariant call result is always success until the last call that breaks it).
let invariant_result = executor.call_raw(
CALLER,
invariant_contract.address,
invariant_contract
.invariant_function
.abi_encode_input(&[])
.expect("invariant should have no inputs")
.into(),
U256::ZERO,
)?;
traces.push((TraceKind::Execution, invariant_result.traces.clone().unwrap()));
logs.extend(invariant_result.logs);

Ok(counterexample_sequence)
}

/// Replays the error case, shrinks the failing sequence and collects all necessary traces.
Expand All @@ -94,15 +97,16 @@ pub fn replay_error(
logs: &mut Vec<Log>,
traces: &mut Traces,
coverage: &mut Option<HitMaps>,
) -> Result<Option<CounterExample>> {
) -> Result<Vec<BaseCounterExample>> {
match failed_case.test_error {
// Don't use at the moment.
TestError::Abort(_) => Ok(None),
TestError::Abort(_) => Ok(vec![]),
TestError::Fail(_, ref calls) => {
// Shrink sequence of failed calls.
let calls = shrink_sequence(failed_case, calls, &executor)?;

set_up_inner_replay(&mut executor, &failed_case.inner_sequence);

// Replay calls to get the counterexample and to collect logs, traces and coverage.
replay_run(
invariant_contract,
Expand Down
39 changes: 22 additions & 17 deletions crates/evm/evm/src/executors/invariant/shrink.rs
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
use crate::executors::{invariant::error::FailedInvariantCaseData, Executor};
use alloy_primitives::U256;
use alloy_primitives::{Address, Bytes, U256};
use foundry_evm_core::constants::CALLER;
use foundry_evm_fuzz::invariant::BasicTxDetails;
use proptest::bits::{BitSetLike, VarBitSet};
Expand Down Expand Up @@ -97,7 +97,14 @@ pub(crate) fn shrink_sequence(
let mut shrinker = CallSequenceShrinker::new(calls.len());
for _ in 0..failed_case.shrink_run_limit {
// Check candidate sequence result.
match check_sequence(failed_case, executor.clone(), calls, shrinker.current().collect()) {
match check_sequence(
executor.clone(),
calls,
shrinker.current().collect(),
failed_case.addr,
failed_case.func.clone(),
failed_case.fail_on_revert,
) {
// If candidate sequence still fails then shrink more if possible.
Ok(false) if !shrinker.simplify() => break,
// If candidate sequence pass then restore last removed call and shrink other
Expand All @@ -110,41 +117,39 @@ pub(crate) fn shrink_sequence(
Ok(shrinker.current().map(|idx| &calls[idx]).cloned().collect())
}

/// Checks if the shrinked sequence fails test, if it does then we can try simplifying more.
fn check_sequence(
failed_case: &FailedInvariantCaseData,
/// Checks if the given call sequence breaks the invariant.
/// Used in shrinking phase for checking candidate sequences and in replay failures phase to test
/// persisted failures.
pub fn check_sequence(
mut executor: Executor,
calls: &[BasicTxDetails],
sequence: Vec<usize>,
test_address: Address,
test_function: Bytes,
fail_on_revert: bool,
) -> eyre::Result<bool> {
let mut sequence_failed = false;
// Apply the shrinked candidate sequence.
// Apply the call sequence.
for call_index in sequence {
let (sender, (addr, bytes)) = &calls[call_index];
let call_result =
executor.call_raw_committing(*sender, *addr, bytes.clone(), U256::ZERO)?;
if call_result.reverted && failed_case.fail_on_revert {
if call_result.reverted && fail_on_revert {
// Candidate sequence fails test.
// We don't have to apply remaining calls to check sequence.
sequence_failed = true;
break;
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

can't we just return here instead of managing sequence_failed flag and counting calls for replayed_entirely?

Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

yep yep, nice cleanup! 7686c03

}
}
// Return without checking the invariant if we already have failing sequence.
// Return without checking the invariant if we already have a failing sequence.
if sequence_failed {
return Ok(false);
};

// Check the invariant for candidate sequence.
// If sequence fails then we can continue with shrinking - the removed call does not affect
// failure.
//
// If sequence doesn't fail then we have to restore last removed call and continue with next
// call - removed call is a required step for reproducing the failure.
let mut call_result =
executor.call_raw(CALLER, failed_case.addr, failed_case.func.clone(), U256::ZERO)?;
// Check the invariant for call sequence.
let mut call_result = executor.call_raw(CALLER, test_address, test_function, U256::ZERO)?;
Ok(executor.is_raw_call_success(
failed_case.addr,
test_address,
Cow::Owned(call_result.state_changeset.take().unwrap()),
&call_result,
false,
Expand Down
Loading
Loading