use alloy_consensus::BlockHeader;
use alloy_primitives::{Address, B256, U256};
use alloy_provider::network::TransactionResponse;
use parking_lot::RwLock;
use revm::{
primitives::{
map::{AddressHashMap, HashMap},
Account, AccountInfo, AccountStatus, BlobExcessGasAndPrice, BlockEnv, CfgEnv, KECCAK_EMPTY,
},
DatabaseCommit,
};
use serde::{ser::SerializeMap, Deserialize, Deserializer, Serialize, Serializer};
use std::{
collections::BTreeSet,
fs,
io::{BufWriter, Write},
path::{Path, PathBuf},
sync::Arc,
};
use url::Url;
pub type StorageInfo = HashMap<U256, U256>;
#[derive(Clone, Debug)]
pub struct BlockchainDb {
db: Arc<MemDb>,
meta: Arc<RwLock<BlockchainDbMeta>>,
cache: Arc<JsonBlockCacheDB>,
}
impl BlockchainDb {
pub fn new(meta: BlockchainDbMeta, cache_path: Option<PathBuf>) -> Self {
Self::new_db(meta, cache_path, false)
}
pub fn new_skip_check(meta: BlockchainDbMeta, cache_path: Option<PathBuf>) -> Self {
Self::new_db(meta, cache_path, true)
}
fn new_db(meta: BlockchainDbMeta, cache_path: Option<PathBuf>, skip_check: bool) -> Self {
trace!(target: "forge::cache", cache=?cache_path, "initialising blockchain db");
let cache = cache_path
.as_ref()
.and_then(|p| {
JsonBlockCacheDB::load(p).ok().filter(|cache| {
if skip_check {
return true;
}
let mut existing = cache.meta().write();
existing.hosts.extend(meta.hosts.clone());
if meta != *existing {
warn!(target: "cache", "non-matching block metadata");
false
} else {
true
}
})
})
.unwrap_or_else(|| JsonBlockCacheDB::new(Arc::new(RwLock::new(meta)), cache_path));
Self { db: Arc::clone(cache.db()), meta: Arc::clone(cache.meta()), cache: Arc::new(cache) }
}
pub fn accounts(&self) -> &RwLock<AddressHashMap<AccountInfo>> {
&self.db.accounts
}
pub fn storage(&self) -> &RwLock<AddressHashMap<StorageInfo>> {
&self.db.storage
}
pub fn block_hashes(&self) -> &RwLock<HashMap<U256, B256>> {
&self.db.block_hashes
}
pub const fn meta(&self) -> &Arc<RwLock<BlockchainDbMeta>> {
&self.meta
}
pub const fn cache(&self) -> &Arc<JsonBlockCacheDB> {
&self.cache
}
pub const fn db(&self) -> &Arc<MemDb> {
&self.db
}
}
#[derive(Clone, Debug, Eq, Serialize, Default)]
pub struct BlockchainDbMeta {
pub cfg_env: CfgEnv,
pub block_env: BlockEnv,
pub hosts: BTreeSet<String>,
}
impl BlockchainDbMeta {
pub fn new(env: revm::primitives::Env, url: String) -> Self {
let host = Url::parse(&url)
.ok()
.and_then(|url| url.host().map(|host| host.to_string()))
.unwrap_or(url);
Self { cfg_env: env.cfg.clone(), block_env: env.block, hosts: BTreeSet::from([host]) }
}
pub const fn with_chain_id(mut self, chain_id: u64) -> Self {
self.cfg_env.chain_id = chain_id;
self
}
pub fn with_block<T: TransactionResponse, H: BlockHeader>(
mut self,
block: &alloy_rpc_types::Block<T, H>,
) -> Self {
self.block_env = BlockEnv {
number: U256::from(block.header.number()),
coinbase: block.header.beneficiary(),
timestamp: U256::from(block.header.timestamp()),
difficulty: U256::from(block.header.difficulty()),
basefee: block.header.base_fee_per_gas().map(U256::from).unwrap_or_default(),
gas_limit: U256::from(block.header.gas_limit()),
prevrandao: block.header.mix_hash(),
blob_excess_gas_and_price: Some(BlobExcessGasAndPrice::new(
block.header.excess_blob_gas().unwrap_or_default(),
false,
)),
};
self
}
pub fn with_url(mut self, url: &str) -> Self {
let host = Url::parse(url)
.ok()
.and_then(|url| url.host().map(|host| host.to_string()))
.unwrap_or(url.to_string());
self.hosts.insert(host);
self
}
pub fn set_cfg_env(mut self, cfg_env: revm::primitives::CfgEnv) {
self.cfg_env = cfg_env;
}
pub fn set_block_env(mut self, block_env: revm::primitives::BlockEnv) {
self.block_env = block_env;
}
}
impl PartialEq for BlockchainDbMeta {
fn eq(&self, other: &Self) -> bool {
self.cfg_env == other.cfg_env && self.block_env == other.block_env
}
}
impl<'de> Deserialize<'de> for BlockchainDbMeta {
fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
where
D: Deserializer<'de>,
{
struct CfgEnvBackwardsCompat {
inner: revm::primitives::CfgEnv,
}
impl<'de> Deserialize<'de> for CfgEnvBackwardsCompat {
fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
where
D: Deserializer<'de>,
{
let mut value = serde_json::Value::deserialize(deserializer)?;
if let Some(obj) = value.as_object_mut() {
let default_value =
serde_json::to_value(revm::primitives::CfgEnv::default()).unwrap();
for (key, value) in default_value.as_object().unwrap() {
if !obj.contains_key(key) {
obj.insert(key.to_string(), value.clone());
}
}
}
let cfg_env: revm::primitives::CfgEnv =
serde_json::from_value(value).map_err(serde::de::Error::custom)?;
Ok(Self { inner: cfg_env })
}
}
struct BlockEnvBackwardsCompat {
inner: revm::primitives::BlockEnv,
}
impl<'de> Deserialize<'de> for BlockEnvBackwardsCompat {
fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
where
D: Deserializer<'de>,
{
let mut value = serde_json::Value::deserialize(deserializer)?;
if let Some(obj) = value.as_object_mut() {
let default_value =
serde_json::to_value(revm::primitives::BlockEnv::default()).unwrap();
for (key, value) in default_value.as_object().unwrap() {
if !obj.contains_key(key) {
obj.insert(key.to_string(), value.clone());
}
}
}
let cfg_env: revm::primitives::BlockEnv =
serde_json::from_value(value).map_err(serde::de::Error::custom)?;
Ok(Self { inner: cfg_env })
}
}
#[derive(Deserialize)]
struct Meta {
cfg_env: CfgEnvBackwardsCompat,
block_env: BlockEnvBackwardsCompat,
#[serde(alias = "host")]
hosts: Hosts,
}
#[derive(Deserialize)]
#[serde(untagged)]
enum Hosts {
Multi(BTreeSet<String>),
Single(String),
}
let Meta { cfg_env, block_env, hosts } = Meta::deserialize(deserializer)?;
Ok(Self {
cfg_env: cfg_env.inner,
block_env: block_env.inner,
hosts: match hosts {
Hosts::Multi(hosts) => hosts,
Hosts::Single(host) => BTreeSet::from([host]),
},
})
}
}
#[derive(Debug, Default)]
pub struct MemDb {
pub accounts: RwLock<AddressHashMap<AccountInfo>>,
pub storage: RwLock<AddressHashMap<StorageInfo>>,
pub block_hashes: RwLock<HashMap<U256, B256>>,
}
impl MemDb {
pub fn clear(&self) {
self.accounts.write().clear();
self.storage.write().clear();
self.block_hashes.write().clear();
}
pub fn do_insert_account(&self, address: Address, account: AccountInfo) {
self.accounts.write().insert(address, account);
}
pub fn do_commit(&self, changes: HashMap<Address, Account>) {
let mut storage = self.storage.write();
let mut accounts = self.accounts.write();
for (add, mut acc) in changes {
if acc.is_empty() || acc.is_selfdestructed() {
accounts.remove(&add);
storage.remove(&add);
} else {
if let Some(code_hash) = acc
.info
.code
.as_ref()
.filter(|code| !code.is_empty())
.map(|code| code.hash_slow())
{
acc.info.code_hash = code_hash;
} else if acc.info.code_hash.is_zero() {
acc.info.code_hash = KECCAK_EMPTY;
}
accounts.insert(add, acc.info);
let acc_storage = storage.entry(add).or_default();
if acc.status.contains(AccountStatus::Created) {
acc_storage.clear();
}
for (index, value) in acc.storage {
if value.present_value().is_zero() {
acc_storage.remove(&index);
} else {
acc_storage.insert(index, value.present_value());
}
}
if acc_storage.is_empty() {
storage.remove(&add);
}
}
}
}
}
impl Clone for MemDb {
fn clone(&self) -> Self {
Self {
storage: RwLock::new(self.storage.read().clone()),
accounts: RwLock::new(self.accounts.read().clone()),
block_hashes: RwLock::new(self.block_hashes.read().clone()),
}
}
}
impl DatabaseCommit for MemDb {
fn commit(&mut self, changes: HashMap<Address, Account>) {
self.do_commit(changes)
}
}
#[derive(Debug)]
pub struct JsonBlockCacheDB {
cache_path: Option<PathBuf>,
data: JsonBlockCacheData,
}
impl JsonBlockCacheDB {
fn new(meta: Arc<RwLock<BlockchainDbMeta>>, cache_path: Option<PathBuf>) -> Self {
Self { cache_path, data: JsonBlockCacheData { meta, data: Arc::new(Default::default()) } }
}
pub fn load(path: impl Into<PathBuf>) -> eyre::Result<Self> {
let path = path.into();
trace!(target: "cache", ?path, "reading json cache");
let contents = std::fs::read_to_string(&path).map_err(|err| {
warn!(?err, ?path, "Failed to read cache file");
err
})?;
let data = serde_json::from_str(&contents).map_err(|err| {
warn!(target: "cache", ?err, ?path, "Failed to deserialize cache data");
err
})?;
Ok(Self { cache_path: Some(path), data })
}
pub const fn db(&self) -> &Arc<MemDb> {
&self.data.data
}
pub const fn meta(&self) -> &Arc<RwLock<BlockchainDbMeta>> {
&self.data.meta
}
pub const fn is_transient(&self) -> bool {
self.cache_path.is_none()
}
#[instrument(level = "warn", skip_all, fields(path = ?self.cache_path))]
pub fn flush(&self) {
let Some(path) = &self.cache_path else { return };
self.flush_to(path.as_path());
}
pub fn flush_to(&self, cache_path: &Path) {
let path: &Path = cache_path;
trace!(target: "cache", "saving json cache");
if let Some(parent) = path.parent() {
let _ = fs::create_dir_all(parent);
}
let file = match fs::File::create(path) {
Ok(file) => file,
Err(e) => return warn!(target: "cache", %e, "Failed to open json cache for writing"),
};
let mut writer = BufWriter::new(file);
if let Err(e) = serde_json::to_writer(&mut writer, &self.data) {
return warn!(target: "cache", %e, "Failed to write to json cache");
}
if let Err(e) = writer.flush() {
return warn!(target: "cache", %e, "Failed to flush to json cache");
}
trace!(target: "cache", "saved json cache");
}
}
#[derive(Debug)]
pub struct JsonBlockCacheData {
pub meta: Arc<RwLock<BlockchainDbMeta>>,
pub data: Arc<MemDb>,
}
impl Serialize for JsonBlockCacheData {
fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
where
S: Serializer,
{
let mut map = serializer.serialize_map(Some(4))?;
map.serialize_entry("meta", &*self.meta.read())?;
map.serialize_entry("accounts", &*self.data.accounts.read())?;
map.serialize_entry("storage", &*self.data.storage.read())?;
map.serialize_entry("block_hashes", &*self.data.block_hashes.read())?;
map.end()
}
}
impl<'de> Deserialize<'de> for JsonBlockCacheData {
fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
where
D: Deserializer<'de>,
{
#[derive(Deserialize)]
struct Data {
meta: BlockchainDbMeta,
accounts: AddressHashMap<AccountInfo>,
storage: AddressHashMap<HashMap<U256, U256>>,
block_hashes: HashMap<U256, B256>,
}
let Data { meta, accounts, storage, block_hashes } = Data::deserialize(deserializer)?;
Ok(Self {
meta: Arc::new(RwLock::new(meta)),
data: Arc::new(MemDb {
accounts: RwLock::new(accounts),
storage: RwLock::new(storage),
block_hashes: RwLock::new(block_hashes),
}),
})
}
}
#[derive(Debug)]
pub struct FlushJsonBlockCacheDB(pub Arc<JsonBlockCacheDB>);
impl Drop for FlushJsonBlockCacheDB {
fn drop(&mut self) {
trace!(target: "fork::cache", "flushing cache");
self.0.flush();
trace!(target: "fork::cache", "flushed cache");
}
}
#[cfg(test)]
mod tests {
use super::*;
#[test]
fn can_deserialize_cache() {
let s = r#"{
"meta": {
"cfg_env": {
"chain_id": 1337,
"perf_analyse_created_bytecodes": "Analyse",
"limit_contract_code_size": 18446744073709551615,
"memory_limit": 4294967295,
"disable_block_gas_limit": false,
"disable_eip3607": false,
"disable_base_fee": false
},
"block_env": {
"number": "0xed3ddf",
"coinbase": "0x0000000000000000000000000000000000000000",
"timestamp": "0x6324bc3f",
"difficulty": "0x0",
"basefee": "0x2e5fda223",
"gas_limit": "0x1c9c380",
"prevrandao": "0x0000000000000000000000000000000000000000000000000000000000000000"
},
"hosts": [
"eth-mainnet.alchemyapi.io"
]
},
"accounts": {
"0xb8ffc3cd6e7cf5a098a1c92f48009765b24088dc": {
"balance": "0x0",
"nonce": 10,
"code_hash": "0x3ac64c95eedf82e5d821696a12daac0e1b22c8ee18a9fd688b00cfaf14550aad",
"code": {
"LegacyAnalyzed": {
"bytecode": "0x00",
"original_len": 0,
"jump_table": {
"order": "bitvec::order::Lsb0",
"head": {
"width": 8,
"index": 0
},
"bits": 1,
"data": [0]
}
}
}
}
},
"storage": {
"0xa354f35829ae975e850e23e9615b11da1b3dc4de": {
"0x290decd9548b62a8d60345a988386fc84ba6bc95484008f6362f93160ef3e564": "0x5553444320795661756c74000000000000000000000000000000000000000000",
"0x10": "0x37fd60ff8346",
"0x290decd9548b62a8d60345a988386fc84ba6bc95484008f6362f93160ef3e563": "0xb",
"0x6": "0xa0b86991c6218b36c1d19d4a2e9eb0ce3606eb48",
"0x5": "0x36ff5b93162e",
"0x14": "0x29d635a8e000",
"0x11": "0x63224c73",
"0x2": "0x6"
}
},
"block_hashes": {
"0xed3deb": "0xbf7be3174b261ea3c377b6aba4a1e05d5fae7eee7aab5691087c20cf353e9877",
"0xed3de9": "0xba1c3648e0aee193e7d00dffe4e9a5e420016b4880455641085a4731c1d32eef",
"0xed3de8": "0x61d1491c03a9295fb13395cca18b17b4fa5c64c6b8e56ee9cc0a70c3f6cf9855",
"0xed3de7": "0xb54560b5baeccd18350d56a3bee4035432294dc9d2b7e02f157813e1dee3a0be",
"0xed3dea": "0x816f124480b9661e1631c6ec9ee39350bda79f0cbfc911f925838d88e3d02e4b"
}
}"#;
let cache: JsonBlockCacheData = serde_json::from_str(s).unwrap();
assert_eq!(cache.data.accounts.read().len(), 1);
assert_eq!(cache.data.storage.read().len(), 1);
assert_eq!(cache.data.block_hashes.read().len(), 5);
let _s = serde_json::to_string(&cache).unwrap();
}
#[test]
fn can_deserialize_cache_post_4844() {
let s = r#"{
"meta": {
"cfg_env": {
"chain_id": 1,
"kzg_settings": "Default",
"perf_analyse_created_bytecodes": "Analyse",
"limit_contract_code_size": 18446744073709551615,
"memory_limit": 134217728,
"disable_block_gas_limit": false,
"disable_eip3607": true,
"disable_base_fee": false,
"optimism": false
},
"block_env": {
"number": "0x11c99bc",
"coinbase": "0x4838b106fce9647bdf1e7877bf73ce8b0bad5f97",
"timestamp": "0x65627003",
"gas_limit": "0x1c9c380",
"basefee": "0x64288ff1f",
"difficulty": "0xc6b1a299886016dea3865689f8393b9bf4d8f4fe8c0ad25f0058b3569297c057",
"prevrandao": "0xc6b1a299886016dea3865689f8393b9bf4d8f4fe8c0ad25f0058b3569297c057",
"blob_excess_gas_and_price": {
"excess_blob_gas": 0,
"blob_gasprice": 1
}
},
"hosts": [
"eth-mainnet.alchemyapi.io"
]
},
"accounts": {
"0x4838b106fce9647bdf1e7877bf73ce8b0bad5f97": {
"balance": "0x8e0c373cfcdfd0eb",
"nonce": 128912,
"code_hash": "0xc5d2460186f7233c927e7db2dcc703c0e500b653ca82273b7bfad8045d85a470",
"code": {
"LegacyAnalyzed": {
"bytecode": "0x00",
"original_len": 0,
"jump_table": {
"order": "bitvec::order::Lsb0",
"head": {
"width": 8,
"index": 0
},
"bits": 1,
"data": [0]
}
}
}
}
},
"storage": {},
"block_hashes": {}
}"#;
let cache: JsonBlockCacheData = serde_json::from_str(s).unwrap();
assert_eq!(cache.data.accounts.read().len(), 1);
let _s = serde_json::to_string(&cache).unwrap();
}
}