mirror of
https://github.com/pezkuwichain/pezkuwi-subxt.git
synced 2026-06-12 11:11:17 +00:00
96ca4bed0e
* Rework the trie cache * Align `state-machine` tests * Bump `schnellru` to 0.1.1 * Fix off-by-one * Align to review comments * Bump `ahash` to 0.8.2 * Bump `schnellru` to 0.2.0 * Bump `schnellru` to 0.2.1 * Remove unnecessary bound * Remove unnecessary loop when calculating maximum memory usage * Remove unnecessary `mut`s
981 lines
30 KiB
Rust
981 lines
30 KiB
Rust
// This file is part of Substrate.
|
|
|
|
// Copyright (C) 2022 Parity Technologies (UK) Ltd.
|
|
// SPDX-License-Identifier: Apache-2.0
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
//! Trie Cache
|
|
//!
|
|
//! Provides an implementation of the [`TrieCache`](trie_db::TrieCache) trait.
|
|
//! The implementation is split into three types [`SharedTrieCache`], [`LocalTrieCache`] and
|
|
//! [`TrieCache`]. The [`SharedTrieCache`] is the instance that should be kept around for the entire
|
|
//! lifetime of the node. It will store all cached trie nodes and values on a global level. Then
|
|
//! there is the [`LocalTrieCache`] that should be kept around per state instance requested from the
|
|
//! backend. As there are very likely multiple accesses to the state per instance, this
|
|
//! [`LocalTrieCache`] is used to cache the nodes and the values before they are merged back to the
|
|
//! shared instance. Last but not least there is the [`TrieCache`] that is being used per access to
|
|
//! the state. It will use the [`SharedTrieCache`] and the [`LocalTrieCache`] to fulfill cache
|
|
//! requests. If both of them don't provide the requested data it will be inserted into the
|
|
//! [`LocalTrieCache`] and then later into the [`SharedTrieCache`].
|
|
//!
|
|
//! The [`SharedTrieCache`] is bound to some maximum number of bytes. It is ensured that it never
|
|
//! runs above this limit. However as long as data is cached inside a [`LocalTrieCache`] it isn't
|
|
//! taken into account when limiting the [`SharedTrieCache`]. This means that for the lifetime of a
|
|
//! [`LocalTrieCache`] the actual memory usage could be above the allowed maximum.
|
|
|
|
use crate::{Error, NodeCodec};
|
|
use hash_db::Hasher;
|
|
use nohash_hasher::BuildNoHashHasher;
|
|
use parking_lot::{Mutex, MutexGuard};
|
|
use schnellru::LruMap;
|
|
use shared_cache::{ValueCacheKey, ValueCacheRef};
|
|
use std::{
|
|
collections::HashMap,
|
|
sync::{
|
|
atomic::{AtomicU64, Ordering},
|
|
Arc,
|
|
},
|
|
time::Duration,
|
|
};
|
|
use trie_db::{node::NodeOwned, CachedValue};
|
|
|
|
mod shared_cache;
|
|
|
|
pub use shared_cache::SharedTrieCache;
|
|
|
|
use self::shared_cache::ValueCacheKeyHash;
|
|
|
|
const LOG_TARGET: &str = "trie-cache";
|
|
|
|
/// The maximum amount of time we'll wait trying to acquire the shared cache lock
|
|
/// when the local cache is dropped and synchronized with the share cache.
|
|
///
|
|
/// This is just a failsafe; normally this should never trigger.
|
|
const SHARED_CACHE_WRITE_LOCK_TIMEOUT: Duration = Duration::from_millis(100);
|
|
|
|
/// The maximum number of existing keys in the shared cache that a single local cache
|
|
/// can promote to the front of the LRU cache in one go.
|
|
///
|
|
/// If we have a big shared cache and the local cache hits all of those keys we don't
|
|
/// want to spend forever bumping all of them.
|
|
const SHARED_NODE_CACHE_MAX_PROMOTED_KEYS: u32 = 1792;
|
|
/// Same as [`SHARED_NODE_CACHE_MAX_PROMOTED_KEYS`].
|
|
const SHARED_VALUE_CACHE_MAX_PROMOTED_KEYS: u32 = 1792;
|
|
|
|
/// The maximum portion of the shared cache (in percent) that a single local
|
|
/// cache can replace in one go.
|
|
///
|
|
/// We don't want a single local cache instance to have the ability to replace
|
|
/// everything in the shared cache.
|
|
const SHARED_NODE_CACHE_MAX_REPLACE_PERCENT: usize = 33;
|
|
/// Same as [`SHARED_NODE_CACHE_MAX_REPLACE_PERCENT`].
|
|
const SHARED_VALUE_CACHE_MAX_REPLACE_PERCENT: usize = 33;
|
|
|
|
/// The maximum inline capacity of the local cache, in bytes.
|
|
///
|
|
/// This is just an upper limit; since the maps are resized in powers of two
|
|
/// their actual size will most likely not exactly match this.
|
|
const LOCAL_NODE_CACHE_MAX_INLINE_SIZE: usize = 512 * 1024;
|
|
/// Same as [`LOCAL_NODE_CACHE_MAX_INLINE_SIZE`].
|
|
const LOCAL_VALUE_CACHE_MAX_INLINE_SIZE: usize = 512 * 1024;
|
|
|
|
/// The maximum size of the memory allocated on the heap by the local cache, in bytes.
|
|
const LOCAL_NODE_CACHE_MAX_HEAP_SIZE: usize = 2 * 1024 * 1024;
|
|
/// Same as [`LOCAL_NODE_CACHE_MAX_HEAP_SIZE`].
|
|
const LOCAL_VALUE_CACHE_MAX_HEAP_SIZE: usize = 4 * 1024 * 1024;
|
|
|
|
/// The size of the shared cache.
|
|
#[derive(Debug, Clone, Copy)]
|
|
pub struct CacheSize(usize);
|
|
|
|
impl CacheSize {
|
|
/// An unlimited cache size.
|
|
pub const fn unlimited() -> Self {
|
|
CacheSize(usize::MAX)
|
|
}
|
|
|
|
/// A cache size `bytes` big.
|
|
pub const fn new(bytes: usize) -> Self {
|
|
CacheSize(bytes)
|
|
}
|
|
}
|
|
|
|
/// A limiter for the local node cache. This makes sure the local cache doesn't grow too big.
|
|
#[derive(Default)]
|
|
pub struct LocalNodeCacheLimiter {
|
|
/// The current size (in bytes) of data allocated by this cache on the heap.
|
|
///
|
|
/// This doesn't include the size of the map itself.
|
|
current_heap_size: usize,
|
|
}
|
|
|
|
impl<H> schnellru::Limiter<H, NodeCached<H>> for LocalNodeCacheLimiter
|
|
where
|
|
H: AsRef<[u8]> + std::fmt::Debug,
|
|
{
|
|
type KeyToInsert<'a> = H;
|
|
type LinkType = u32;
|
|
|
|
#[inline]
|
|
fn is_over_the_limit(&self, length: usize) -> bool {
|
|
// Only enforce the limit if there's more than one element to make sure
|
|
// we can always add a new element to the cache.
|
|
if length <= 1 {
|
|
return false
|
|
}
|
|
|
|
self.current_heap_size > LOCAL_NODE_CACHE_MAX_HEAP_SIZE
|
|
}
|
|
|
|
#[inline]
|
|
fn on_insert<'a>(
|
|
&mut self,
|
|
_length: usize,
|
|
key: H,
|
|
cached_node: NodeCached<H>,
|
|
) -> Option<(H, NodeCached<H>)> {
|
|
self.current_heap_size += cached_node.heap_size();
|
|
Some((key, cached_node))
|
|
}
|
|
|
|
#[inline]
|
|
fn on_replace(
|
|
&mut self,
|
|
_length: usize,
|
|
_old_key: &mut H,
|
|
_new_key: H,
|
|
old_node: &mut NodeCached<H>,
|
|
new_node: &mut NodeCached<H>,
|
|
) -> bool {
|
|
debug_assert_eq!(_old_key.as_ref().len(), _new_key.as_ref().len());
|
|
self.current_heap_size =
|
|
self.current_heap_size + new_node.heap_size() - old_node.heap_size();
|
|
true
|
|
}
|
|
|
|
#[inline]
|
|
fn on_removed(&mut self, _key: &mut H, cached_node: &mut NodeCached<H>) {
|
|
self.current_heap_size -= cached_node.heap_size();
|
|
}
|
|
|
|
#[inline]
|
|
fn on_cleared(&mut self) {
|
|
self.current_heap_size = 0;
|
|
}
|
|
|
|
#[inline]
|
|
fn on_grow(&mut self, new_memory_usage: usize) -> bool {
|
|
new_memory_usage <= LOCAL_NODE_CACHE_MAX_INLINE_SIZE
|
|
}
|
|
}
|
|
|
|
/// A limiter for the local value cache. This makes sure the local cache doesn't grow too big.
|
|
#[derive(Default)]
|
|
pub struct LocalValueCacheLimiter {
|
|
/// The current size (in bytes) of data allocated by this cache on the heap.
|
|
///
|
|
/// This doesn't include the size of the map itself.
|
|
current_heap_size: usize,
|
|
}
|
|
|
|
impl<H> schnellru::Limiter<ValueCacheKey<H>, CachedValue<H>> for LocalValueCacheLimiter
|
|
where
|
|
H: AsRef<[u8]>,
|
|
{
|
|
type KeyToInsert<'a> = ValueCacheRef<'a, H>;
|
|
type LinkType = u32;
|
|
|
|
#[inline]
|
|
fn is_over_the_limit(&self, length: usize) -> bool {
|
|
// Only enforce the limit if there's more than one element to make sure
|
|
// we can always add a new element to the cache.
|
|
if length <= 1 {
|
|
return false
|
|
}
|
|
|
|
self.current_heap_size > LOCAL_VALUE_CACHE_MAX_HEAP_SIZE
|
|
}
|
|
|
|
#[inline]
|
|
fn on_insert(
|
|
&mut self,
|
|
_length: usize,
|
|
key: Self::KeyToInsert<'_>,
|
|
value: CachedValue<H>,
|
|
) -> Option<(ValueCacheKey<H>, CachedValue<H>)> {
|
|
self.current_heap_size += key.storage_key.len();
|
|
Some((key.into(), value))
|
|
}
|
|
|
|
#[inline]
|
|
fn on_replace(
|
|
&mut self,
|
|
_length: usize,
|
|
_old_key: &mut ValueCacheKey<H>,
|
|
_new_key: ValueCacheRef<H>,
|
|
_old_value: &mut CachedValue<H>,
|
|
_new_value: &mut CachedValue<H>,
|
|
) -> bool {
|
|
debug_assert_eq!(_old_key.storage_key.len(), _new_key.storage_key.len());
|
|
true
|
|
}
|
|
|
|
#[inline]
|
|
fn on_removed(&mut self, key: &mut ValueCacheKey<H>, _: &mut CachedValue<H>) {
|
|
self.current_heap_size -= key.storage_key.len();
|
|
}
|
|
|
|
#[inline]
|
|
fn on_cleared(&mut self) {
|
|
self.current_heap_size = 0;
|
|
}
|
|
|
|
#[inline]
|
|
fn on_grow(&mut self, new_memory_usage: usize) -> bool {
|
|
new_memory_usage <= LOCAL_VALUE_CACHE_MAX_INLINE_SIZE
|
|
}
|
|
}
|
|
|
|
/// A struct to gather hit/miss stats to aid in debugging the performance of the cache.
|
|
#[derive(Default)]
|
|
struct HitStats {
|
|
shared_hits: AtomicU64,
|
|
shared_fetch_attempts: AtomicU64,
|
|
local_hits: AtomicU64,
|
|
local_fetch_attempts: AtomicU64,
|
|
}
|
|
|
|
impl std::fmt::Display for HitStats {
|
|
fn fmt(&self, fmt: &mut std::fmt::Formatter) -> std::fmt::Result {
|
|
let shared_hits = self.shared_hits.load(Ordering::Relaxed);
|
|
let shared_fetch_attempts = self.shared_fetch_attempts.load(Ordering::Relaxed);
|
|
let local_hits = self.local_hits.load(Ordering::Relaxed);
|
|
let local_fetch_attempts = self.local_fetch_attempts.load(Ordering::Relaxed);
|
|
if shared_fetch_attempts == 0 && local_hits == 0 {
|
|
write!(fmt, "empty")
|
|
} else {
|
|
let percent_local = (local_hits as f32 / local_fetch_attempts as f32) * 100.0;
|
|
let percent_shared = (shared_hits as f32 / shared_fetch_attempts as f32) * 100.0;
|
|
write!(
|
|
fmt,
|
|
"local hit rate = {}% [{}/{}], shared hit rate = {}% [{}/{}]",
|
|
percent_local as u32,
|
|
local_hits,
|
|
local_fetch_attempts,
|
|
percent_shared as u32,
|
|
shared_hits,
|
|
shared_fetch_attempts
|
|
)
|
|
}
|
|
}
|
|
}
|
|
|
|
/// A struct to gather hit/miss stats for the node cache and the value cache.
|
|
#[derive(Default)]
|
|
struct TrieHitStats {
|
|
node_cache: HitStats,
|
|
value_cache: HitStats,
|
|
}
|
|
|
|
/// An internal struct to store the cached trie nodes.
|
|
pub(crate) struct NodeCached<H> {
|
|
/// The cached node.
|
|
pub node: NodeOwned<H>,
|
|
/// Whether this node was fetched from the shared cache or not.
|
|
pub is_from_shared_cache: bool,
|
|
}
|
|
|
|
impl<H> NodeCached<H> {
|
|
/// Returns the number of bytes allocated on the heap by this node.
|
|
fn heap_size(&self) -> usize {
|
|
self.node.size_in_bytes() - std::mem::size_of::<NodeOwned<H>>()
|
|
}
|
|
}
|
|
|
|
type NodeCacheMap<H> = LruMap<H, NodeCached<H>, LocalNodeCacheLimiter, schnellru::RandomState>;
|
|
|
|
type ValueCacheMap<H> = LruMap<
|
|
ValueCacheKey<H>,
|
|
CachedValue<H>,
|
|
LocalValueCacheLimiter,
|
|
BuildNoHashHasher<ValueCacheKey<H>>,
|
|
>;
|
|
|
|
type ValueAccessSet =
|
|
LruMap<ValueCacheKeyHash, (), schnellru::ByLength, BuildNoHashHasher<ValueCacheKeyHash>>;
|
|
|
|
/// The local trie cache.
|
|
///
|
|
/// This cache should be used per state instance created by the backend. One state instance is
|
|
/// referring to the state of one block. It will cache all the accesses that are done to the state
|
|
/// which could not be fullfilled by the [`SharedTrieCache`]. These locally cached items are merged
|
|
/// back to the shared trie cache when this instance is dropped.
|
|
///
|
|
/// When using [`Self::as_trie_db_cache`] or [`Self::as_trie_db_mut_cache`], it will lock Mutexes.
|
|
/// So, it is important that these methods are not called multiple times, because they otherwise
|
|
/// deadlock.
|
|
pub struct LocalTrieCache<H: Hasher> {
|
|
/// The shared trie cache that created this instance.
|
|
shared: SharedTrieCache<H>,
|
|
|
|
/// The local cache for the trie nodes.
|
|
node_cache: Mutex<NodeCacheMap<H::Out>>,
|
|
|
|
/// The local cache for the values.
|
|
value_cache: Mutex<ValueCacheMap<H::Out>>,
|
|
|
|
/// Keeps track of all values accessed in the shared cache.
|
|
///
|
|
/// This will be used to ensure that these nodes are brought to the front of the lru when this
|
|
/// local instance is merged back to the shared cache. This can actually lead to collision when
|
|
/// two [`ValueCacheKey`]s with different storage roots and keys map to the same hash. However,
|
|
/// as we only use this set to update the lru position it is fine, even if we bring the wrong
|
|
/// value to the top. The important part is that we always get the correct value from the value
|
|
/// cache for a given key.
|
|
shared_value_cache_access: Mutex<ValueAccessSet>,
|
|
|
|
stats: TrieHitStats,
|
|
}
|
|
|
|
impl<H: Hasher> LocalTrieCache<H> {
|
|
/// Return self as a [`TrieDB`](trie_db::TrieDB) compatible cache.
|
|
///
|
|
/// The given `storage_root` needs to be the storage root of the trie this cache is used for.
|
|
pub fn as_trie_db_cache(&self, storage_root: H::Out) -> TrieCache<'_, H> {
|
|
let value_cache = ValueCache::ForStorageRoot {
|
|
storage_root,
|
|
local_value_cache: self.value_cache.lock(),
|
|
shared_value_cache_access: self.shared_value_cache_access.lock(),
|
|
buffered_value: None,
|
|
};
|
|
|
|
TrieCache {
|
|
shared_cache: self.shared.clone(),
|
|
local_cache: self.node_cache.lock(),
|
|
value_cache,
|
|
stats: &self.stats,
|
|
}
|
|
}
|
|
|
|
/// Return self as [`TrieDBMut`](trie_db::TrieDBMut) compatible cache.
|
|
///
|
|
/// After finishing all operations with [`TrieDBMut`](trie_db::TrieDBMut) and having obtained
|
|
/// the new storage root, [`TrieCache::merge_into`] should be called to update this local
|
|
/// cache instance. If the function is not called, cached data is just thrown away and not
|
|
/// propagated to the shared cache. So, accessing these new items will be slower, but nothing
|
|
/// would break because of this.
|
|
pub fn as_trie_db_mut_cache(&self) -> TrieCache<'_, H> {
|
|
TrieCache {
|
|
shared_cache: self.shared.clone(),
|
|
local_cache: self.node_cache.lock(),
|
|
value_cache: ValueCache::Fresh(Default::default()),
|
|
stats: &self.stats,
|
|
}
|
|
}
|
|
}
|
|
|
|
impl<H: Hasher> Drop for LocalTrieCache<H> {
|
|
fn drop(&mut self) {
|
|
tracing::debug!(
|
|
target: LOG_TARGET,
|
|
"Local node trie cache dropped: {}",
|
|
self.stats.node_cache
|
|
);
|
|
|
|
tracing::debug!(
|
|
target: LOG_TARGET,
|
|
"Local value trie cache dropped: {}",
|
|
self.stats.value_cache
|
|
);
|
|
|
|
let mut shared_inner = match self.shared.write_lock_inner() {
|
|
Some(inner) => inner,
|
|
None => {
|
|
tracing::warn!(
|
|
target: LOG_TARGET,
|
|
"Timeout while trying to acquire a write lock for the shared trie cache"
|
|
);
|
|
return
|
|
},
|
|
};
|
|
|
|
shared_inner.node_cache_mut().update(self.node_cache.get_mut().drain());
|
|
|
|
shared_inner.value_cache_mut().update(
|
|
self.value_cache.get_mut().drain(),
|
|
self.shared_value_cache_access.get_mut().drain().map(|(key, ())| key),
|
|
);
|
|
}
|
|
}
|
|
|
|
/// The abstraction of the value cache for the [`TrieCache`].
|
|
enum ValueCache<'a, H: Hasher> {
|
|
/// The value cache is fresh, aka not yet associated to any storage root.
|
|
/// This is used for example when a new trie is being build, to cache new values.
|
|
Fresh(HashMap<Arc<[u8]>, CachedValue<H::Out>>),
|
|
/// The value cache is already bound to a specific storage root.
|
|
ForStorageRoot {
|
|
shared_value_cache_access: MutexGuard<'a, ValueAccessSet>,
|
|
local_value_cache: MutexGuard<'a, ValueCacheMap<H::Out>>,
|
|
storage_root: H::Out,
|
|
// The shared value cache needs to be temporarily locked when reading from it
|
|
// so we need to clone the value that is returned, but we need to be able to
|
|
// return a reference to the value, so we just buffer it here.
|
|
buffered_value: Option<CachedValue<H::Out>>,
|
|
},
|
|
}
|
|
|
|
impl<H: Hasher> ValueCache<'_, H> {
|
|
/// Get the value for the given `key`.
|
|
fn get<'a>(
|
|
&'a mut self,
|
|
key: &[u8],
|
|
shared_cache: &SharedTrieCache<H>,
|
|
stats: &HitStats,
|
|
) -> Option<&CachedValue<H::Out>> {
|
|
stats.local_fetch_attempts.fetch_add(1, Ordering::Relaxed);
|
|
|
|
match self {
|
|
Self::Fresh(map) =>
|
|
if let Some(value) = map.get(key) {
|
|
stats.local_hits.fetch_add(1, Ordering::Relaxed);
|
|
Some(value)
|
|
} else {
|
|
None
|
|
},
|
|
Self::ForStorageRoot {
|
|
local_value_cache,
|
|
shared_value_cache_access,
|
|
storage_root,
|
|
buffered_value,
|
|
} => {
|
|
// We first need to look up in the local cache and then the shared cache.
|
|
// It can happen that some value is cached in the shared cache, but the
|
|
// weak reference of the data can not be upgraded anymore. This for example
|
|
// happens when the node is dropped that contains the strong reference to the data.
|
|
//
|
|
// So, the logic of the trie would lookup the data and the node and store both
|
|
// in our local caches.
|
|
|
|
let hash = ValueCacheKey::hash_data(key, storage_root);
|
|
|
|
if let Some(value) = local_value_cache
|
|
.peek_by_hash(hash.raw(), |existing_key, _| {
|
|
existing_key.is_eq(storage_root, key)
|
|
}) {
|
|
stats.local_hits.fetch_add(1, Ordering::Relaxed);
|
|
|
|
return Some(value)
|
|
}
|
|
|
|
stats.shared_fetch_attempts.fetch_add(1, Ordering::Relaxed);
|
|
if let Some(value) = shared_cache.peek_value_by_hash(hash, storage_root, key) {
|
|
stats.shared_hits.fetch_add(1, Ordering::Relaxed);
|
|
shared_value_cache_access.insert(hash, ());
|
|
*buffered_value = Some(value.clone());
|
|
return buffered_value.as_ref()
|
|
}
|
|
|
|
None
|
|
},
|
|
}
|
|
}
|
|
|
|
/// Insert some new `value` under the given `key`.
|
|
fn insert(&mut self, key: &[u8], value: CachedValue<H::Out>) {
|
|
match self {
|
|
Self::Fresh(map) => {
|
|
map.insert(key.into(), value);
|
|
},
|
|
Self::ForStorageRoot { local_value_cache, storage_root, .. } => {
|
|
local_value_cache.insert(ValueCacheRef::new(key, *storage_root), value);
|
|
},
|
|
}
|
|
}
|
|
}
|
|
|
|
/// The actual [`TrieCache`](trie_db::TrieCache) implementation.
|
|
///
|
|
/// If this instance was created for using it with a [`TrieDBMut`](trie_db::TrieDBMut), it needs to
|
|
/// be merged back into the [`LocalTrieCache`] with [`Self::merge_into`] after all operations are
|
|
/// done.
|
|
pub struct TrieCache<'a, H: Hasher> {
|
|
shared_cache: SharedTrieCache<H>,
|
|
local_cache: MutexGuard<'a, NodeCacheMap<H::Out>>,
|
|
value_cache: ValueCache<'a, H>,
|
|
stats: &'a TrieHitStats,
|
|
}
|
|
|
|
impl<'a, H: Hasher> TrieCache<'a, H> {
|
|
/// Merge this cache into the given [`LocalTrieCache`].
|
|
///
|
|
/// This function is only required to be called when this instance was created through
|
|
/// [`LocalTrieCache::as_trie_db_mut_cache`], otherwise this method is a no-op. The given
|
|
/// `storage_root` is the new storage root that was obtained after finishing all operations
|
|
/// using the [`TrieDBMut`](trie_db::TrieDBMut).
|
|
pub fn merge_into(self, local: &LocalTrieCache<H>, storage_root: H::Out) {
|
|
let cache = if let ValueCache::Fresh(cache) = self.value_cache { cache } else { return };
|
|
|
|
if !cache.is_empty() {
|
|
let mut value_cache = local.value_cache.lock();
|
|
let partial_hash = ValueCacheKey::hash_partial_data(&storage_root);
|
|
|
|
cache.into_iter().for_each(|(k, v)| {
|
|
let hash = ValueCacheKeyHash::from_hasher_and_storage_key(partial_hash.clone(), &k);
|
|
let k = ValueCacheRef { storage_root, storage_key: &k, hash };
|
|
value_cache.insert(k, v);
|
|
});
|
|
}
|
|
}
|
|
}
|
|
|
|
impl<'a, H: Hasher> trie_db::TrieCache<NodeCodec<H>> for TrieCache<'a, H> {
|
|
fn get_or_insert_node(
|
|
&mut self,
|
|
hash: H::Out,
|
|
fetch_node: &mut dyn FnMut() -> trie_db::Result<NodeOwned<H::Out>, H::Out, Error<H::Out>>,
|
|
) -> trie_db::Result<&NodeOwned<H::Out>, H::Out, Error<H::Out>> {
|
|
let mut is_local_cache_hit = true;
|
|
self.stats.node_cache.local_fetch_attempts.fetch_add(1, Ordering::Relaxed);
|
|
|
|
// First try to grab the node from the local cache.
|
|
let node = self.local_cache.get_or_insert_fallible(hash, || {
|
|
is_local_cache_hit = false;
|
|
|
|
// It was not in the local cache; try the shared cache.
|
|
self.stats.node_cache.shared_fetch_attempts.fetch_add(1, Ordering::Relaxed);
|
|
if let Some(node) = self.shared_cache.peek_node(&hash) {
|
|
self.stats.node_cache.shared_hits.fetch_add(1, Ordering::Relaxed);
|
|
tracing::trace!(target: LOG_TARGET, ?hash, "Serving node from shared cache");
|
|
|
|
return Ok(NodeCached::<H::Out> { node: node.clone(), is_from_shared_cache: true })
|
|
}
|
|
|
|
// It was not in the shared cache; try fetching it from the database.
|
|
match fetch_node() {
|
|
Ok(node) => {
|
|
tracing::trace!(target: LOG_TARGET, ?hash, "Serving node from database");
|
|
Ok(NodeCached::<H::Out> { node, is_from_shared_cache: false })
|
|
},
|
|
Err(error) => {
|
|
tracing::trace!(target: LOG_TARGET, ?hash, "Serving node from database failed");
|
|
Err(error)
|
|
},
|
|
}
|
|
});
|
|
|
|
if is_local_cache_hit {
|
|
tracing::trace!(target: LOG_TARGET, ?hash, "Serving node from local cache");
|
|
self.stats.node_cache.local_hits.fetch_add(1, Ordering::Relaxed);
|
|
}
|
|
|
|
Ok(&node?
|
|
.expect("you can always insert at least one element into the local cache; qed")
|
|
.node)
|
|
}
|
|
|
|
fn get_node(&mut self, hash: &H::Out) -> Option<&NodeOwned<H::Out>> {
|
|
let mut is_local_cache_hit = true;
|
|
self.stats.node_cache.local_fetch_attempts.fetch_add(1, Ordering::Relaxed);
|
|
|
|
// First try to grab the node from the local cache.
|
|
let cached_node = self.local_cache.get_or_insert_fallible(*hash, || {
|
|
is_local_cache_hit = false;
|
|
|
|
// It was not in the local cache; try the shared cache.
|
|
self.stats.node_cache.shared_fetch_attempts.fetch_add(1, Ordering::Relaxed);
|
|
if let Some(node) = self.shared_cache.peek_node(&hash) {
|
|
self.stats.node_cache.shared_hits.fetch_add(1, Ordering::Relaxed);
|
|
tracing::trace!(target: LOG_TARGET, ?hash, "Serving node from shared cache");
|
|
|
|
Ok(NodeCached::<H::Out> { node: node.clone(), is_from_shared_cache: true })
|
|
} else {
|
|
tracing::trace!(target: LOG_TARGET, ?hash, "Serving node from cache failed");
|
|
|
|
Err(())
|
|
}
|
|
});
|
|
|
|
if is_local_cache_hit {
|
|
tracing::trace!(target: LOG_TARGET, ?hash, "Serving node from local cache");
|
|
self.stats.node_cache.local_hits.fetch_add(1, Ordering::Relaxed);
|
|
}
|
|
|
|
match cached_node {
|
|
Ok(Some(cached_node)) => Some(&cached_node.node),
|
|
Ok(None) => {
|
|
unreachable!(
|
|
"you can always insert at least one element into the local cache; qed"
|
|
);
|
|
},
|
|
Err(()) => None,
|
|
}
|
|
}
|
|
|
|
fn lookup_value_for_key(&mut self, key: &[u8]) -> Option<&CachedValue<H::Out>> {
|
|
let res = self.value_cache.get(key, &self.shared_cache, &self.stats.value_cache);
|
|
|
|
tracing::trace!(
|
|
target: LOG_TARGET,
|
|
key = ?sp_core::hexdisplay::HexDisplay::from(&key),
|
|
found = res.is_some(),
|
|
"Looked up value for key",
|
|
);
|
|
|
|
res
|
|
}
|
|
|
|
fn cache_value_for_key(&mut self, key: &[u8], data: CachedValue<H::Out>) {
|
|
tracing::trace!(
|
|
target: LOG_TARGET,
|
|
key = ?sp_core::hexdisplay::HexDisplay::from(&key),
|
|
"Caching value for key",
|
|
);
|
|
|
|
self.value_cache.insert(key, data);
|
|
}
|
|
}
|
|
|
|
#[cfg(test)]
|
|
mod tests {
|
|
use super::*;
|
|
use trie_db::{Bytes, Trie, TrieDBBuilder, TrieDBMutBuilder, TrieHash, TrieMut};
|
|
|
|
type MemoryDB = crate::MemoryDB<sp_core::Blake2Hasher>;
|
|
type Layout = crate::LayoutV1<sp_core::Blake2Hasher>;
|
|
type Cache = super::SharedTrieCache<sp_core::Blake2Hasher>;
|
|
type Recorder = crate::recorder::Recorder<sp_core::Blake2Hasher>;
|
|
|
|
const TEST_DATA: &[(&[u8], &[u8])] =
|
|
&[(b"key1", b"val1"), (b"key2", &[2; 64]), (b"key3", b"val3"), (b"key4", &[4; 64])];
|
|
const CACHE_SIZE_RAW: usize = 1024 * 10;
|
|
const CACHE_SIZE: CacheSize = CacheSize::new(CACHE_SIZE_RAW);
|
|
|
|
fn create_trie() -> (MemoryDB, TrieHash<Layout>) {
|
|
let mut db = MemoryDB::default();
|
|
let mut root = Default::default();
|
|
|
|
{
|
|
let mut trie = TrieDBMutBuilder::<Layout>::new(&mut db, &mut root).build();
|
|
for (k, v) in TEST_DATA {
|
|
trie.insert(k, v).expect("Inserts data");
|
|
}
|
|
}
|
|
|
|
(db, root)
|
|
}
|
|
|
|
#[test]
|
|
fn basic_cache_works() {
|
|
let (db, root) = create_trie();
|
|
|
|
let shared_cache = Cache::new(CACHE_SIZE);
|
|
let local_cache = shared_cache.local_cache();
|
|
|
|
{
|
|
let mut cache = local_cache.as_trie_db_cache(root);
|
|
let trie = TrieDBBuilder::<Layout>::new(&db, &root).with_cache(&mut cache).build();
|
|
assert_eq!(TEST_DATA[0].1.to_vec(), trie.get(TEST_DATA[0].0).unwrap().unwrap());
|
|
}
|
|
|
|
// Local cache wasn't dropped yet, so there should nothing in the shared caches.
|
|
assert!(shared_cache.read_lock_inner().value_cache().lru.is_empty());
|
|
assert!(shared_cache.read_lock_inner().node_cache().lru.is_empty());
|
|
|
|
drop(local_cache);
|
|
|
|
// Now we should have the cached items in the shared cache.
|
|
assert!(shared_cache.read_lock_inner().node_cache().lru.len() >= 1);
|
|
let cached_data = shared_cache
|
|
.read_lock_inner()
|
|
.value_cache()
|
|
.lru
|
|
.peek(&ValueCacheKey::new_value(TEST_DATA[0].0, root))
|
|
.unwrap()
|
|
.clone();
|
|
assert_eq!(Bytes::from(TEST_DATA[0].1.to_vec()), cached_data.data().flatten().unwrap());
|
|
|
|
let fake_data = Bytes::from(&b"fake_data"[..]);
|
|
|
|
let local_cache = shared_cache.local_cache();
|
|
shared_cache.write_lock_inner().unwrap().value_cache_mut().lru.insert(
|
|
ValueCacheKey::new_value(TEST_DATA[1].0, root),
|
|
(fake_data.clone(), Default::default()).into(),
|
|
);
|
|
|
|
{
|
|
let mut cache = local_cache.as_trie_db_cache(root);
|
|
let trie = TrieDBBuilder::<Layout>::new(&db, &root).with_cache(&mut cache).build();
|
|
|
|
// We should now get the "fake_data", because we inserted this manually to the cache.
|
|
assert_eq!(b"fake_data".to_vec(), trie.get(TEST_DATA[1].0).unwrap().unwrap());
|
|
}
|
|
}
|
|
|
|
#[test]
|
|
fn trie_db_mut_cache_works() {
|
|
let (mut db, root) = create_trie();
|
|
|
|
let new_key = b"new_key".to_vec();
|
|
// Use some long value to not have it inlined
|
|
let new_value = vec![23; 64];
|
|
|
|
let shared_cache = Cache::new(CACHE_SIZE);
|
|
let mut new_root = root;
|
|
|
|
{
|
|
let local_cache = shared_cache.local_cache();
|
|
|
|
let mut cache = local_cache.as_trie_db_mut_cache();
|
|
|
|
{
|
|
let mut trie = TrieDBMutBuilder::<Layout>::from_existing(&mut db, &mut new_root)
|
|
.with_cache(&mut cache)
|
|
.build();
|
|
|
|
trie.insert(&new_key, &new_value).unwrap();
|
|
}
|
|
|
|
cache.merge_into(&local_cache, new_root);
|
|
}
|
|
|
|
// After the local cache is dropped, all changes should have been merged back to the shared
|
|
// cache.
|
|
let cached_data = shared_cache
|
|
.read_lock_inner()
|
|
.value_cache()
|
|
.lru
|
|
.peek(&ValueCacheKey::new_value(new_key, new_root))
|
|
.unwrap()
|
|
.clone();
|
|
assert_eq!(Bytes::from(new_value), cached_data.data().flatten().unwrap());
|
|
}
|
|
|
|
#[test]
|
|
fn trie_db_cache_and_recorder_work_together() {
|
|
let (db, root) = create_trie();
|
|
|
|
let shared_cache = Cache::new(CACHE_SIZE);
|
|
|
|
for i in 0..5 {
|
|
// Clear some of the caches.
|
|
if i == 2 {
|
|
shared_cache.reset_node_cache();
|
|
} else if i == 3 {
|
|
shared_cache.reset_value_cache();
|
|
}
|
|
|
|
let local_cache = shared_cache.local_cache();
|
|
let recorder = Recorder::default();
|
|
|
|
{
|
|
let mut cache = local_cache.as_trie_db_cache(root);
|
|
let mut recorder = recorder.as_trie_recorder(root);
|
|
let trie = TrieDBBuilder::<Layout>::new(&db, &root)
|
|
.with_cache(&mut cache)
|
|
.with_recorder(&mut recorder)
|
|
.build();
|
|
|
|
for (key, value) in TEST_DATA {
|
|
assert_eq!(*value, trie.get(&key).unwrap().unwrap());
|
|
}
|
|
}
|
|
|
|
let storage_proof = recorder.drain_storage_proof();
|
|
let memory_db: MemoryDB = storage_proof.into_memory_db();
|
|
|
|
{
|
|
let trie = TrieDBBuilder::<Layout>::new(&memory_db, &root).build();
|
|
|
|
for (key, value) in TEST_DATA {
|
|
assert_eq!(*value, trie.get(&key).unwrap().unwrap());
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
#[test]
|
|
fn trie_db_mut_cache_and_recorder_work_together() {
|
|
const DATA_TO_ADD: &[(&[u8], &[u8])] = &[(b"key11", &[45; 78]), (b"key33", &[78; 89])];
|
|
|
|
let (db, root) = create_trie();
|
|
|
|
let shared_cache = Cache::new(CACHE_SIZE);
|
|
|
|
// Run this twice so that we use the data cache in the second run.
|
|
for i in 0..5 {
|
|
// Clear some of the caches.
|
|
if i == 2 {
|
|
shared_cache.reset_node_cache();
|
|
} else if i == 3 {
|
|
shared_cache.reset_value_cache();
|
|
}
|
|
|
|
let recorder = Recorder::default();
|
|
let local_cache = shared_cache.local_cache();
|
|
let mut new_root = root;
|
|
|
|
{
|
|
let mut db = db.clone();
|
|
let mut cache = local_cache.as_trie_db_cache(root);
|
|
let mut recorder = recorder.as_trie_recorder(root);
|
|
let mut trie = TrieDBMutBuilder::<Layout>::from_existing(&mut db, &mut new_root)
|
|
.with_cache(&mut cache)
|
|
.with_recorder(&mut recorder)
|
|
.build();
|
|
|
|
for (key, value) in DATA_TO_ADD {
|
|
trie.insert(key, value).unwrap();
|
|
}
|
|
}
|
|
|
|
let storage_proof = recorder.drain_storage_proof();
|
|
let mut memory_db: MemoryDB = storage_proof.into_memory_db();
|
|
let mut proof_root = root;
|
|
|
|
{
|
|
let mut trie =
|
|
TrieDBMutBuilder::<Layout>::from_existing(&mut memory_db, &mut proof_root)
|
|
.build();
|
|
|
|
for (key, value) in DATA_TO_ADD {
|
|
trie.insert(key, value).unwrap();
|
|
}
|
|
}
|
|
|
|
assert_eq!(new_root, proof_root)
|
|
}
|
|
}
|
|
|
|
#[test]
|
|
fn cache_lru_works() {
|
|
let (db, root) = create_trie();
|
|
|
|
let shared_cache = Cache::new(CACHE_SIZE);
|
|
|
|
{
|
|
let local_cache = shared_cache.local_cache();
|
|
|
|
let mut cache = local_cache.as_trie_db_cache(root);
|
|
let trie = TrieDBBuilder::<Layout>::new(&db, &root).with_cache(&mut cache).build();
|
|
|
|
for (k, _) in TEST_DATA {
|
|
trie.get(k).unwrap().unwrap();
|
|
}
|
|
}
|
|
|
|
// Check that all items are there.
|
|
assert!(shared_cache
|
|
.read_lock_inner()
|
|
.value_cache()
|
|
.lru
|
|
.iter()
|
|
.map(|d| d.0)
|
|
.all(|l| TEST_DATA.iter().any(|d| &*l.storage_key == d.0)));
|
|
|
|
// Run this in a loop. The first time we check that with the filled value cache,
|
|
// the expected values are at the top of the LRU.
|
|
// The second run is using an empty value cache to ensure that we access the nodes.
|
|
for _ in 0..2 {
|
|
{
|
|
let local_cache = shared_cache.local_cache();
|
|
|
|
let mut cache = local_cache.as_trie_db_cache(root);
|
|
let trie = TrieDBBuilder::<Layout>::new(&db, &root).with_cache(&mut cache).build();
|
|
|
|
for (k, _) in TEST_DATA.iter().take(2) {
|
|
trie.get(k).unwrap().unwrap();
|
|
}
|
|
}
|
|
|
|
// Ensure that the accessed items are most recently used items of the shared value
|
|
// cache.
|
|
assert!(shared_cache
|
|
.read_lock_inner()
|
|
.value_cache()
|
|
.lru
|
|
.iter()
|
|
.take(2)
|
|
.map(|d| d.0)
|
|
.all(|l| { TEST_DATA.iter().take(2).any(|d| &*l.storage_key == d.0) }));
|
|
|
|
// Delete the value cache, so that we access the nodes.
|
|
shared_cache.reset_value_cache();
|
|
}
|
|
|
|
let most_recently_used_nodes = shared_cache
|
|
.read_lock_inner()
|
|
.node_cache()
|
|
.lru
|
|
.iter()
|
|
.map(|d| *d.0)
|
|
.collect::<Vec<_>>();
|
|
|
|
{
|
|
let local_cache = shared_cache.local_cache();
|
|
|
|
let mut cache = local_cache.as_trie_db_cache(root);
|
|
let trie = TrieDBBuilder::<Layout>::new(&db, &root).with_cache(&mut cache).build();
|
|
|
|
for (k, _) in TEST_DATA.iter().skip(2) {
|
|
trie.get(k).unwrap().unwrap();
|
|
}
|
|
}
|
|
|
|
// Ensure that the most recently used nodes changed as well.
|
|
assert_ne!(
|
|
most_recently_used_nodes,
|
|
shared_cache
|
|
.read_lock_inner()
|
|
.node_cache()
|
|
.lru
|
|
.iter()
|
|
.map(|d| *d.0)
|
|
.collect::<Vec<_>>()
|
|
);
|
|
}
|
|
|
|
#[test]
|
|
fn cache_respects_bounds() {
|
|
let (mut db, root) = create_trie();
|
|
|
|
let shared_cache = Cache::new(CACHE_SIZE);
|
|
{
|
|
let local_cache = shared_cache.local_cache();
|
|
|
|
let mut new_root = root;
|
|
|
|
{
|
|
let mut cache = local_cache.as_trie_db_cache(root);
|
|
{
|
|
let mut trie =
|
|
TrieDBMutBuilder::<Layout>::from_existing(&mut db, &mut new_root)
|
|
.with_cache(&mut cache)
|
|
.build();
|
|
|
|
let value = vec![10u8; 100];
|
|
// Ensure we add enough data that would overflow the cache.
|
|
for i in 0..CACHE_SIZE_RAW / 100 * 2 {
|
|
trie.insert(format!("key{}", i).as_bytes(), &value).unwrap();
|
|
}
|
|
}
|
|
|
|
cache.merge_into(&local_cache, new_root);
|
|
}
|
|
}
|
|
|
|
assert!(shared_cache.used_memory_size() < CACHE_SIZE_RAW);
|
|
}
|
|
}
|