mirror of
https://github.com/hl-archive-node/nanoreth.git
synced 2025-12-06 10:59:55 +00:00
perf(stages): Adds benchmark to TransactionLookupStage (#1130)
Co-authored-by: Georgios Konstantopoulos <me@gakonst.com> Co-authored-by: Bjerg <onbjerg@users.noreply.github.com>
This commit is contained in:
@ -175,6 +175,7 @@ impl Command {
|
||||
BlockTransitionIndex,
|
||||
TxTransitionIndex,
|
||||
SyncStage,
|
||||
TxHashNumber,
|
||||
Transactions
|
||||
]);
|
||||
}
|
||||
|
||||
@ -23,7 +23,10 @@ impl Deref for Block {
|
||||
}
|
||||
|
||||
/// Sealed Ethereum full block.
|
||||
#[derive(Debug, Clone, PartialEq, Eq, Default, RlpEncodable, RlpDecodable)]
|
||||
#[derive_arbitrary(rlp, 10)]
|
||||
#[derive(
|
||||
Debug, Clone, PartialEq, Eq, Default, RlpEncodable, RlpDecodable, Serialize, Deserialize,
|
||||
)]
|
||||
pub struct SealedBlock {
|
||||
/// Locked block header.
|
||||
pub header: SealedHeader,
|
||||
|
||||
@ -5,7 +5,7 @@ use crate::{
|
||||
};
|
||||
use bytes::{BufMut, BytesMut};
|
||||
use ethers_core::types::{Block, H256 as EthersH256, H64};
|
||||
use reth_codecs::{derive_arbitrary, main_codec, Compact};
|
||||
use reth_codecs::{add_arbitrary_tests, derive_arbitrary, main_codec, Compact};
|
||||
use reth_rlp::{length_of_length, Decodable, Encodable};
|
||||
use serde::{Deserialize, Serialize};
|
||||
use std::ops::Deref;
|
||||
@ -229,7 +229,8 @@ impl Decodable for Header {
|
||||
|
||||
/// A [`Header`] that is sealed at a precalculated hash, use [`SealedHeader::unseal()`] if you want
|
||||
/// to modify header.
|
||||
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
|
||||
#[add_arbitrary_tests(rlp)]
|
||||
#[derive(Debug, Clone, PartialEq, Eq, Hash, Serialize, Deserialize)]
|
||||
pub struct SealedHeader {
|
||||
/// Locked Header fields.
|
||||
header: Header,
|
||||
@ -237,6 +238,32 @@ pub struct SealedHeader {
|
||||
hash: BlockHash,
|
||||
}
|
||||
|
||||
#[cfg(any(test, feature = "arbitrary"))]
impl proptest::arbitrary::Arbitrary for SealedHeader {
    type Parameters = ();
    type Strategy = proptest::strategy::BoxedStrategy<SealedHeader>;

    /// Builds a strategy yielding arbitrary headers sealed with the hash computed from the
    /// generated header itself, so `hash` always agrees with `header`.
    fn arbitrary_with(_: Self::Parameters) -> Self::Strategy {
        use proptest::prelude::{any, Strategy};

        // Only the header needs to be generated: the hash is derived from it below, so drawing
        // an additional arbitrary `BlockHash` just to throw it away is wasted work.
        any::<Header>()
            .prop_map(|header| {
                let hash = header.hash_slow();
                SealedHeader { header, hash }
            })
            .boxed()
    }
}
|
||||
|
||||
#[cfg(any(test, feature = "arbitrary"))]
impl<'a> arbitrary::Arbitrary<'a> for SealedHeader {
    /// Draws an arbitrary [`Header`] from `u` and seals it with the hash computed from that
    /// header. Any error produced while generating the header is returned unchanged.
    fn arbitrary(u: &mut arbitrary::Unstructured<'a>) -> arbitrary::Result<Self> {
        Header::arbitrary(u).map(|header| {
            let hash = header.hash_slow();
            SealedHeader { header, hash }
        })
    }
}
|
||||
|
||||
impl From<Block<EthersH256>> for SealedHeader {
|
||||
fn from(block: Block<EthersH256>) -> Self {
|
||||
let header = Header {
|
||||
|
||||
@ -16,8 +16,7 @@ criterion_main!(benches);
|
||||
|
||||
fn senders(c: &mut Criterion) {
|
||||
let mut group = c.benchmark_group("Stages");
|
||||
group.measurement_time(std::time::Duration::from_millis(2000));
|
||||
group.warm_up_time(std::time::Duration::from_millis(2000));
|
||||
|
||||
// don't need to run each stage for that many times
|
||||
group.sample_size(10);
|
||||
|
||||
@ -33,8 +32,7 @@ fn senders(c: &mut Criterion) {
|
||||
|
||||
fn tx_lookup(c: &mut Criterion) {
|
||||
let mut group = c.benchmark_group("Stages");
|
||||
group.measurement_time(std::time::Duration::from_millis(2000));
|
||||
group.warm_up_time(std::time::Duration::from_millis(2000));
|
||||
|
||||
// don't need to run each stage for that many times
|
||||
group.sample_size(10);
|
||||
|
||||
|
||||
@ -66,14 +66,37 @@ impl<DB: Database> Stage<DB> for TransactionLookupStage {
|
||||
.unwrap_or_default()
|
||||
});
|
||||
|
||||
// Collect tranasctions for each body and insert the reverse lookup for hash -> tx_id.
|
||||
// Collect transactions for each body
|
||||
let mut tx_list = vec![];
|
||||
for body_entry in bodies {
|
||||
let (_, body) = body_entry?;
|
||||
let transactions = tx_cursor.walk(body.start_tx_id)?.take(body.tx_count as usize);
|
||||
|
||||
for tx_entry in transactions {
|
||||
let (id, transaction) = tx_entry?;
|
||||
tx.put::<tables::TxHashNumber>(transaction.hash(), id)?;
|
||||
tx_list.push((transaction.hash(), id));
|
||||
}
|
||||
}
|
||||
|
||||
// Sort before inserting the reverse lookup for hash -> tx_id.
|
||||
tx_list.sort_by(|txa, txb| txa.0.cmp(&txb.0));
|
||||
|
||||
let mut txhash_cursor = tx.cursor_write::<tables::TxHashNumber>()?;
|
||||
|
||||
// If the last inserted element in the database is smaller than the first in our set, then
|
||||
// we can just append into the DB. This probably only ever happens during sync, on
|
||||
// the first table insertion.
|
||||
let append = tx_list
|
||||
.first()
|
||||
.zip(txhash_cursor.last()?)
|
||||
.map(|((first, _), (last, _))| &last < first)
|
||||
.unwrap_or_default();
|
||||
|
||||
for (tx_hash, id) in tx_list {
|
||||
if append {
|
||||
txhash_cursor.append(tx_hash, id)?;
|
||||
} else {
|
||||
txhash_cursor.insert(tx_hash, id)?;
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
@ -85,6 +85,10 @@ arbitrary = [
|
||||
"dep:proptest-derive",
|
||||
]
|
||||
|
||||
[[bench]]
|
||||
name = "hash_keys"
|
||||
harness = false
|
||||
|
||||
[[bench]]
|
||||
name = "criterion"
|
||||
harness = false
|
||||
|
||||
259
crates/storage/db/benches/hash_keys.rs
Normal file
259
crates/storage/db/benches/hash_keys.rs
Normal file
@ -0,0 +1,259 @@
|
||||
#![allow(dead_code, unused_imports, non_snake_case)]
|
||||
|
||||
use criterion::{
|
||||
black_box, criterion_group, criterion_main, measurement::WallTime, BenchmarkGroup, Criterion,
|
||||
};
|
||||
use proptest::{
|
||||
arbitrary::Arbitrary,
|
||||
prelude::{any_with, ProptestConfig},
|
||||
strategy::{Strategy, ValueTree},
|
||||
test_runner::TestRunner,
|
||||
};
|
||||
use reth_db::{
|
||||
cursor::{DbDupCursorRO, DbDupCursorRW},
|
||||
mdbx::Env,
|
||||
};
|
||||
use std::{collections::HashSet, time::Instant};
|
||||
use test_fuzz::runtime::num_traits::Zero;
|
||||
|
||||
criterion_group!(benches, hash_keys);
|
||||
criterion_main!(benches);
|
||||
|
||||
/// It benchmarks the insertion of rows into a table where `Keys` are hashes.
|
||||
/// * `append`: Table is empty. Sorts during benchmark.
|
||||
/// * `insert_sorted`: Table is preloaded with rows (same as batch size). Sorts during benchmark.
|
||||
/// * `insert_unsorted`: Table is preloaded with rows (same as batch size).
|
||||
/// * `put_sorted`: Table is preloaded with rows (same as batch size). Sorts during benchmark.
|
||||
/// * `put_unsorted`: Table is preloaded with rows (same as batch size).
|
||||
///
|
||||
/// It does the above steps with different batches of rows. 10_000, 100_000, 1_000_000. In the
|
||||
/// end, the table statistics are shown (eg. number of pages, table size...)
|
||||
pub fn hash_keys(c: &mut Criterion) {
|
||||
let mut group = c.benchmark_group("Hash-Keys Table Insertion");
|
||||
|
||||
group.sample_size(10);
|
||||
|
||||
for size in vec![10_000, 100_000, 1_000_000] {
|
||||
measure_table_insertion::<TxHashNumber>(&mut group, size);
|
||||
}
|
||||
}
|
||||
|
||||
fn measure_table_insertion<T>(group: &mut BenchmarkGroup<WallTime>, size: usize)
|
||||
where
|
||||
T: Table + Default,
|
||||
T::Key: Default
|
||||
+ Clone
|
||||
+ for<'de> serde::Deserialize<'de>
|
||||
+ Arbitrary
|
||||
+ serde::Serialize
|
||||
+ Ord
|
||||
+ std::hash::Hash,
|
||||
T::Value: Default + Clone + for<'de> serde::Deserialize<'de> + Arbitrary + serde::Serialize,
|
||||
{
|
||||
let bench_db_path = Path::new(BENCH_DB_PATH);
|
||||
|
||||
let scenarios: Vec<(fn(_, _) -> _, &str)> = vec![
|
||||
(append::<T>, "append_all"),
|
||||
(append::<T>, "append_input"),
|
||||
(insert::<T>, "insert_unsorted"),
|
||||
(insert::<T>, "insert_sorted"),
|
||||
(put::<T>, "put_unsorted"),
|
||||
(put::<T>, "put_sorted"),
|
||||
];
|
||||
|
||||
// `preload` is to be inserted into the database during the setup phase in all scenarios but
|
||||
// `append`.
|
||||
let (preload, unsorted_input) = generate_batches::<T>(size);
|
||||
|
||||
for (scenario, scenario_str) in scenarios {
|
||||
// Append does not preload the table
|
||||
let mut preload_size = size;
|
||||
let mut input_size = size;
|
||||
if scenario_str.contains("append") {
|
||||
if scenario_str == "append_all" {
|
||||
input_size = size * 2;
|
||||
}
|
||||
preload_size = 0;
|
||||
}
|
||||
|
||||
// Setup phase before each benchmark iteration
|
||||
let setup = || {
|
||||
// Reset DB
|
||||
let _ = std::fs::remove_dir_all(bench_db_path);
|
||||
let db = create_test_db_with_path::<WriteMap>(EnvKind::RW, bench_db_path);
|
||||
|
||||
let mut unsorted_input = unsorted_input.clone();
|
||||
if scenario_str == "append_all" {
|
||||
unsorted_input.extend_from_slice(&preload);
|
||||
}
|
||||
|
||||
if preload_size > 0 {
|
||||
db.update(|tx| {
|
||||
for (key, value) in &preload {
|
||||
let _ = tx.put::<T>(key.clone(), value.clone());
|
||||
}
|
||||
})
|
||||
.unwrap();
|
||||
}
|
||||
|
||||
(unsorted_input, db)
|
||||
};
|
||||
|
||||
// Iteration to be benchmarked
|
||||
let execution = |(input, db)| {
|
||||
let mut input: Vec<(T::Key, T::Value)> = input;
|
||||
if scenario_str.contains("_sorted") || scenario_str.contains("append") {
|
||||
input.sort_by(|a, b| a.0.cmp(&b.0));
|
||||
}
|
||||
scenario(db, input)
|
||||
};
|
||||
|
||||
group.bench_function(
|
||||
format!(
|
||||
"{} | {scenario_str} | preload: {} | writing: {} ",
|
||||
T::NAME,
|
||||
preload_size,
|
||||
input_size
|
||||
),
|
||||
|b| {
|
||||
b.iter_with_setup(setup, execution);
|
||||
},
|
||||
);
|
||||
|
||||
// Execute once more to show table stats (doesn't count for benchmarking speed)
|
||||
let db = execution(setup());
|
||||
get_table_stats::<T>(db);
|
||||
}
|
||||
}
|
||||
|
||||
/// Generates two batches. The first is to be inserted into the database before running the
|
||||
/// benchmark. The second is to be benchmarked with.
|
||||
fn generate_batches<T>(size: usize) -> (Vec<(T::Key, T::Value)>, Vec<(T::Key, T::Value)>)
|
||||
where
|
||||
T: Table + Default,
|
||||
T::Key: std::hash::Hash + Arbitrary,
|
||||
T::Value: Arbitrary,
|
||||
{
|
||||
let strat = proptest::collection::vec(
|
||||
any_with::<(T::Key, T::Value)>((
|
||||
<T::Key as Arbitrary>::Parameters::default(),
|
||||
<T::Value as Arbitrary>::Parameters::default(),
|
||||
)),
|
||||
size,
|
||||
)
|
||||
.no_shrink()
|
||||
.boxed();
|
||||
|
||||
let mut runner = TestRunner::new(ProptestConfig::default());
|
||||
let mut preload = strat.new_tree(&mut runner).unwrap().current();
|
||||
let mut input = strat.new_tree(&mut runner).unwrap().current();
|
||||
|
||||
let mut unique_keys = HashSet::new();
|
||||
preload.retain(|(k, _)| unique_keys.insert(k.clone()));
|
||||
input.retain(|(k, _)| unique_keys.insert(k.clone()));
|
||||
|
||||
(preload, input)
|
||||
}
|
||||
|
||||
fn append<T>(
|
||||
db: Env<WriteMap>,
|
||||
input: Vec<(<T as Table>::Key, <T as Table>::Value)>,
|
||||
) -> Env<WriteMap>
|
||||
where
|
||||
T: Table + Default,
|
||||
{
|
||||
{
|
||||
let tx = db.tx_mut().expect("tx");
|
||||
let mut crsr = tx.cursor_write::<T>().expect("cursor");
|
||||
black_box({
|
||||
for (k, v) in input {
|
||||
crsr.append(k, v).expect("submit");
|
||||
}
|
||||
|
||||
tx.inner.commit().unwrap();
|
||||
});
|
||||
}
|
||||
db
|
||||
}
|
||||
|
||||
fn insert<T>(
|
||||
db: Env<WriteMap>,
|
||||
input: Vec<(<T as Table>::Key, <T as Table>::Value)>,
|
||||
) -> Env<WriteMap>
|
||||
where
|
||||
T: Table + Default,
|
||||
{
|
||||
{
|
||||
let tx = db.tx_mut().expect("tx");
|
||||
let mut crsr = tx.cursor_write::<T>().expect("cursor");
|
||||
black_box({
|
||||
for (k, v) in input {
|
||||
crsr.insert(k, v).expect("submit");
|
||||
}
|
||||
|
||||
tx.inner.commit().unwrap();
|
||||
});
|
||||
}
|
||||
db
|
||||
}
|
||||
|
||||
fn put<T>(db: Env<WriteMap>, input: Vec<(<T as Table>::Key, <T as Table>::Value)>) -> Env<WriteMap>
|
||||
where
|
||||
T: Table + Default,
|
||||
{
|
||||
{
|
||||
let tx = db.tx_mut().expect("tx");
|
||||
black_box({
|
||||
for (k, v) in input {
|
||||
tx.put::<T>(k, v).expect("submit");
|
||||
}
|
||||
|
||||
tx.inner.commit().unwrap();
|
||||
});
|
||||
}
|
||||
db
|
||||
}
|
||||
|
||||
/// Page statistics of a single table, printed through its `Debug` representation.
#[derive(Debug)]
struct TableStats {
    /// Page size reported for the table.
    page_size: usize,
    /// Number of leaf pages.
    leaf_pages: usize,
    /// Number of branch pages.
    branch_pages: usize,
    /// Number of overflow pages.
    overflow_pages: usize,
    /// Sum of leaf, branch and overflow pages.
    num_pages: usize,
    /// `num_pages` multiplied by `page_size`.
    size: usize,
}
|
||||
|
||||
fn get_table_stats<T>(db: Env<WriteMap>)
|
||||
where
|
||||
T: Table + Default,
|
||||
{
|
||||
db.view(|tx| {
|
||||
let table_db = tx.inner.open_db(Some(T::NAME)).map_err(|_| "Could not open db.").unwrap();
|
||||
|
||||
println!(
|
||||
"{:?}\n",
|
||||
tx.inner
|
||||
.db_stat(&table_db)
|
||||
.map_err(|_| format!("Could not find table: {}", T::NAME))
|
||||
.map(|stats| {
|
||||
let num_pages =
|
||||
stats.leaf_pages() + stats.branch_pages() + stats.overflow_pages();
|
||||
let size = num_pages * stats.page_size() as usize;
|
||||
|
||||
TableStats {
|
||||
page_size: stats.page_size() as usize,
|
||||
leaf_pages: stats.leaf_pages(),
|
||||
branch_pages: stats.branch_pages(),
|
||||
overflow_pages: stats.overflow_pages(),
|
||||
num_pages,
|
||||
size,
|
||||
}
|
||||
})
|
||||
.unwrap()
|
||||
);
|
||||
})
|
||||
.unwrap();
|
||||
}
|
||||
|
||||
include!("./utils.rs");
|
||||
Reference in New Issue
Block a user