mirror of
https://github.com/pezkuwichain/pezkuwi-subxt.git
synced 2026-05-07 18:58:01 +00:00
9980d314b1
* Follow ups for the MachineCmd Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Fix CI Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Review fixes Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Add to node-template Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Fix test with feature flag Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Review fixes Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Lower disk requirements Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Add ExecutionLimit to the disk benchmarks Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * fmt Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Add doc Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Review fixes Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Rename DISK_WRITE_LIMIT -> DEFAULT_DISK_EXECUTION_LIMIT Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Rename POLKADOT_REFERENCE_HARDWARE -> SUBSTRATE_REFERENCE_HARDWARE Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Fix build profile + add license Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Remove deps Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Set tolerance to 10% Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Fix tests Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Ignore test I cannot reproduce the CI error, even with the full command: cargo test --workspace --locked --release --verbose --features runtime-benchmarks --manifest-path ./bin/node/cli/Cargo.toml I will put an 'ignore' on that test for now, since it works for me and is worth having. Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> * Remove test Still cannot reproduce the error and it fails in the CI. Removing it now. 
Signed-off-by: Oliver Tale-Yazdi <oliver.tale-yazdi@parity.io> Co-authored-by: Shawn Tabrizi <shawntabrizi@gmail.com>
479 lines
13 KiB
Rust
479 lines
13 KiB
Rust
// This file is part of Substrate.
|
|
|
|
// Copyright (C) 2022 Parity Technologies (UK) Ltd.
|
|
// SPDX-License-Identifier: GPL-3.0-or-later WITH Classpath-exception-2.0
|
|
|
|
// This program is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU General Public License as published by
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
// (at your option) any later version.
|
|
|
|
// This program is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU General Public License for more details.
|
|
|
|
// You should have received a copy of the GNU General Public License
|
|
// along with this program. If not, see <https://www.gnu.org/licenses/>.
|
|
|
|
use crate::{ExecutionLimit, HwBench};
|
|
|
|
use sc_telemetry::SysInfo;
|
|
use sp_core::{sr25519, Pair};
|
|
use sp_io::crypto::sr25519_verify;
|
|
use sp_std::prelude::*;
|
|
|
|
use rand::{seq::SliceRandom, Rng, RngCore};
|
|
use std::{
|
|
fs::File,
|
|
io::{Seek, SeekFrom, Write},
|
|
ops::{Deref, DerefMut},
|
|
path::{Path, PathBuf},
|
|
time::{Duration, Instant},
|
|
};
|
|
|
|
#[inline(always)]
|
|
pub(crate) fn benchmark<E>(
|
|
name: &str,
|
|
size: usize,
|
|
max_iterations: usize,
|
|
max_duration: Duration,
|
|
mut run: impl FnMut() -> Result<(), E>,
|
|
) -> Result<f64, E> {
|
|
// Run the benchmark once as a warmup to get the code into the L1 cache.
|
|
run()?;
|
|
|
|
// Then run it multiple times and average the result.
|
|
let timestamp = Instant::now();
|
|
let mut elapsed = Duration::default();
|
|
let mut count = 0;
|
|
for _ in 0..max_iterations {
|
|
run()?;
|
|
|
|
count += 1;
|
|
elapsed = timestamp.elapsed();
|
|
|
|
if elapsed >= max_duration {
|
|
break
|
|
}
|
|
}
|
|
|
|
let score = ((size * count) as f64 / elapsed.as_secs_f64()) / (1024.0 * 1024.0);
|
|
log::trace!(
|
|
"Calculated {} of {}MB/s in {} iterations in {}ms",
|
|
name,
|
|
score as u64,
|
|
count,
|
|
elapsed.as_millis()
|
|
);
|
|
Ok(score)
|
|
}
|
|
|
|
/// Gathers information about node's hardware and software.
|
|
pub fn gather_sysinfo() -> SysInfo {
|
|
#[allow(unused_mut)]
|
|
let mut sysinfo = SysInfo {
|
|
cpu: None,
|
|
memory: None,
|
|
core_count: None,
|
|
linux_kernel: None,
|
|
linux_distro: None,
|
|
is_virtual_machine: None,
|
|
};
|
|
|
|
#[cfg(target_os = "linux")]
|
|
crate::sysinfo_linux::gather_linux_sysinfo(&mut sysinfo);
|
|
|
|
sysinfo
|
|
}
|
|
|
|
/// Makes the contents of `slice` opaque to the optimizer without changing them.
///
/// The first element is read and written back through volatile accesses. Since
/// volatile reads and writes are guaranteed to be neither elided nor reordered,
/// this discourages the compiler from optimizing away benchmark code whose
/// results are otherwise unused. Not bulletproof in theory, but should work in
/// practice.
///
/// # Panics
///
/// Panics if `slice` is empty.
#[inline(never)]
fn clobber_slice<T>(slice: &mut [T]) {
    assert!(!slice.is_empty());

    let first: *mut T = slice.as_mut_ptr();

    // SAFETY: The slice was just checked to be non-empty, so `first` points at a
    // valid, properly aligned element that we hold exclusively. The value read
    // out is written straight back, so the element is never duplicated or dropped.
    unsafe {
        let element = first.read_volatile();
        first.write_volatile(element);
    }
}
|
|
|
|
/// Makes `input` opaque to the optimizer without changing it.
///
/// The value is read and written back through volatile accesses, which the
/// compiler may neither elide nor reorder, so the computation that produced
/// `input` cannot be optimized away.
#[inline(never)]
fn clobber_value<T>(input: &mut T) {
    let target: *mut T = input;

    // SAFETY: `target` comes from an exclusive reference, so it is valid and
    // properly aligned. The value read out is written straight back, so it is
    // never duplicated or dropped.
    unsafe {
        let current = target.read_volatile();
        target.write_volatile(current);
    }
}
|
|
|
|
// This benchmarks the CPU speed as measured by calculating BLAKE2b-256 hashes, in MB/s.
|
|
pub fn benchmark_cpu() -> u64 {
|
|
// In general the results of this benchmark are somewhat sensitive to how much
|
|
// data we hash at the time. The smaller this is the *less* MB/s we can hash,
|
|
// the bigger this is the *more* MB/s we can hash, up until a certain point
|
|
// where we can achieve roughly ~100% of what the hasher can do. If we'd plot
|
|
// this on a graph with the number of bytes we want to hash on the X axis
|
|
// and the speed in MB/s on the Y axis then we'd essentially see it grow
|
|
// logarithmically.
|
|
//
|
|
// In practice however we might not always have enough data to hit the maximum
|
|
// possible speed that the hasher can achieve, so the size set here should be
|
|
// picked in such a way as to still measure how fast the hasher is at hashing,
|
|
// but without hitting its theoretical maximum speed.
|
|
const SIZE: usize = 32 * 1024;
|
|
const MAX_ITERATIONS: usize = 4 * 1024;
|
|
const MAX_DURATION: Duration = Duration::from_millis(100);
|
|
|
|
let mut buffer = Vec::new();
|
|
buffer.resize(SIZE, 0x66);
|
|
let mut hash = Default::default();
|
|
|
|
let run = || -> Result<(), ()> {
|
|
clobber_slice(&mut buffer);
|
|
hash = sp_core::hashing::blake2_256(&buffer);
|
|
clobber_slice(&mut hash);
|
|
|
|
Ok(())
|
|
};
|
|
|
|
benchmark("CPU score", SIZE, MAX_ITERATIONS, MAX_DURATION, run)
|
|
.expect("benchmark cannot fail; qed") as u64
|
|
}
|
|
|
|
// This benchmarks the effective `memcpy` memory bandwidth available in MB/s.
|
|
//
|
|
// It doesn't technically measure the absolute maximum memory bandwidth available,
|
|
// but that's fine, because real code most of the time isn't optimized to take
|
|
// advantage of the full memory bandwidth either.
|
|
pub fn benchmark_memory() -> u64 {
|
|
// Ideally this should be at least as big as the CPU's L3 cache,
|
|
// and it should be big enough so that the `memcpy` takes enough
|
|
// time to be actually measurable.
|
|
//
|
|
// As long as it's big enough increasing it further won't change
|
|
// the benchmark's results.
|
|
const SIZE: usize = 64 * 1024 * 1024;
|
|
const MAX_ITERATIONS: usize = 32;
|
|
const MAX_DURATION: Duration = Duration::from_millis(100);
|
|
|
|
let mut src = Vec::new();
|
|
let mut dst = Vec::new();
|
|
|
|
// Prefault the pages; we want to measure the memory bandwidth,
|
|
// not how fast the kernel can supply us with fresh memory pages.
|
|
src.resize(SIZE, 0x66);
|
|
dst.resize(SIZE, 0x77);
|
|
|
|
let run = || -> Result<(), ()> {
|
|
clobber_slice(&mut src);
|
|
clobber_slice(&mut dst);
|
|
|
|
// SAFETY: Both vectors are of the same type and of the same size,
|
|
// so copying data between them is safe.
|
|
unsafe {
|
|
// We use `memcpy` directly here since `copy_from_slice` isn't actually
|
|
// guaranteed to be turned into a `memcpy`.
|
|
libc::memcpy(dst.as_mut_ptr().cast(), src.as_ptr().cast(), SIZE);
|
|
}
|
|
|
|
clobber_slice(&mut dst);
|
|
clobber_slice(&mut src);
|
|
|
|
Ok(())
|
|
};
|
|
|
|
benchmark("memory score", SIZE, MAX_ITERATIONS, MAX_DURATION, run)
|
|
.expect("benchmark cannot fail; qed") as u64
|
|
}
|
|
|
|
/// A scratch file for the disk benchmarks, bundled with the path it lives at.
struct TemporaryFile {
    /// The open file handle; wrapped in an `Option` so it can be taken out and
    /// closed ahead of the rest of the struct.
    fp: Option<File>,
    /// Location of the file on disk.
    path: PathBuf,
}
|
|
|
|
impl Drop for TemporaryFile {
|
|
fn drop(&mut self) {
|
|
let _ = self.fp.take();
|
|
|
|
// Remove the file.
|
|
//
|
|
// This has to be done *after* the benchmark,
|
|
// otherwise it changes the results as the data
|
|
// doesn't actually get properly flushed to the disk,
|
|
// since the file's not there anymore.
|
|
if let Err(error) = std::fs::remove_file(&self.path) {
|
|
log::warn!("Failed to remove the file used for the disk benchmark: {}", error);
|
|
}
|
|
}
|
|
}
|
|
|
|
impl Deref for TemporaryFile {
|
|
type Target = File;
|
|
fn deref(&self) -> &Self::Target {
|
|
self.fp.as_ref().expect("`fp` is None only during `drop`")
|
|
}
|
|
}
|
|
|
|
impl DerefMut for TemporaryFile {
|
|
fn deref_mut(&mut self) -> &mut Self::Target {
|
|
self.fp.as_mut().expect("`fp` is None only during `drop`")
|
|
}
|
|
}
|
|
|
|
/// Creates a PCG-64 generator from fixed parameters, so every call yields a
/// generator that produces the same sequence.
fn rng() -> rand_pcg::Pcg64 {
    const STATE: u128 = 0xcafef00dd15ea5e5;
    const STREAM: u128 = 0xa02bdbf7bb3c0a7ac28fa16a64abf96;

    rand_pcg::Pcg64::new(STATE, STREAM)
}
|
|
|
|
fn random_data(size: usize) -> Vec<u8> {
|
|
let mut buffer = Vec::new();
|
|
buffer.resize(size, 0);
|
|
rng().fill(&mut buffer[..]);
|
|
buffer
|
|
}
|
|
|
|
/// A default [`ExecutionLimit`] that can be used to call [`benchmark_disk_sequential_writes`]
|
|
/// and [`benchmark_disk_random_writes`].
|
|
pub const DEFAULT_DISK_EXECUTION_LIMIT: ExecutionLimit =
|
|
ExecutionLimit::Both { max_iterations: 32, max_duration: Duration::from_millis(300) };
|
|
|
|
pub fn benchmark_disk_sequential_writes(
|
|
limit: ExecutionLimit,
|
|
directory: &Path,
|
|
) -> Result<u64, String> {
|
|
const SIZE: usize = 64 * 1024 * 1024;
|
|
|
|
let buffer = random_data(SIZE);
|
|
let path = directory.join(".disk_bench_seq_wr.tmp");
|
|
|
|
let fp =
|
|
File::create(&path).map_err(|error| format!("failed to create a test file: {}", error))?;
|
|
|
|
let mut fp = TemporaryFile { fp: Some(fp), path };
|
|
|
|
fp.sync_all()
|
|
.map_err(|error| format!("failed to fsync the test file: {}", error))?;
|
|
|
|
let run = || {
|
|
// Just dump everything to the disk in one go.
|
|
fp.write_all(&buffer)
|
|
.map_err(|error| format!("failed to write to the test file: {}", error))?;
|
|
|
|
// And then make sure it was actually written to disk.
|
|
fp.sync_all()
|
|
.map_err(|error| format!("failed to fsync the test file: {}", error))?;
|
|
|
|
// Rewind to the beginning for the next iteration of the benchmark.
|
|
fp.seek(SeekFrom::Start(0))
|
|
.map_err(|error| format!("failed to seek to the start of the test file: {}", error))?;
|
|
|
|
Ok(())
|
|
};
|
|
|
|
benchmark(
|
|
"disk sequential write score",
|
|
SIZE,
|
|
limit.max_iterations(),
|
|
limit.max_duration(),
|
|
run,
|
|
)
|
|
.map(|s| s as u64)
|
|
}
|
|
|
|
pub fn benchmark_disk_random_writes(
|
|
limit: ExecutionLimit,
|
|
directory: &Path,
|
|
) -> Result<u64, String> {
|
|
const SIZE: usize = 64 * 1024 * 1024;
|
|
|
|
let buffer = random_data(SIZE);
|
|
let path = directory.join(".disk_bench_rand_wr.tmp");
|
|
|
|
let fp =
|
|
File::create(&path).map_err(|error| format!("failed to create a test file: {}", error))?;
|
|
|
|
let mut fp = TemporaryFile { fp: Some(fp), path };
|
|
|
|
// Since we want to test random writes we need an existing file
|
|
// through which we can seek, so here we just populate it with some data.
|
|
fp.write_all(&buffer)
|
|
.map_err(|error| format!("failed to write to the test file: {}", error))?;
|
|
|
|
fp.sync_all()
|
|
.map_err(|error| format!("failed to fsync the test file: {}", error))?;
|
|
|
|
// Generate a list of random positions at which we'll issue writes.
|
|
let mut positions = Vec::with_capacity(SIZE / 4096);
|
|
{
|
|
let mut position = 0;
|
|
while position < SIZE {
|
|
positions.push(position);
|
|
position += 4096;
|
|
}
|
|
}
|
|
|
|
positions.shuffle(&mut rng());
|
|
|
|
let run = || {
|
|
for &position in &positions {
|
|
fp.seek(SeekFrom::Start(position as u64))
|
|
.map_err(|error| format!("failed to seek in the test file: {}", error))?;
|
|
|
|
// Here we deliberately only write half of the chunk since we don't
|
|
// want the OS' disk scheduler to coalesce our writes into one single
|
|
// sequential write.
|
|
//
|
|
// Also the chunk's size is deliberately exactly half of a modern disk's
|
|
// sector size to trigger an RMW cycle.
|
|
let chunk = &buffer[position..position + 2048];
|
|
fp.write_all(&chunk)
|
|
.map_err(|error| format!("failed to write to the test file: {}", error))?;
|
|
}
|
|
|
|
fp.sync_all()
|
|
.map_err(|error| format!("failed to fsync the test file: {}", error))?;
|
|
|
|
Ok(())
|
|
};
|
|
|
|
// We only wrote half of the bytes hence `SIZE / 2`.
|
|
benchmark(
|
|
"disk random write score",
|
|
SIZE / 2,
|
|
limit.max_iterations(),
|
|
limit.max_duration(),
|
|
run,
|
|
)
|
|
.map(|s| s as u64)
|
|
}
|
|
|
|
/// Benchmarks the verification speed of sr25519 signatures.
|
|
///
|
|
/// Returns the throughput in MB/s by convention.
|
|
/// The values are rather small (0.4-0.8) so it is advised to convert them into KB/s.
|
|
pub fn benchmark_sr25519_verify(limit: ExecutionLimit) -> f64 {
|
|
const INPUT_SIZE: usize = 32;
|
|
const ITERATION_SIZE: usize = 2048;
|
|
let pair = sr25519::Pair::from_string("//Alice", None).unwrap();
|
|
|
|
let mut rng = rng();
|
|
let mut msgs = Vec::new();
|
|
let mut sigs = Vec::new();
|
|
|
|
for _ in 0..ITERATION_SIZE {
|
|
let mut msg = vec![0u8; INPUT_SIZE];
|
|
rng.fill_bytes(&mut msg[..]);
|
|
|
|
sigs.push(pair.sign(&msg));
|
|
msgs.push(msg);
|
|
}
|
|
|
|
let run = || -> Result<(), String> {
|
|
for (sig, msg) in sigs.iter().zip(msgs.iter()) {
|
|
let mut ok = sr25519_verify(&sig, &msg[..], &pair.public());
|
|
clobber_value(&mut ok);
|
|
}
|
|
Ok(())
|
|
};
|
|
benchmark(
|
|
"sr25519 verification score",
|
|
INPUT_SIZE * ITERATION_SIZE,
|
|
limit.max_iterations(),
|
|
limit.max_duration(),
|
|
run,
|
|
)
|
|
.expect("sr25519 verification cannot fail; qed")
|
|
}
|
|
|
|
/// Benchmarks the hardware and returns the results of those benchmarks.
|
|
///
|
|
/// Optionally accepts a path to a `scratch_directory` to use to benchmark the disk.
|
|
pub fn gather_hwbench(scratch_directory: Option<&Path>) -> HwBench {
|
|
#[allow(unused_mut)]
|
|
let mut hwbench = HwBench {
|
|
cpu_hashrate_score: benchmark_cpu(),
|
|
memory_memcpy_score: benchmark_memory(),
|
|
disk_sequential_write_score: None,
|
|
disk_random_write_score: None,
|
|
};
|
|
|
|
if let Some(scratch_directory) = scratch_directory {
|
|
hwbench.disk_sequential_write_score =
|
|
match benchmark_disk_sequential_writes(DEFAULT_DISK_EXECUTION_LIMIT, scratch_directory)
|
|
{
|
|
Ok(score) => Some(score),
|
|
Err(error) => {
|
|
log::warn!("Failed to run the sequential write disk benchmark: {}", error);
|
|
None
|
|
},
|
|
};
|
|
|
|
hwbench.disk_random_write_score =
|
|
match benchmark_disk_random_writes(DEFAULT_DISK_EXECUTION_LIMIT, scratch_directory) {
|
|
Ok(score) => Some(score),
|
|
Err(error) => {
|
|
log::warn!("Failed to run the random write disk benchmark: {}", error);
|
|
None
|
|
},
|
|
};
|
|
}
|
|
|
|
hwbench
|
|
}
|
|
|
|
#[cfg(test)]
mod tests {
    use super::*;

    /// On Linux every field of the gathered system information must be populated.
    #[cfg(target_os = "linux")]
    #[test]
    fn test_gather_sysinfo_linux() {
        let info = gather_sysinfo();

        assert!(info.cpu.unwrap().len() > 0);
        assert!(info.core_count.unwrap() > 0);
        assert!(info.memory.unwrap() > 0);
        assert_ne!(info.is_virtual_machine, None);
        assert_ne!(info.linux_kernel, None);
        assert_ne!(info.linux_distro, None);
    }

    /// The CPU benchmark must report a non-zero score.
    #[test]
    fn test_benchmark_cpu() {
        let score = benchmark_cpu();
        assert_ne!(score, 0);
    }

    /// The memory benchmark must report a non-zero score.
    #[test]
    fn test_benchmark_memory() {
        let score = benchmark_memory();
        assert_ne!(score, 0);
    }

    /// Sequential disk writes in the current directory must succeed with a positive score.
    #[test]
    fn test_benchmark_disk_sequential_writes() {
        let score =
            benchmark_disk_sequential_writes(DEFAULT_DISK_EXECUTION_LIMIT, "./".as_ref()).unwrap();
        assert!(score > 0);
    }

    /// Random disk writes in the current directory must succeed with a positive score.
    #[test]
    fn test_benchmark_disk_random_writes() {
        let score =
            benchmark_disk_random_writes(DEFAULT_DISK_EXECUTION_LIMIT, "./".as_ref()).unwrap();
        assert!(score > 0);
    }

    /// A single iteration of sr25519 verification must yield a positive throughput.
    #[test]
    fn test_benchmark_sr25519_verify() {
        let throughput = benchmark_sr25519_verify(ExecutionLimit::MaxIterations(1));
        assert!(throughput > 0.0);
    }
}
|