mirror of
https://github.com/pezkuwichain/pezkuwi-subxt.git
synced 2026-06-15 01:01:04 +00:00
New PVF validation host (#2710)
* Implement PVF validation host * WIP: Diener * Increase the alloted compilation time * Add more comments * Minor clean up * Apply suggestions from code review Co-authored-by: Bastian Köcher <bkchr@users.noreply.github.com> * Fix pruning artifact removal * Fix formatting and newlines * Fix the thread pool * Update node/core/pvf/src/executor_intf.rs Co-authored-by: Bastian Köcher <bkchr@users.noreply.github.com> * Remove redundant test declaration * Don't convert the path into an intermediate string * Try to workaround the test failure * Use the puppet_worker trick again * Fix a blip * Move `ensure_wasmtime_version` under the tests mod * Add a macro for puppet_workers * fix build for not real-overseer * Rename the puppet worker for adder collator * play it safe with the name of adder puppet worker * Typo: triggered * Add more comments * Do not kill exec worker on every error * Plumb Duration for timeouts * typo: critical * Add proofs * Clean unused imports * Revert "WIP: Diener" This reverts commit b9f54e513366c7a6dfdd117ac19fbdc46b900b4d. * Sync version of wasmtime * Update cargo.lock * Update Substrate * Merge fixes still * Update wasmtime version in test * bastifmt Co-authored-by: Bastian Köcher <bkchr@users.noreply.github.com> * Squash spaces * Trailing new line for testing.rs * Remove controversial code * comment about biasing * Fix suggestion * Add comments * make it more clear why unwrap_err * tmpfile retry * proper proofs for claim_idle * Remove mutex from ValidationHost * Add some more logging * Extract exec timeout into a constant * Add some clarifying logging * Use blake2_256 * Clean up the merge Specifically the leftovers after removing real-overseer * Update parachain/test-parachains/adder/collator/Cargo.toml Co-authored-by: Andronik Ordian <write@reusable.software> Co-authored-by: Bastian Köcher <bkchr@users.noreply.github.com> Co-authored-by: Andronik Ordian <write@reusable.software>
This commit is contained in:
@@ -0,0 +1,311 @@
|
||||
// Copyright 2021 Parity Technologies (UK) Ltd.
|
||||
// This file is part of Polkadot.
|
||||
|
||||
// Polkadot is free software: you can redistribute it and/or modify
|
||||
// it under the terms of the GNU General Public License as published by
|
||||
// the Free Software Foundation, either version 3 of the License, or
|
||||
// (at your option) any later version.
|
||||
|
||||
// Polkadot is distributed in the hope that it will be useful,
|
||||
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
// GNU General Public License for more details.
|
||||
|
||||
// You should have received a copy of the GNU General Public License
|
||||
// along with Polkadot. If not, see <http://www.gnu.org/licenses/>.
|
||||
|
||||
use crate::LOG_TARGET;
|
||||
use always_assert::always;
|
||||
use async_std::{
|
||||
io,
|
||||
path::{Path, PathBuf},
|
||||
};
|
||||
use polkadot_core_primitives::Hash;
|
||||
use std::{
|
||||
collections::HashMap,
|
||||
time::{Duration, SystemTime},
|
||||
};
|
||||
use parity_scale_codec::{Encode, Decode};
|
||||
use futures::StreamExt;
|
||||
|
||||
/// A final product of preparation process. Contains either a ready to run compiled artifact or
|
||||
/// a description what went wrong.
|
||||
#[derive(Encode, Decode)]
|
||||
pub enum Artifact {
|
||||
/// During the prevalidation stage of preparation an issue was found with the PVF.
|
||||
PrevalidationErr(String),
|
||||
/// Compilation failed for the given PVF.
|
||||
PreparationErr(String),
|
||||
/// This state indicates that the process assigned to prepare the artifact wasn't responsible
|
||||
/// or were killed. This state is reported by the validation host (not by the worker).
|
||||
DidntMakeIt,
|
||||
/// The PVF passed all the checks and is ready for execution.
|
||||
Compiled { compiled_artifact: Vec<u8> },
|
||||
}
|
||||
|
||||
impl Artifact {
|
||||
/// Serializes this struct into a byte buffer.
|
||||
pub fn serialize(&self) -> Vec<u8> {
|
||||
self.encode()
|
||||
}
|
||||
|
||||
/// Deserialize the given byte buffer to an artifact.
|
||||
pub fn deserialize(mut bytes: &[u8]) -> Result<Self, String> {
|
||||
Artifact::decode(&mut bytes).map_err(|e| format!("{:?}", e))
|
||||
}
|
||||
}
|
||||
|
||||
/// Identifier of an artifact. Right now it only encodes a code hash of the PVF. But if we get to
|
||||
/// multiple engine implementations the artifact ID should include the engine type as well.
|
||||
#[derive(Clone, Debug, PartialEq, Eq, PartialOrd, Ord, Hash)]
|
||||
pub struct ArtifactId {
|
||||
code_hash: Hash,
|
||||
}
|
||||
|
||||
impl ArtifactId {
|
||||
const PREFIX: &'static str = "wasmtime_1_";
|
||||
|
||||
/// Creates a new artifact ID with the given hash.
|
||||
pub fn new(code_hash: Hash) -> Self {
|
||||
Self { code_hash }
|
||||
}
|
||||
|
||||
/// Tries to recover the artifact id from the given file name.
|
||||
pub fn from_file_name(file_name: &str) -> Option<Self> {
|
||||
use std::str::FromStr as _;
|
||||
|
||||
let file_name = file_name.strip_prefix(Self::PREFIX)?;
|
||||
let code_hash = Hash::from_str(file_name).ok()?;
|
||||
|
||||
Some(Self { code_hash })
|
||||
}
|
||||
|
||||
/// Returns the expected path to this artifact given the root of the cache.
|
||||
pub fn path(&self, cache_path: &Path) -> PathBuf {
|
||||
let file_name = format!("{}{}", Self::PREFIX, self.code_hash.to_string());
|
||||
cache_path.join(file_name)
|
||||
}
|
||||
}
|
||||
|
||||
pub enum ArtifactState {
|
||||
/// The artifact is ready to be used by the executor.
|
||||
///
|
||||
/// That means that the artifact should be accessible through the path obtained by the artifact
|
||||
/// id (unless, it was removed externally).
|
||||
Prepared {
|
||||
/// The time when the artifact was the last time needed.
|
||||
///
|
||||
/// This is updated when we get the heads up for this artifact or when we just discover
|
||||
/// this file.
|
||||
last_time_needed: SystemTime,
|
||||
},
|
||||
/// A task to prepare this artifact is scheduled.
|
||||
Preparing,
|
||||
}
|
||||
|
||||
/// A container of all known artifact ids and their states.
|
||||
pub struct Artifacts {
|
||||
artifacts: HashMap<ArtifactId, ArtifactState>,
|
||||
}
|
||||
|
||||
impl Artifacts {
|
||||
/// Scan the given cache root for the artifacts.
|
||||
///
|
||||
/// The recognized artifacts will be filled in the table and unrecognized will be removed.
|
||||
pub async fn new(cache_path: &Path) -> Self {
|
||||
// Make sure that the cache path directory and all it's parents are created.
|
||||
let _ = async_std::fs::create_dir_all(cache_path).await;
|
||||
|
||||
let artifacts = match scan_for_known_artifacts(cache_path).await {
|
||||
Ok(a) => a,
|
||||
Err(err) => {
|
||||
tracing::warn!(
|
||||
target: LOG_TARGET,
|
||||
"unable to seed the artifacts in memory cache: {:?}. Starting with a clean one",
|
||||
err,
|
||||
);
|
||||
HashMap::new()
|
||||
}
|
||||
};
|
||||
|
||||
Self { artifacts }
|
||||
}
|
||||
|
||||
#[cfg(test)]
|
||||
pub(crate) fn empty() -> Self {
|
||||
Self {
|
||||
artifacts: HashMap::new(),
|
||||
}
|
||||
}
|
||||
|
||||
/// Returns the state of the given artifact by its ID.
|
||||
pub fn artifact_state_mut(&mut self, artifact_id: &ArtifactId) -> Option<&mut ArtifactState> {
|
||||
self.artifacts.get_mut(artifact_id)
|
||||
}
|
||||
|
||||
/// Inform the table about the artifact with the given ID. The state will be set to "preparing".
|
||||
///
|
||||
/// This function must be used only for brand new artifacts and should never be used for
|
||||
/// replacing existing ones.
|
||||
pub fn insert_preparing(&mut self, artifact_id: ArtifactId) {
|
||||
// See the precondition.
|
||||
always!(self
|
||||
.artifacts
|
||||
.insert(artifact_id, ArtifactState::Preparing)
|
||||
.is_none());
|
||||
}
|
||||
|
||||
/// Insert an artifact with the given ID as "prepared".
|
||||
///
|
||||
/// This function must be used only for brand new artifacts and should never be used for
|
||||
/// replacing existing ones.
|
||||
#[cfg(test)]
|
||||
pub fn insert_prepared(&mut self, artifact_id: ArtifactId, last_time_needed: SystemTime) {
|
||||
// See the precondition.
|
||||
always!(self
|
||||
.artifacts
|
||||
.insert(artifact_id, ArtifactState::Prepared { last_time_needed })
|
||||
.is_none());
|
||||
}
|
||||
|
||||
/// Remove and retrive the artifacts from the table that are older than the supplied Time-To-Live.
|
||||
pub fn prune(&mut self, artifact_ttl: Duration) -> Vec<ArtifactId> {
|
||||
let now = SystemTime::now();
|
||||
|
||||
let mut to_remove = vec![];
|
||||
for (k, v) in self.artifacts.iter() {
|
||||
if let ArtifactState::Prepared {
|
||||
last_time_needed, ..
|
||||
} = *v {
|
||||
if now
|
||||
.duration_since(last_time_needed)
|
||||
.map(|age| age > artifact_ttl)
|
||||
.unwrap_or(false)
|
||||
{
|
||||
to_remove.push(k.clone());
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
for artifact in &to_remove {
|
||||
self.artifacts.remove(artifact);
|
||||
}
|
||||
|
||||
to_remove
|
||||
}
|
||||
}
|
||||
|
||||
/// Goes over all files in the given directory, collecting all recognizable artifacts. All files
|
||||
/// that do not look like artifacts are removed.
|
||||
///
|
||||
/// All recognized artifacts will be created with the current datetime.
|
||||
async fn scan_for_known_artifacts(
|
||||
cache_path: &Path,
|
||||
) -> io::Result<HashMap<ArtifactId, ArtifactState>> {
|
||||
let mut result = HashMap::new();
|
||||
let now = SystemTime::now();
|
||||
|
||||
let mut dir = async_std::fs::read_dir(cache_path).await?;
|
||||
while let Some(res) = dir.next().await {
|
||||
let entry = res?;
|
||||
|
||||
if entry.file_type().await?.is_dir() {
|
||||
tracing::debug!(
|
||||
target: LOG_TARGET,
|
||||
"{} is a dir, and dirs do not belong to us. Removing",
|
||||
entry.path().display(),
|
||||
);
|
||||
let _ = async_std::fs::remove_dir_all(entry.path()).await;
|
||||
}
|
||||
|
||||
let path = entry.path();
|
||||
let file_name = match path.file_name() {
|
||||
None => {
|
||||
// A file without a file name? Weird, just skip it.
|
||||
continue;
|
||||
}
|
||||
Some(file_name) => file_name,
|
||||
};
|
||||
|
||||
let file_name = match file_name.to_str() {
|
||||
None => {
|
||||
tracing::debug!(
|
||||
target: LOG_TARGET,
|
||||
"{} is not utf-8. Removing",
|
||||
path.display(),
|
||||
);
|
||||
let _ = async_std::fs::remove_file(&path).await;
|
||||
continue;
|
||||
}
|
||||
Some(file_name) => file_name,
|
||||
};
|
||||
|
||||
let artifact_id = match ArtifactId::from_file_name(file_name) {
|
||||
None => {
|
||||
tracing::debug!(
|
||||
target: LOG_TARGET,
|
||||
"{} is not a recognized artifact. Removing",
|
||||
path.display(),
|
||||
);
|
||||
let _ = async_std::fs::remove_file(&path).await;
|
||||
continue;
|
||||
}
|
||||
Some(artifact_id) => artifact_id,
|
||||
};
|
||||
|
||||
// A sanity check so that we really can access the artifact through the artifact id.
|
||||
if artifact_id.path(cache_path).is_file().await {
|
||||
result.insert(
|
||||
artifact_id,
|
||||
ArtifactState::Prepared {
|
||||
last_time_needed: now,
|
||||
},
|
||||
);
|
||||
} else {
|
||||
tracing::warn!(
|
||||
target: LOG_TARGET,
|
||||
"{} is not accessible by artifact_id {:?}",
|
||||
cache_path.display(),
|
||||
artifact_id,
|
||||
);
|
||||
}
|
||||
}
|
||||
|
||||
Ok(result)
|
||||
}
|
||||
|
||||
#[cfg(test)]
|
||||
mod tests {
|
||||
use super::ArtifactId;
|
||||
|
||||
#[test]
|
||||
fn ensure_wasmtime_version() {
|
||||
assert_eq!(
|
||||
wasmtime_jit::VERSION,
|
||||
"0.24.0",
|
||||
"wasmtime version is updated. Check the prefix.",
|
||||
);
|
||||
// If the version bump is significant, change `ArtifactId::PREFIX`.
|
||||
//
|
||||
// If in doubt bump it. This will lead to removal of the existing artifacts in the on-disk cache
|
||||
// and recompilation.
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn from_file_name() {
|
||||
assert!(ArtifactId::from_file_name("").is_none());
|
||||
assert!(ArtifactId::from_file_name("junk").is_none());
|
||||
|
||||
assert_eq!(
|
||||
ArtifactId::from_file_name(
|
||||
"wasmtime_1_0x0022800000000000000000000000000000000000000000000000000000000000"
|
||||
),
|
||||
Some(ArtifactId::new(
|
||||
hex_literal::hex![
|
||||
"0022800000000000000000000000000000000000000000000000000000000000"
|
||||
]
|
||||
.into()
|
||||
)),
|
||||
);
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user