mirror of
https://github.com/pezkuwichain/pezkuwi-subxt.git
synced 2026-06-12 13:31:10 +00:00
initial jaeger integration (#2047)
Co-authored-by: Pierre Krieger <pierre.krieger1708@gmail.com> Co-authored-by: Peter Goodspeed-Niklaus <coriolinus@users.noreply.github.com> Co-authored-by: Bastian Köcher <bkchr@users.noreply.github.com>
This commit is contained in:
committed by
GitHub
parent
15c253117d
commit
a5fe710cc6
@@ -59,3 +59,21 @@ impl core::fmt::Display for ChainApiError {
|
||||
}
|
||||
|
||||
impl std::error::Error for ChainApiError {}
|
||||
|
||||
|
||||
/// A description of an error causing the chain API request to be unservable.
|
||||
#[derive(Debug, thiserror::Error)]
|
||||
#[allow(missing_docs)]
|
||||
pub enum JaegerError {
|
||||
#[error("Already launched the collector thread")]
|
||||
AlreadyLaunched,
|
||||
|
||||
#[error("Missing jaeger configuration")]
|
||||
MissingConfiguration,
|
||||
|
||||
#[error("Failed to allocate port for UDP transfer to jaeger agent")]
|
||||
PortAllocationError(#[source] std::io::Error),
|
||||
|
||||
#[error("Failed to send jaeger span to agent")]
|
||||
SendError(#[source] std::io::Error),
|
||||
}
|
||||
|
||||
@@ -0,0 +1,251 @@
|
||||
// Copyright 2020 Parity Technologies (UK) Ltd.
|
||||
// This file is part of Polkadot.
|
||||
|
||||
// Polkadot is free software: you can redistribute it and/or modify
|
||||
// it under the terms of the GNU General Public License as published by
|
||||
// the Free Software Foundation, either version 3 of the License, or
|
||||
// (at your option) any later version.
|
||||
|
||||
// Polkadot is distributed in the hope that it will be useful,
|
||||
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
// GNU General Public License for more details.
|
||||
|
||||
// You should have received a copy of the GNU General Public License
|
||||
// along with Polkadot. If not, see <http://www.gnu.org/licenses/>.
|
||||
|
||||
//! Jaeger integration.
|
||||
//!
|
||||
//! See <https://www.jaegertracing.io/> for an introduction.
|
||||
//!
|
||||
//! The easiest way to try Jaeger is:
|
||||
//!
|
||||
//! - Start a docker container with the all-in-one docker image (see below).
|
||||
//! - Open your browser and navigate to <https://localhost:16686> to acces the UI.
|
||||
//!
|
||||
//! The all-in-one image can be started with:
|
||||
//!
|
||||
//! ```not_rust
|
||||
//! podman login docker.io
|
||||
//! podman run -d --name jaeger \
|
||||
//! -e COLLECTOR_ZIPKIN_HTTP_PORT=9411 \
|
||||
//! -p 5775:5775/udp \
|
||||
//! -p 6831:6831/udp \
|
||||
//! -p 6832:6832/udp \
|
||||
//! -p 5778:5778 \
|
||||
//! -p 16686:16686 \
|
||||
//! -p 14268:14268 \
|
||||
//! -p 14250:14250 \
|
||||
//! -p 9411:9411 \
|
||||
//! docker.io/jaegertracing/all-in-one:1.21
|
||||
//! ```
|
||||
//!
|
||||
|
||||
use polkadot_node_primitives::SpawnNamed;
|
||||
use polkadot_primitives::v1::{Hash, PoV, CandidateHash};
|
||||
use parking_lot::RwLock;
|
||||
use std::sync::Arc;
|
||||
use std::result;
|
||||
pub use crate::errors::JaegerError;
|
||||
|
||||
|
||||
lazy_static::lazy_static! {
|
||||
static ref INSTANCE: RwLock<Jaeger> = RwLock::new(Jaeger::None);
|
||||
}
|
||||
|
||||
/// Configuration for the jaeger tracing.
|
||||
#[derive(Clone)]
|
||||
pub struct JaegerConfig {
|
||||
node_name: String,
|
||||
agent_addr: std::net::SocketAddr,
|
||||
}
|
||||
|
||||
impl std::default::Default for JaegerConfig {
|
||||
fn default() -> Self {
|
||||
Self {
|
||||
node_name: "unknown_".to_owned(),
|
||||
agent_addr: "127.0.0.1:6831".parse().expect(r#"Static "127.0.0.1:6831" is a valid socket address string. qed"#),
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
impl JaegerConfig {
|
||||
/// Use the builder pattern to construct a configuration.
|
||||
pub fn builder() -> JaegerConfigBuilder {
|
||||
JaegerConfigBuilder::default()
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
/// Jaeger configuration builder.
|
||||
#[derive(Default)]
|
||||
pub struct JaegerConfigBuilder {
|
||||
inner: JaegerConfig
|
||||
}
|
||||
|
||||
impl JaegerConfigBuilder {
|
||||
/// Set the name for this node.
|
||||
pub fn named<S>(mut self, name: S) -> Self where S: AsRef<str> {
|
||||
self.inner.node_name = name.as_ref().to_owned();
|
||||
self
|
||||
}
|
||||
|
||||
/// Set the agent address to send the collected spans to.
|
||||
pub fn agent<U>(mut self, addr: U) -> Self where U: Into<std::net::SocketAddr> {
|
||||
self.inner.agent_addr = addr.into();
|
||||
self
|
||||
}
|
||||
|
||||
/// Construct the configuration.
|
||||
pub fn build(self) -> JaegerConfig {
|
||||
self.inner
|
||||
}
|
||||
}
|
||||
|
||||
/// A wrapper type for a span.
|
||||
///
|
||||
/// Handles running with and without jaeger.
|
||||
pub enum JaegerSpan {
|
||||
/// Running with jaeger being enabled.
|
||||
Enabled(mick_jaeger::Span),
|
||||
/// Running with jaeger disabled.
|
||||
Disabled,
|
||||
}
|
||||
|
||||
impl JaegerSpan {
|
||||
/// Derive a child span from `self`.
|
||||
pub fn child(&self, name: impl Into<String>) -> Self {
|
||||
match self {
|
||||
Self::Enabled(inner) => Self::Enabled(inner.child(name)),
|
||||
Self::Disabled => Self::Disabled,
|
||||
}
|
||||
}
|
||||
/// Add an additional tag to the span.
|
||||
pub fn add_string_tag(&mut self, tag: &str, value: &str) {
|
||||
match self {
|
||||
Self::Enabled(ref mut inner) => inner.add_string_tag(tag, value),
|
||||
Self::Disabled => {},
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
impl From<Option<mick_jaeger::Span>> for JaegerSpan {
|
||||
fn from(src: Option<mick_jaeger::Span>) -> Self {
|
||||
if let Some(span) = src {
|
||||
Self::Enabled(span)
|
||||
} else {
|
||||
Self::Disabled
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
impl From<mick_jaeger::Span> for JaegerSpan {
|
||||
fn from(src: mick_jaeger::Span) -> Self {
|
||||
Self::Enabled(src)
|
||||
}
|
||||
}
|
||||
|
||||
/// Shortcut for [`candidate_hash_span`] with the hash of the `Candidate` block.
|
||||
#[inline(always)]
|
||||
pub fn candidate_hash_span(candidate_hash: &CandidateHash, span_name: impl Into<String>) -> JaegerSpan {
|
||||
INSTANCE.read_recursive().span(|| { candidate_hash.0 }, span_name).into()
|
||||
}
|
||||
|
||||
/// Shortcut for [`hash_span`] with the hash of the `PoV`.
|
||||
#[inline(always)]
|
||||
pub fn pov_span(pov: &PoV, span_name: impl Into<String>) -> JaegerSpan {
|
||||
INSTANCE.read_recursive().span(|| { pov.hash() }, span_name).into()
|
||||
}
|
||||
|
||||
/// Creates a `Span` referring to the given hash. All spans created with [`hash_span`] with the
|
||||
/// same hash (even from multiple different nodes) will be visible in the same view on Jaeger.
|
||||
#[inline(always)]
|
||||
pub fn hash_span(hash: &Hash, span_name: impl Into<String>) -> JaegerSpan {
|
||||
INSTANCE.read_recursive().span(|| { *hash }, span_name).into()
|
||||
}
|
||||
|
||||
/// Stateful convenience wrapper around [`mick_jaeger`].
|
||||
pub enum Jaeger {
|
||||
/// Launched and operational state.
|
||||
Launched {
|
||||
/// [`mick_jaeger`] provided API to record spans to.
|
||||
traces_in: Arc<mick_jaeger::TracesIn>,
|
||||
},
|
||||
/// Preparation state with the necessary config to launch the collector.
|
||||
Prep(JaegerConfig),
|
||||
/// Uninitialized, suggests wrong API usage if encountered.
|
||||
None,
|
||||
}
|
||||
|
||||
impl Jaeger {
|
||||
/// Spawn the jaeger instance.
|
||||
pub fn new(cfg: JaegerConfig) -> Self {
|
||||
Jaeger::Prep(cfg)
|
||||
}
|
||||
|
||||
/// Spawn the background task in order to send the tracing information out via udp
|
||||
#[cfg(target_os = "unknown")]
|
||||
pub fn launch<S: SpawnNamed>(self, _spawner: S) -> result::Result<(), JaegerError> {
|
||||
Ok(())
|
||||
}
|
||||
|
||||
/// Spawn the background task in order to send the tracing information out via udp
|
||||
#[cfg(not(target_os = "unknown"))]
|
||||
pub fn launch<S: SpawnNamed>(self, spawner: S) -> result::Result<(), JaegerError> {
|
||||
let cfg = match self {
|
||||
Self::Prep(cfg) => Ok(cfg),
|
||||
Self::Launched{ .. } => {
|
||||
return Err(JaegerError::AlreadyLaunched)
|
||||
}
|
||||
Self::None => Err(JaegerError::MissingConfiguration),
|
||||
}?;
|
||||
|
||||
let jaeger_agent = cfg.agent_addr;
|
||||
|
||||
log::info!("🐹 Collecting jaeger spans for {:?}", &jaeger_agent);
|
||||
|
||||
let (traces_in, mut traces_out) = mick_jaeger::init(mick_jaeger::Config {
|
||||
service_name: format!("{}-{}", cfg.node_name, cfg.node_name),
|
||||
});
|
||||
|
||||
// Spawn a background task that pulls span information and sends them on the network.
|
||||
spawner.spawn("jaeger-collector", Box::pin(async move {
|
||||
let res = async_std::net::UdpSocket::bind("127.0.0.1:0").await
|
||||
.map_err(JaegerError::PortAllocationError);
|
||||
match res {
|
||||
Ok(udp_socket) => loop {
|
||||
let buf = traces_out.next().await;
|
||||
// UDP sending errors happen only either if the API is misused or in case of missing privilege.
|
||||
if let Err(e) = udp_socket.send_to(&buf, jaeger_agent).await
|
||||
.map_err(|e| JaegerError::SendError(e))
|
||||
{
|
||||
log::trace!("Jaeger: {:?}", e);
|
||||
}
|
||||
}
|
||||
Err(e) => {
|
||||
log::warn!("Jaeger: {:?}", e);
|
||||
}
|
||||
}
|
||||
}));
|
||||
|
||||
*INSTANCE.write() = Self::Launched {
|
||||
traces_in,
|
||||
};
|
||||
Ok(())
|
||||
}
|
||||
|
||||
fn span<F>(&self, lazy_hash: F, span_name: impl Into<String>) -> Option<mick_jaeger::Span>
|
||||
where
|
||||
F: Fn() -> Hash,
|
||||
{
|
||||
if let Self::Launched { traces_in , .. } = self {
|
||||
let hash = lazy_hash();
|
||||
let mut buf = [0u8; 16];
|
||||
buf.copy_from_slice(&hash.as_ref()[0..16]);
|
||||
let trace_id = std::num::NonZeroU128::new(u128::from_be_bytes(buf))?;
|
||||
Some(traces_in.span(trace_id, span_name))
|
||||
} else {
|
||||
None
|
||||
}
|
||||
}
|
||||
}
|
||||
@@ -31,12 +31,13 @@ use futures::future::BoxFuture;
|
||||
use polkadot_primitives::v1::Hash;
|
||||
use async_trait::async_trait;
|
||||
use smallvec::SmallVec;
|
||||
use thiserror::Error;
|
||||
|
||||
use crate::messages::AllMessages;
|
||||
|
||||
pub mod errors;
|
||||
pub mod messages;
|
||||
pub mod jaeger;
|
||||
pub use crate::jaeger::*;
|
||||
|
||||
/// How many slots are stack-reserved for active leaves updates
|
||||
///
|
||||
@@ -119,29 +120,27 @@ pub enum FromOverseer<M> {
|
||||
/// * Subsystems dying when they are not expected to
|
||||
/// * Subsystems not dying when they are told to die
|
||||
/// * etc.
|
||||
#[derive(Error, Debug)]
|
||||
#[derive(thiserror::Error, Debug)]
|
||||
#[allow(missing_docs)]
|
||||
pub enum SubsystemError {
|
||||
/// A notification connection is no longer valid.
|
||||
#[error(transparent)]
|
||||
NotifyCancellation(#[from] oneshot::Canceled),
|
||||
|
||||
/// Queue does not accept another item.
|
||||
#[error(transparent)]
|
||||
QueueError(#[from] mpsc::SendError),
|
||||
|
||||
/// An attempt to spawn a futures task did not succeed.
|
||||
#[error(transparent)]
|
||||
TaskSpawn(#[from] futures::task::SpawnError),
|
||||
|
||||
/// An infallable error.
|
||||
#[error(transparent)]
|
||||
Infallible(#[from] std::convert::Infallible),
|
||||
|
||||
/// Prometheus had a problem
|
||||
#[error(transparent)]
|
||||
Prometheus(#[from] substrate_prometheus_endpoint::PrometheusError),
|
||||
|
||||
/// An other error lacking particular type information.
|
||||
#[error(transparent)]
|
||||
Jaeger(#[from] errors::JaegerError),
|
||||
|
||||
#[error("Failed to {0}")]
|
||||
Context(String),
|
||||
|
||||
|
||||
Reference in New Issue
Block a user