mirror of
https://github.com/pezkuwichain/pezkuwi-subxt.git
synced 2026-06-11 23:31:07 +00:00
Add group name in task metrics (#10196)
* SpawnNamed: add new trait methods Signed-off-by: Andrei Sandu <sandu.andrei@gmail.com> * Implement new methods Signed-off-by: Andrei Sandu <sandu.andrei@gmail.com> * cargo fmt Signed-off-by: Andrei Sandu <sandu.andrei@gmail.com> * SpawnNamed: add new trait methods Signed-off-by: Andrei Sandu <sandu.andrei@gmail.com> * Implement new methods Signed-off-by: Andrei Sandu <sandu.andrei@gmail.com> * cargo fmt Signed-off-by: Andrei Sandu <sandu.andrei@gmail.com> * New approach - spaw() group param Signed-off-by: Andrei Sandu <andrei-mihail@parity.io> * Update traits: SpawnNamed and SpawnNamed Signed-off-by: Andrei Sandu <andrei-mihail@parity.io> * Update TaskManager tests Signed-off-by: Andrei Sandu <andrei-mihail@parity.io> * Update test TaskExecutor Signed-off-by: Andrei Sandu <andrei-mihail@parity.io> * Fix typo Signed-off-by: Andrei Sandu <andrei-mihail@parity.io> * grunt work: fix spawn() calls Signed-off-by: Andrei Sandu <andrei-mihail@parity.io> * cargo fmt Signed-off-by: Andrei Sandu <andrei-mihail@parity.io> * remove old code Signed-off-by: Andrei Sandu <andrei-mihail@parity.io> * cargo fmt - the right version Signed-off-by: Andrei Sandu <andrei-mihail@parity.io> * Implement review feedback - use Option group name in SpawnNamed methods - switch to kebab case - implement default group name - add group name to some tasks Signed-off-by: Andrei Sandu <andrei-mihail@parity.io>
This commit is contained in:
@@ -38,6 +38,9 @@ mod prometheus_future;
|
||||
#[cfg(test)]
|
||||
mod tests;
|
||||
|
||||
/// Default task group name.
|
||||
pub const DEFAULT_GROUP_NAME: &'static str = "default";
|
||||
|
||||
/// An handle for spawning tasks in the service.
|
||||
#[derive(Clone)]
|
||||
pub struct SpawnTaskHandle {
|
||||
@@ -48,31 +51,39 @@ pub struct SpawnTaskHandle {
|
||||
}
|
||||
|
||||
impl SpawnTaskHandle {
|
||||
/// Spawns the given task with the given name.
|
||||
/// Spawns the given task with the given name and an optional group name.
|
||||
/// If group is not specified `DEFAULT_GROUP_NAME` will be used.
|
||||
///
|
||||
/// Note that the `name` is a `&'static str`. The reason for this choice is that statistics
|
||||
/// about this task are getting reported to the Prometheus endpoint (if enabled), and that
|
||||
/// therefore the set of possible task names must be bounded.
|
||||
/// Note that the `name`/`group` is a `&'static str`. The reason for this choice is that
|
||||
/// statistics about this task are getting reported to the Prometheus endpoint (if enabled), and
|
||||
/// that therefore the set of possible task names must be bounded.
|
||||
///
|
||||
/// In other words, it would be a bad idea for someone to do for example
|
||||
/// `spawn(format!("{:?}", some_public_key))`.
|
||||
pub fn spawn(&self, name: &'static str, task: impl Future<Output = ()> + Send + 'static) {
|
||||
self.spawn_inner(name, task, TaskType::Async)
|
||||
pub fn spawn(
|
||||
&self,
|
||||
name: &'static str,
|
||||
group: Option<&'static str>,
|
||||
task: impl Future<Output = ()> + Send + 'static,
|
||||
) {
|
||||
self.spawn_inner(name, group, task, TaskType::Async)
|
||||
}
|
||||
|
||||
/// Spawns the blocking task with the given name. See also `spawn`.
|
||||
pub fn spawn_blocking(
|
||||
&self,
|
||||
name: &'static str,
|
||||
group: Option<&'static str>,
|
||||
task: impl Future<Output = ()> + Send + 'static,
|
||||
) {
|
||||
self.spawn_inner(name, task, TaskType::Blocking)
|
||||
self.spawn_inner(name, group, task, TaskType::Blocking)
|
||||
}
|
||||
|
||||
/// Helper function that implements the spawning logic. See `spawn` and `spawn_blocking`.
|
||||
fn spawn_inner(
|
||||
&self,
|
||||
name: &'static str,
|
||||
group: Option<&'static str>,
|
||||
task: impl Future<Output = ()> + Send + 'static,
|
||||
task_type: TaskType,
|
||||
) {
|
||||
@@ -83,21 +94,23 @@ impl SpawnTaskHandle {
|
||||
|
||||
let on_exit = self.on_exit.clone();
|
||||
let metrics = self.metrics.clone();
|
||||
// If no group is specified use default.
|
||||
let group = group.unwrap_or(DEFAULT_GROUP_NAME);
|
||||
|
||||
// Note that we increase the started counter here and not within the future. This way,
|
||||
// we could properly visualize on Prometheus situations where the spawning doesn't work.
|
||||
if let Some(metrics) = &self.metrics {
|
||||
metrics.tasks_spawned.with_label_values(&[name]).inc();
|
||||
metrics.tasks_spawned.with_label_values(&[name, group]).inc();
|
||||
// We do a dummy increase in order for the task to show up in metrics.
|
||||
metrics.tasks_ended.with_label_values(&[name, "finished"]).inc_by(0);
|
||||
metrics.tasks_ended.with_label_values(&[name, "finished", group]).inc_by(0);
|
||||
}
|
||||
|
||||
let future = async move {
|
||||
if let Some(metrics) = metrics {
|
||||
// Add some wrappers around `task`.
|
||||
let task = {
|
||||
let poll_duration = metrics.poll_duration.with_label_values(&[name]);
|
||||
let poll_start = metrics.poll_start.with_label_values(&[name]);
|
||||
let poll_duration = metrics.poll_duration.with_label_values(&[name, group]);
|
||||
let poll_start = metrics.poll_start.with_label_values(&[name, group]);
|
||||
let inner =
|
||||
prometheus_future::with_poll_durations(poll_duration, poll_start, task);
|
||||
// The logic of `AssertUnwindSafe` here is ok considering that we throw
|
||||
@@ -108,15 +121,15 @@ impl SpawnTaskHandle {
|
||||
|
||||
match select(on_exit, task).await {
|
||||
Either::Right((Err(payload), _)) => {
|
||||
metrics.tasks_ended.with_label_values(&[name, "panic"]).inc();
|
||||
metrics.tasks_ended.with_label_values(&[name, "panic", group]).inc();
|
||||
panic::resume_unwind(payload)
|
||||
},
|
||||
Either::Right((Ok(()), _)) => {
|
||||
metrics.tasks_ended.with_label_values(&[name, "finished"]).inc();
|
||||
metrics.tasks_ended.with_label_values(&[name, "finished", group]).inc();
|
||||
},
|
||||
Either::Left(((), _)) => {
|
||||
// The `on_exit` has triggered.
|
||||
metrics.tasks_ended.with_label_values(&[name, "interrupted"]).inc();
|
||||
metrics.tasks_ended.with_label_values(&[name, "interrupted", group]).inc();
|
||||
},
|
||||
}
|
||||
} else {
|
||||
@@ -141,12 +154,22 @@ impl SpawnTaskHandle {
|
||||
}
|
||||
|
||||
impl sp_core::traits::SpawnNamed for SpawnTaskHandle {
|
||||
fn spawn_blocking(&self, name: &'static str, future: BoxFuture<'static, ()>) {
|
||||
self.spawn_blocking(name, future);
|
||||
fn spawn_blocking(
|
||||
&self,
|
||||
name: &'static str,
|
||||
group: Option<&'static str>,
|
||||
future: BoxFuture<'static, ()>,
|
||||
) {
|
||||
self.spawn_inner(name, group, future, TaskType::Blocking)
|
||||
}
|
||||
|
||||
fn spawn(&self, name: &'static str, future: BoxFuture<'static, ()>) {
|
||||
self.spawn(name, future);
|
||||
fn spawn(
|
||||
&self,
|
||||
name: &'static str,
|
||||
group: Option<&'static str>,
|
||||
future: BoxFuture<'static, ()>,
|
||||
) {
|
||||
self.spawn_inner(name, group, future, TaskType::Async)
|
||||
}
|
||||
}
|
||||
|
||||
@@ -172,8 +195,13 @@ impl SpawnEssentialTaskHandle {
|
||||
/// Spawns the given task with the given name.
|
||||
///
|
||||
/// See also [`SpawnTaskHandle::spawn`].
|
||||
pub fn spawn(&self, name: &'static str, task: impl Future<Output = ()> + Send + 'static) {
|
||||
self.spawn_inner(name, task, TaskType::Async)
|
||||
pub fn spawn(
|
||||
&self,
|
||||
name: &'static str,
|
||||
group: Option<&'static str>,
|
||||
task: impl Future<Output = ()> + Send + 'static,
|
||||
) {
|
||||
self.spawn_inner(name, group, task, TaskType::Async)
|
||||
}
|
||||
|
||||
/// Spawns the blocking task with the given name.
|
||||
@@ -182,14 +210,16 @@ impl SpawnEssentialTaskHandle {
|
||||
pub fn spawn_blocking(
|
||||
&self,
|
||||
name: &'static str,
|
||||
group: Option<&'static str>,
|
||||
task: impl Future<Output = ()> + Send + 'static,
|
||||
) {
|
||||
self.spawn_inner(name, task, TaskType::Blocking)
|
||||
self.spawn_inner(name, group, task, TaskType::Blocking)
|
||||
}
|
||||
|
||||
fn spawn_inner(
|
||||
&self,
|
||||
name: &'static str,
|
||||
group: Option<&'static str>,
|
||||
task: impl Future<Output = ()> + Send + 'static,
|
||||
task_type: TaskType,
|
||||
) {
|
||||
@@ -199,17 +229,27 @@ impl SpawnEssentialTaskHandle {
|
||||
let _ = essential_failed.close_channel();
|
||||
});
|
||||
|
||||
let _ = self.inner.spawn_inner(name, essential_task, task_type);
|
||||
let _ = self.inner.spawn_inner(name, group, essential_task, task_type);
|
||||
}
|
||||
}
|
||||
|
||||
impl sp_core::traits::SpawnEssentialNamed for SpawnEssentialTaskHandle {
|
||||
fn spawn_essential_blocking(&self, name: &'static str, future: BoxFuture<'static, ()>) {
|
||||
self.spawn_blocking(name, future);
|
||||
fn spawn_essential_blocking(
|
||||
&self,
|
||||
name: &'static str,
|
||||
group: Option<&'static str>,
|
||||
future: BoxFuture<'static, ()>,
|
||||
) {
|
||||
self.spawn_blocking(name, group, future);
|
||||
}
|
||||
|
||||
fn spawn_essential(&self, name: &'static str, future: BoxFuture<'static, ()>) {
|
||||
self.spawn(name, future);
|
||||
fn spawn_essential(
|
||||
&self,
|
||||
name: &'static str,
|
||||
group: Option<&'static str>,
|
||||
future: BoxFuture<'static, ()>,
|
||||
) {
|
||||
self.spawn(name, group, future);
|
||||
}
|
||||
}
|
||||
|
||||
@@ -396,28 +436,28 @@ impl Metrics {
|
||||
buckets: exponential_buckets(0.001, 4.0, 9)
|
||||
.expect("function parameters are constant and always valid; qed"),
|
||||
},
|
||||
&["task_name"]
|
||||
&["task_name", "task_group"]
|
||||
)?, registry)?,
|
||||
poll_start: register(CounterVec::new(
|
||||
Opts::new(
|
||||
"tasks_polling_started_total",
|
||||
"Total number of times we started invoking Future::poll"
|
||||
),
|
||||
&["task_name"]
|
||||
&["task_name", "task_group"]
|
||||
)?, registry)?,
|
||||
tasks_spawned: register(CounterVec::new(
|
||||
Opts::new(
|
||||
"tasks_spawned_total",
|
||||
"Total number of tasks that have been spawned on the Service"
|
||||
),
|
||||
&["task_name"]
|
||||
&["task_name", "task_group"]
|
||||
)?, registry)?,
|
||||
tasks_ended: register(CounterVec::new(
|
||||
Opts::new(
|
||||
"tasks_ended_total",
|
||||
"Total number of tasks for which Future::poll has returned Ready(()) or panicked"
|
||||
),
|
||||
&["task_name", "reason"]
|
||||
&["task_name", "reason", "task_group"]
|
||||
)?, registry)?,
|
||||
})
|
||||
}
|
||||
|
||||
@@ -96,8 +96,8 @@ fn ensure_tasks_are_awaited_on_shutdown() {
|
||||
let task_manager = new_task_manager(handle);
|
||||
let spawn_handle = task_manager.spawn_handle();
|
||||
let drop_tester = DropTester::new();
|
||||
spawn_handle.spawn("task1", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task2", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task1", None, run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task2", None, run_background_task(drop_tester.new_ref()));
|
||||
assert_eq!(drop_tester, 2);
|
||||
// allow the tasks to even start
|
||||
runtime.block_on(async { tokio::time::sleep(Duration::from_secs(1)).await });
|
||||
@@ -115,7 +115,7 @@ fn ensure_keep_alive_during_shutdown() {
|
||||
let spawn_handle = task_manager.spawn_handle();
|
||||
let drop_tester = DropTester::new();
|
||||
task_manager.keep_alive(drop_tester.new_ref());
|
||||
spawn_handle.spawn("task1", run_background_task(()));
|
||||
spawn_handle.spawn("task1", None, run_background_task(()));
|
||||
assert_eq!(drop_tester, 1);
|
||||
// allow the tasks to even start
|
||||
runtime.block_on(async { tokio::time::sleep(Duration::from_secs(1)).await });
|
||||
@@ -134,10 +134,12 @@ fn ensure_blocking_futures_are_awaited_on_shutdown() {
|
||||
let drop_tester = DropTester::new();
|
||||
spawn_handle.spawn(
|
||||
"task1",
|
||||
None,
|
||||
run_background_task_blocking(Duration::from_secs(3), drop_tester.new_ref()),
|
||||
);
|
||||
spawn_handle.spawn(
|
||||
"task2",
|
||||
None,
|
||||
run_background_task_blocking(Duration::from_secs(3), drop_tester.new_ref()),
|
||||
);
|
||||
assert_eq!(drop_tester, 2);
|
||||
@@ -156,14 +158,14 @@ fn ensure_no_task_can_be_spawn_after_terminate() {
|
||||
let mut task_manager = new_task_manager(handle);
|
||||
let spawn_handle = task_manager.spawn_handle();
|
||||
let drop_tester = DropTester::new();
|
||||
spawn_handle.spawn("task1", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task2", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task1", None, run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task2", None, run_background_task(drop_tester.new_ref()));
|
||||
assert_eq!(drop_tester, 2);
|
||||
// allow the tasks to even start
|
||||
runtime.block_on(async { tokio::time::sleep(Duration::from_secs(1)).await });
|
||||
assert_eq!(drop_tester, 2);
|
||||
task_manager.terminate();
|
||||
spawn_handle.spawn("task3", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task3", None, run_background_task(drop_tester.new_ref()));
|
||||
runtime.block_on(task_manager.clean_shutdown());
|
||||
drop_tester.wait_on_drop();
|
||||
}
|
||||
@@ -176,8 +178,8 @@ fn ensure_task_manager_future_ends_when_task_manager_terminated() {
|
||||
let mut task_manager = new_task_manager(handle);
|
||||
let spawn_handle = task_manager.spawn_handle();
|
||||
let drop_tester = DropTester::new();
|
||||
spawn_handle.spawn("task1", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task2", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task1", None, run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task2", None, run_background_task(drop_tester.new_ref()));
|
||||
assert_eq!(drop_tester, 2);
|
||||
// allow the tasks to even start
|
||||
runtime.block_on(async { tokio::time::sleep(Duration::from_secs(1)).await });
|
||||
@@ -197,13 +199,13 @@ fn ensure_task_manager_future_ends_with_error_when_essential_task_fails() {
|
||||
let spawn_handle = task_manager.spawn_handle();
|
||||
let spawn_essential_handle = task_manager.spawn_essential_handle();
|
||||
let drop_tester = DropTester::new();
|
||||
spawn_handle.spawn("task1", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task2", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task1", None, run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task2", None, run_background_task(drop_tester.new_ref()));
|
||||
assert_eq!(drop_tester, 2);
|
||||
// allow the tasks to even start
|
||||
runtime.block_on(async { tokio::time::sleep(Duration::from_secs(1)).await });
|
||||
assert_eq!(drop_tester, 2);
|
||||
spawn_essential_handle.spawn("task3", async { panic!("task failed") });
|
||||
spawn_essential_handle.spawn("task3", None, async { panic!("task failed") });
|
||||
runtime
|
||||
.block_on(task_manager.future())
|
||||
.expect_err("future()'s Result must be Err");
|
||||
@@ -226,10 +228,10 @@ fn ensure_children_tasks_ends_when_task_manager_terminated() {
|
||||
task_manager.add_child(child_2);
|
||||
let spawn_handle = task_manager.spawn_handle();
|
||||
let drop_tester = DropTester::new();
|
||||
spawn_handle.spawn("task1", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task2", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle_child_1.spawn("task3", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle_child_2.spawn("task4", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task1", None, run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task2", None, run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle_child_1.spawn("task3", None, run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle_child_2.spawn("task4", None, run_background_task(drop_tester.new_ref()));
|
||||
assert_eq!(drop_tester, 4);
|
||||
// allow the tasks to even start
|
||||
runtime.block_on(async { tokio::time::sleep(Duration::from_secs(1)).await });
|
||||
@@ -255,15 +257,15 @@ fn ensure_task_manager_future_ends_with_error_when_childs_essential_task_fails()
|
||||
task_manager.add_child(child_2);
|
||||
let spawn_handle = task_manager.spawn_handle();
|
||||
let drop_tester = DropTester::new();
|
||||
spawn_handle.spawn("task1", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task2", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle_child_1.spawn("task3", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle_child_2.spawn("task4", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task1", None, run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task2", None, run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle_child_1.spawn("task3", None, run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle_child_2.spawn("task4", None, run_background_task(drop_tester.new_ref()));
|
||||
assert_eq!(drop_tester, 4);
|
||||
// allow the tasks to even start
|
||||
runtime.block_on(async { tokio::time::sleep(Duration::from_secs(1)).await });
|
||||
assert_eq!(drop_tester, 4);
|
||||
spawn_essential_handle_child_1.spawn("task5", async { panic!("task failed") });
|
||||
spawn_essential_handle_child_1.spawn("task5", None, async { panic!("task failed") });
|
||||
runtime
|
||||
.block_on(task_manager.future())
|
||||
.expect_err("future()'s Result must be Err");
|
||||
@@ -286,15 +288,15 @@ fn ensure_task_manager_future_continues_when_childs_not_essential_task_fails() {
|
||||
task_manager.add_child(child_2);
|
||||
let spawn_handle = task_manager.spawn_handle();
|
||||
let drop_tester = DropTester::new();
|
||||
spawn_handle.spawn("task1", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task2", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle_child_1.spawn("task3", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle_child_2.spawn("task4", run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task1", None, run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle.spawn("task2", None, run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle_child_1.spawn("task3", None, run_background_task(drop_tester.new_ref()));
|
||||
spawn_handle_child_2.spawn("task4", None, run_background_task(drop_tester.new_ref()));
|
||||
assert_eq!(drop_tester, 4);
|
||||
// allow the tasks to even start
|
||||
runtime.block_on(async { tokio::time::sleep(Duration::from_secs(1)).await });
|
||||
assert_eq!(drop_tester, 4);
|
||||
spawn_handle_child_1.spawn("task5", async { panic!("task failed") });
|
||||
spawn_handle_child_1.spawn("task5", None, async { panic!("task failed") });
|
||||
runtime.block_on(async {
|
||||
let t1 = task_manager.future().fuse();
|
||||
let t2 = tokio::time::sleep(Duration::from_secs(3)).fuse();
|
||||
|
||||
Reference in New Issue
Block a user