Add TaskMonitor interval metrics w/ admin command.

Signed-off-by: Jason Volk <jason@zemos.net>
This commit is contained in:
Jason Volk
2026-03-02 02:10:55 +00:00
parent bf8ae48ec2
commit 9e75453303
6 changed files with 90 additions and 12 deletions

View File

@@ -1,9 +1,9 @@
use std::sync::atomic::{AtomicU32, AtomicU64};
use tokio::runtime;
use tokio_metrics::TaskMonitor;
#[cfg(tokio_unstable)]
use tokio_metrics::{RuntimeIntervals, RuntimeMonitor};
use tokio_metrics::{TaskMetrics, TaskMonitor};
pub struct Metrics {
_runtime: Option<runtime::Handle>,
@@ -12,6 +12,8 @@ pub struct Metrics {
task_monitor: Option<TaskMonitor>,
task_intervals: std::sync::Mutex<Option<Box<dyn Iterator<Item = TaskMetrics> + Send>>>,
#[cfg(tokio_unstable)]
_runtime_monitor: Option<RuntimeMonitor>,
@@ -27,21 +29,37 @@ pub struct Metrics {
impl Metrics {
#[must_use]
pub fn new(runtime: Option<runtime::Handle>) -> Self {
pub fn new(runtime: Option<&runtime::Handle>) -> Self {
#[cfg(tokio_unstable)]
let runtime_monitor = runtime.as_ref().map(RuntimeMonitor::new);
let runtime_monitor = runtime.map(RuntimeMonitor::new);
#[cfg(tokio_unstable)]
let runtime_intervals = runtime_monitor
.as_ref()
.map(RuntimeMonitor::intervals);
let task_monitor = cfg!(tokio_unstable).then(|| {
TaskMonitor::builder()
.with_slow_poll_threshold(TaskMonitor::DEFAULT_SLOW_POLL_THRESHOLD)
.with_long_delay_threshold(TaskMonitor::DEFAULT_LONG_DELAY_THRESHOLD)
.clone()
.build()
});
let task_intervals = task_monitor.as_ref().map(
|task_monitor| -> Box<dyn Iterator<Item = TaskMetrics> + Send> {
Box::new(task_monitor.intervals())
},
);
Self {
_runtime: runtime.clone(),
_runtime: runtime.cloned(),
runtime_metrics: runtime.as_ref().map(runtime::Handle::metrics),
runtime_metrics: runtime.map(runtime::Handle::metrics),
task_monitor: runtime.map(|_| TaskMonitor::new()),
task_monitor,
task_intervals: task_intervals.into(),
#[cfg(tokio_unstable)]
_runtime_monitor: runtime_monitor,
@@ -56,6 +74,26 @@ impl Metrics {
}
}
/// Awaits `f`, wrapping it with the task monitor when one is available.
///
/// If `task_metrics()` yields a monitor, the future is passed through the
/// monitor's `instrument` before being awaited; otherwise `f` is awaited
/// directly. The output of `f` is returned in both cases.
#[inline]
pub async fn instrument<F, Output>(&self, f: F) -> Output
where
    F: Future<Output = Output>,
{
    match self.task_metrics() {
        Some(monitor) => monitor.instrument(f).await,
        None => f.await,
    }
}
/// Advances the stored task-metrics interval iterator by one step.
///
/// Returns `None` when no iterator is stored, or when the stored iterator
/// itself yields `None`.
///
/// # Panics
///
/// Panics with the message `"locked"` if the mutex guarding the iterator
/// has been poisoned.
pub fn task_interval(&self) -> Option<TaskMetrics> {
    let mut intervals = self.task_intervals.lock().expect("locked");

    intervals.as_mut()?.next()
}
#[cfg(tokio_unstable)]
pub fn runtime_interval(&self) -> Option<tokio_metrics::RuntimeMetrics> {
self.runtime_intervals
@@ -66,15 +104,15 @@ impl Metrics {
.expect("next interval")
}
/// Borrows the task monitor, or returns `None` when none is stored.
#[inline]
pub fn task_root(&self) -> Option<&TaskMonitor> {
    self.task_monitor.as_ref()
}
#[inline]
pub fn num_workers(&self) -> usize {
self.runtime_metrics()
.map_or(0, runtime::RuntimeMetrics::num_workers)
}
/// Borrows the task monitor, or returns `None` when none is stored.
#[inline]
pub fn task_metrics(&self) -> Option<&TaskMonitor> {
    self.task_monitor.as_ref()
}
#[inline]
pub fn runtime_metrics(&self) -> Option<&runtime::RuntimeMetrics> {
self.runtime_metrics.as_ref()

View File

@@ -20,6 +20,7 @@ pub use ::jsonwebtoken as jwt;
pub use ::ruma;
pub use ::smallstr;
pub use ::smallvec;
pub use ::tokio_metrics;
pub use ::toml;
pub use ::tracing;
pub use config::Config;

View File

@@ -49,7 +49,7 @@ pub struct Server {
impl Server {
#[must_use]
pub fn new(config: Config, runtime: Option<runtime::Handle>, log: Logging) -> Self {
pub fn new(config: Config, runtime: Option<&runtime::Handle>, log: Logging) -> Self {
Self {
name: config.server_name.clone(),
config: config::Manager::new(config),
@@ -57,7 +57,7 @@ impl Server {
stopping: AtomicBool::new(false),
reloading: AtomicBool::new(false),
restarting: AtomicBool::new(false),
runtime: runtime.clone(),
runtime: runtime.cloned(),
signal: broadcast::channel::<&'static str>(1).0,
log,
metrics: Metrics::new(runtime),