[pdm-devel] [PATCH proxmox-datacenter-manager v7 23/24] metric collection: allow to wait until completion when triggering collection manually
Lukas Wagner
l.wagner at proxmox.com
Tue Aug 26 15:51:18 CEST 2025
This allows us to request the latest metrics for a single remote in the
rrddata API calls, closing the gap in data the results from the longer
10min poll interval.
Signed-off-by: Lukas Wagner <l.wagner at proxmox.com>
---
Notes:
New in v7.
server/src/api/metric_collection.rs | 2 +-
server/src/api/remotes.rs | 2 +-
.../src/metric_collection/collection_task.rs | 16 +++++++++++-----
server/src/metric_collection/mod.rs | 18 +++++++++++++++---
4 files changed, 28 insertions(+), 10 deletions(-)
diff --git a/server/src/api/metric_collection.rs b/server/src/api/metric_collection.rs
index 845cc0e6..0658fb1f 100644
--- a/server/src/api/metric_collection.rs
+++ b/server/src/api/metric_collection.rs
@@ -34,7 +34,7 @@ const SUBDIRS: SubdirMap = &sorted!([
)]
/// Trigger metric collection for a provided remote or for all remotes if no remote is passed.
pub async fn trigger_metric_collection(remote: Option<String>) -> Result<(), Error> {
- crate::metric_collection::trigger_metric_collection(remote).await?;
+ crate::metric_collection::trigger_metric_collection(remote, false).await?;
Ok(())
}
diff --git a/server/src/api/remotes.rs b/server/src/api/remotes.rs
index c2489e60..033aa7c9 100644
--- a/server/src/api/remotes.rs
+++ b/server/src/api/remotes.rs
@@ -186,7 +186,7 @@ pub async fn add_remote(mut entry: Remote, create_token: Option<String>) -> Resu
pdm_config::remotes::save_config(&remotes)?;
- if let Err(e) = metric_collection::trigger_metric_collection(Some(name)).await {
+ if let Err(e) = metric_collection::trigger_metric_collection(Some(name), false).await {
log::error!("could not trigger metric collection after adding remote: {e}");
}
diff --git a/server/src/metric_collection/collection_task.rs b/server/src/metric_collection/collection_task.rs
index 1e23fa88..5f67d65d 100644
--- a/server/src/metric_collection/collection_task.rs
+++ b/server/src/metric_collection/collection_task.rs
@@ -41,7 +41,7 @@ pub const MIN_COLLECTION_INTERVAL: u64 = 10;
/// Control messages for the metric collection task.
pub(super) enum ControlMsg {
- TriggerMetricCollection(Option<String>),
+ TriggerMetricCollection(Option<String>, oneshot::Sender<()>),
}
/// Task which periodically collects metrics from all remotes and stores
@@ -136,20 +136,26 @@ impl MetricCollectionTask {
/// Handle a control message for force-triggered collection.
async fn handle_control_message(&mut self, message: ControlMsg) {
if let Some(remotes) = Self::load_remote_config() {
- match message {
- ControlMsg::TriggerMetricCollection(Some(remote)) => {
+ let done_tx = match message {
+ ControlMsg::TriggerMetricCollection(Some(remote), done_tx) => {
log::debug!("starting metric collection for remote '{remote}'- triggered by control message");
self.fetch_remotes(&remotes, &[remote]).await;
+ done_tx
}
- ControlMsg::TriggerMetricCollection(None) => {
+ ControlMsg::TriggerMetricCollection(None, done_tx) => {
log::debug!("starting metric collection from all remotes - triggered by control message");
let to_fetch = remotes
.iter()
.map(|(name, _)| name.into())
.collect::<Vec<String>>();
self.fetch_remotes(&remotes, &to_fetch).await;
+ done_tx
}
- }
+ };
+
+ // We don't care about the result, if the caller does not wait for the result, it
+ // might have dropped the receiver already.
+ let _ = done_tx.send(());
}
}
diff --git a/server/src/metric_collection/mod.rs b/server/src/metric_collection/mod.rs
index 2ddffda5..0e6860fc 100644
--- a/server/src/metric_collection/mod.rs
+++ b/server/src/metric_collection/mod.rs
@@ -5,6 +5,7 @@ use std::sync::OnceLock;
use anyhow::{bail, Error};
use nix::sys::stat::Mode;
use tokio::sync::mpsc::{self, Sender};
+use tokio::sync::oneshot;
use pdm_api_types::MetricCollectionStatus;
use pdm_buildcfg::PDM_STATE_DIR_M;
@@ -66,15 +67,26 @@ pub fn start_task() -> Result<(), Error> {
Ok(())
}
-/// Schedule metric collection for a given remote as soon as possible.
+/// Schedule metric collection as soon as possible.
+///
+/// If `remote` is `Some(String)`, then the remote with the given ID is
+/// collected. If remote is `None`, all remotes are scheduled for collection.
+/// If `wait` is `true`, this function waits for the completion of the requested
+/// metric collection run.
///
/// Has no effect if the tx end of the channel has not been initialized yet.
/// Returns an error if the mpsc channel has been closed already.
-pub async fn trigger_metric_collection(remote: Option<String>) -> Result<(), Error> {
+pub async fn trigger_metric_collection(remote: Option<String>, wait: bool) -> Result<(), Error> {
+ let (done_sender, done_receiver) = oneshot::channel();
+
if let Some(sender) = CONTROL_MESSAGE_TX.get() {
sender
- .send(ControlMsg::TriggerMetricCollection(remote))
+ .send(ControlMsg::TriggerMetricCollection(remote, done_sender))
.await?;
+
+ if wait {
+ done_receiver.await?;
+ }
}
Ok(())
--
2.47.2
More information about the pdm-devel
mailing list