2020-04-06 13:28:02 +02:00
|
|
|
/********************************************************************************
|
|
|
|
* Prometheus exporter for monitoring network connectivity using icmp pings *
|
|
|
|
* *
|
|
|
|
* Copyright (C) 2019-2020 Jan Christian Grünhage *
|
|
|
|
* Copyright (C) 2020 Famedly GmbH *
|
|
|
|
* *
|
|
|
|
* This program is free software: you can redistribute it and/or modify *
|
|
|
|
* it under the terms of the GNU Affero General Public License as *
|
|
|
|
* published by the Free Software Foundation, either version 3 of the *
|
|
|
|
* License, or (at your option) any later version. *
|
|
|
|
* *
|
|
|
|
* This program is distributed in the hope that it will be useful, *
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of *
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the *
|
|
|
|
* GNU Affero General Public License for more details. *
|
|
|
|
* *
|
|
|
|
* You should have received a copy of the GNU Affero General Public License *
|
|
|
|
* along with this program. If not, see <https://www.gnu.org/licenses/>. *
|
|
|
|
********************************************************************************/
|
2020-04-06 12:56:39 +02:00
|
|
|
use crate::config::Config;
|
2021-04-23 09:08:55 +02:00
|
|
|
use anyhow::{Context, Result};
|
|
|
|
use async_anyhow_logger::catch;
|
2019-02-06 19:29:27 +01:00
|
|
|
use lazy_static::lazy_static;
|
2021-04-23 09:08:55 +02:00
|
|
|
use log::{info, trace};
|
2020-04-06 12:56:39 +02:00
|
|
|
use prometheus::*;
|
2020-04-06 20:29:46 +02:00
|
|
|
use std::net::IpAddr;
|
2020-04-06 12:56:39 +02:00
|
|
|
use std::time::Duration;
|
2020-04-08 12:01:19 +02:00
|
|
|
use tokio_ping::{PingFuture, Pinger};
|
2019-02-06 19:29:27 +01:00
|
|
|
|
|
|
|
lazy_static! {
    /// Histogram of ping round trip times, partitioned by the `target` label.
    ///
    /// Bucket upper bounds are given in milliseconds, ranging from 0.5 up to
    /// 2000.0.
    static ref PING_HISTOGRAM: HistogramVec = register_histogram_vec!(
        "ping_rtt_milliseconds",
        "The ping round trip time in milliseconds",
        &["target"],
        vec![
            0.5, 1.0, 5.0, 10.0, 15.0, 20.0, 25.0, 50.0, 75.0, 100.0, 150.0, 200.0, 250.0, 300.0,
            350.0, 400.0, 450.0, 500.0, 550.0, 600.0, 650.0, 700.0, 750.0, 800.0, 900.0, 1000.0,
            1250.0, 1500.0, 1750.0, 2000.0
        ]
    )
    // Registration failing here is a programming error (the name, label and
    // buckets are all static), so state that invariant instead of a bare unwrap.
    .expect("static histogram `ping_rtt_milliseconds` must be registrable");
}
|
|
|
|
|
2021-04-23 14:32:26 +02:00
|
|
|
pub(crate) async fn start_pinging_hosts(config: &Config) -> Result<()> {
|
2021-04-23 09:08:55 +02:00
|
|
|
let pinger = Pinger::new().await.context("Couldn't create pinger")?;
|
|
|
|
let mut handles = vec![];
|
2019-02-06 19:29:27 +01:00
|
|
|
for (host, interval) in config.hosts.clone() {
|
|
|
|
info!("Spawn ping task for {}", host);
|
2021-04-23 14:32:26 +02:00
|
|
|
handles.push(tokio::spawn(ping_host(pinger.clone(), host, interval)));
|
2019-02-06 19:29:27 +01:00
|
|
|
}
|
2021-04-23 09:08:55 +02:00
|
|
|
let (result, _, _) = futures::future::select_all(handles).await;
|
2021-04-23 14:32:26 +02:00
|
|
|
result??;
|
2020-04-06 12:56:39 +02:00
|
|
|
Ok(())
|
|
|
|
}
|
2020-04-06 20:29:46 +02:00
|
|
|
|
2021-04-23 09:08:55 +02:00
|
|
|
async fn ping_host(pinger: Pinger, host: IpAddr, interval: u64) -> Result<()> {
|
2020-04-08 12:01:19 +02:00
|
|
|
let mut pingchain = pinger.chain(host).timeout(Duration::from_secs(3));
|
2020-04-06 20:29:46 +02:00
|
|
|
let mut interval = tokio::time::interval(Duration::from_millis(interval));
|
2020-04-08 12:01:19 +02:00
|
|
|
let host_string = host.to_string();
|
2020-04-06 20:29:46 +02:00
|
|
|
loop {
|
|
|
|
interval.tick().await;
|
2021-04-23 09:08:55 +02:00
|
|
|
tokio::spawn(catch(handle_ping_result(
|
|
|
|
pingchain.send(),
|
|
|
|
host_string.clone(),
|
|
|
|
)));
|
2020-04-06 20:29:46 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-04-23 09:08:55 +02:00
|
|
|
async fn handle_ping_result(result: PingFuture, host: String) -> Result<()> {
|
|
|
|
let pong = result.await.context(format!("Couldn't ping {}", &host))?;
|
2020-04-06 20:29:46 +02:00
|
|
|
match pong {
|
|
|
|
Some(time) => {
|
|
|
|
let ms = time.as_millis();
|
|
|
|
trace!("Received pong from {} after {} ms", &host, &ms);
|
|
|
|
PING_HISTOGRAM
|
|
|
|
.with_label_values(&[&host])
|
|
|
|
.observe(ms as f64);
|
|
|
|
}
|
|
|
|
None => {
|
|
|
|
trace!("Received no response from {} within timeout", &host);
|
|
|
|
PING_HISTOGRAM.with_label_values(&[&host]).observe(3000.0);
|
|
|
|
}
|
|
|
|
};
|
2021-04-23 09:08:55 +02:00
|
|
|
|
|
|
|
Ok(())
|
2020-04-06 20:29:46 +02:00
|
|
|
}
|