Unverified Commit 8621ed28 authored by asynchronous rob's avatar asynchronous rob Committed by GitHub
Browse files

Separate metrics for messages sent & received (#2721)

* metered channel - sent & received

* Add for readouts

* metrics for both sent & received

* retract on send failure
parent e35b288d
Pipeline #130788 failed with stages
in 25 minutes and 8 seconds
...@@ -3879,6 +3879,7 @@ name = "metered-channel" ...@@ -3879,6 +3879,7 @@ name = "metered-channel"
version = "0.1.0" version = "0.1.0"
dependencies = [ dependencies = [
"assert_matches", "assert_matches",
"derive_more",
"futures 0.3.13", "futures 0.3.13",
"futures-timer 3.0.2", "futures-timer 3.0.2",
] ]
......
...@@ -8,6 +8,7 @@ description = "Channels with attached Meters" ...@@ -8,6 +8,7 @@ description = "Channels with attached Meters"
[dependencies] [dependencies]
futures = "0.3.12" futures = "0.3.12"
futures-timer = "3.0.2" futures-timer = "3.0.2"
derive_more = "0.99"
[dev-dependencies] [dev-dependencies]
assert_matches = "1.4.0" assert_matches = "1.4.0"
......
...@@ -54,8 +54,7 @@ impl<T> Stream for MeteredReceiver<T> { ...@@ -54,8 +54,7 @@ impl<T> Stream for MeteredReceiver<T> {
fn poll_next(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Option<Self::Item>> { fn poll_next(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Option<Self::Item>> {
match mpsc::Receiver::poll_next(Pin::new(&mut self.inner), cx) { match mpsc::Receiver::poll_next(Pin::new(&mut self.inner), cx) {
Poll::Ready(x) => { Poll::Ready(x) => {
// always use Ordering::SeqCst to avoid underflows self.meter.note_received();
self.meter.fill.fetch_sub(1, Ordering::SeqCst);
Poll::Ready(x) Poll::Ready(x)
} }
other => other, other => other,
...@@ -78,7 +77,7 @@ impl<T> MeteredReceiver<T> { ...@@ -78,7 +77,7 @@ impl<T> MeteredReceiver<T> {
pub fn try_next(&mut self) -> Result<Option<T>, mpsc::TryRecvError> { pub fn try_next(&mut self) -> Result<Option<T>, mpsc::TryRecvError> {
match self.inner.try_next()? { match self.inner.try_next()? {
Some(x) => { Some(x) => {
self.meter.fill.fetch_sub(1, Ordering::SeqCst); self.meter.note_received();
Ok(Some(x)) Ok(Some(x))
} }
None => Ok(None), None => Ok(None),
...@@ -131,17 +130,22 @@ impl<T> MeteredSender<T> { ...@@ -131,17 +130,22 @@ impl<T> MeteredSender<T> {
where where
Self: Unpin, Self: Unpin,
{ {
self.meter.fill.fetch_add(1, Ordering::SeqCst); self.meter.note_sent();
let fut = self.inner.send(item); let fut = self.inner.send(item);
futures::pin_mut!(fut); futures::pin_mut!(fut);
fut.await fut.await.map_err(|e| {
self.meter.retract_sent();
e
})
} }
/// Attempt to send message or fail immediately. /// Attempt to send message or fail immediately.
pub fn try_send(&mut self, msg: T) -> result::Result<(), mpsc::TrySendError<T>> { pub fn try_send(&mut self, msg: T) -> result::Result<(), mpsc::TrySendError<T>> {
self.inner.try_send(msg)?; self.meter.note_sent();
self.meter.fill.fetch_add(1, Ordering::SeqCst); self.inner.try_send(msg).map_err(|e| {
Ok(()) self.meter.retract_sent();
e
})
} }
} }
...@@ -159,7 +163,6 @@ impl<T> futures::sink::Sink<T> for MeteredSender<T> { ...@@ -159,7 +163,6 @@ impl<T> futures::sink::Sink<T> for MeteredSender<T> {
fn poll_close(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> { fn poll_close(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
match Pin::new(&mut self.inner).poll_close(cx) { match Pin::new(&mut self.inner).poll_close(cx) {
val @ Poll::Ready(_)=> { val @ Poll::Ready(_)=> {
self.meter.fill.store(0, Ordering::SeqCst);
val val
} }
other => other, other => other,
...@@ -169,7 +172,7 @@ impl<T> futures::sink::Sink<T> for MeteredSender<T> { ...@@ -169,7 +172,7 @@ impl<T> futures::sink::Sink<T> for MeteredSender<T> {
fn poll_flush(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> { fn poll_flush(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
match Pin::new(&mut self.inner).poll_flush(cx) { match Pin::new(&mut self.inner).poll_flush(cx) {
val @ Poll::Ready(_)=> { val @ Poll::Ready(_)=> {
self.meter.fill.fetch_add(1, Ordering::SeqCst); self.meter.note_sent();
val val
} }
other => other, other => other,
......
...@@ -24,6 +24,8 @@ use std::result; ...@@ -24,6 +24,8 @@ use std::result;
use std::sync::Arc; use std::sync::Arc;
use std::pin::Pin; use std::pin::Pin;
use derive_more::{Add, Display};
mod bounded; mod bounded;
mod unbounded; mod unbounded;
...@@ -35,22 +37,50 @@ pub use self::unbounded::*; ...@@ -35,22 +37,50 @@ pub use self::unbounded::*;
pub struct Meter { pub struct Meter {
/// Name of the receiver and sender pair. /// Name of the receiver and sender pair.
name: &'static str, name: &'static str,
// fill state of the channel // Number of sends on this channel.
fill: Arc<AtomicUsize>, sent: Arc<AtomicUsize>,
// Number of receives on this channel.
received: Arc<AtomicUsize>,
}
/// A readout of sizes from the meter. Note that it is possible, due to asynchrony, for received
/// to be slightly higher than sent.
#[derive(Debug, Add, Display, Clone, Default, PartialEq)]
#[display(fmt = "(sent={} received={})", sent, received)]
pub struct Readout {
/// The amount of messages sent on the channel, in aggregate.
pub sent: usize,
/// The amount of messages received on the channel, in aggregate.
pub received: usize,
} }
impl Meter { impl Meter {
/// Count the number of items queued up inside the channel. /// Count the number of items queued up inside the channel.
pub fn queue_count(&self) -> usize { pub fn read(&self) -> Readout {
// when obtaining we don't care much about off by one // when obtaining we don't care much about off by one
// accuracy // accuracy
self.fill.load(Ordering::Relaxed) Readout {
sent: self.sent.load(Ordering::Relaxed),
received: self.received.load(Ordering::Relaxed),
}
} }
/// Obtain the name of the channel `Sender` and `Receiver` pair. /// Obtain the name of the channel `Sender` and `Receiver` pair.
pub fn name(&self) -> &'static str { pub fn name(&self) -> &'static str {
self.name self.name
} }
fn note_sent(&self) {
self.sent.fetch_add(1, Ordering::Relaxed);
}
fn retract_sent(&self) {
self.sent.fetch_sub(1, Ordering::Relaxed);
}
fn note_received(&self) {
self.received.fetch_add(1, Ordering::Relaxed);
}
} }
#[cfg(test)] #[cfg(test)]
...@@ -69,20 +99,20 @@ mod tests { ...@@ -69,20 +99,20 @@ mod tests {
block_on(async move { block_on(async move {
let (mut tx, mut rx) = channel::<Msg>(5, "goofy"); let (mut tx, mut rx) = channel::<Msg>(5, "goofy");
let msg = Msg::default(); let msg = Msg::default();
assert_eq!(rx.meter().queue_count(), 0); assert_eq!(rx.meter().read(), Readout { sent: 0, received: 0 });
tx.try_send(msg).unwrap(); tx.try_send(msg).unwrap();
assert_eq!(tx.meter().queue_count(), 1); assert_eq!(tx.meter().read(), Readout { sent: 1, received: 0 });
tx.try_send(msg).unwrap(); tx.try_send(msg).unwrap();
tx.try_send(msg).unwrap(); tx.try_send(msg).unwrap();
tx.try_send(msg).unwrap(); tx.try_send(msg).unwrap();
assert_eq!(tx.meter().queue_count(), 4); assert_eq!(tx.meter().read(), Readout { sent: 4, received: 0 });
rx.try_next().unwrap(); rx.try_next().unwrap();
assert_eq!(rx.meter().queue_count(), 3); assert_eq!(rx.meter().read(), Readout { sent: 4, received: 1 });
rx.try_next().unwrap(); rx.try_next().unwrap();
rx.try_next().unwrap(); rx.try_next().unwrap();
assert_eq!(tx.meter().queue_count(), 1); assert_eq!(tx.meter().read(), Readout { sent: 4, received: 3 });
rx.try_next().unwrap(); rx.try_next().unwrap();
assert_eq!(rx.meter().queue_count(), 0); assert_eq!(rx.meter().read(), Readout { sent: 4, received: 4 });
assert!(rx.try_next().is_err()); assert!(rx.try_next().is_err());
}); });
} }
...@@ -96,9 +126,9 @@ mod tests { ...@@ -96,9 +126,9 @@ mod tests {
futures::join!( futures::join!(
async move { async move {
let msg = Msg::default(); let msg = Msg::default();
assert_eq!(tx.meter().queue_count(), 0); assert_eq!(tx.meter().read(), Readout { sent: 0, received: 0 });
tx.try_send(msg).unwrap(); tx.try_send(msg).unwrap();
assert_eq!(tx.meter().queue_count(), 1); assert_eq!(tx.meter().read(), Readout { sent: 1, received: 0 });
tx.try_send(msg).unwrap(); tx.try_send(msg).unwrap();
tx.try_send(msg).unwrap(); tx.try_send(msg).unwrap();
tx.try_send(msg).unwrap(); tx.try_send(msg).unwrap();
...@@ -106,14 +136,14 @@ mod tests { ...@@ -106,14 +136,14 @@ mod tests {
}, },
async move { async move {
go.await.expect("Helper oneshot channel must work. qed"); go.await.expect("Helper oneshot channel must work. qed");
assert_eq!(rx.meter().queue_count(), 4); assert_eq!(rx.meter().read(), Readout { sent: 4, received: 0 });
rx.try_next().unwrap(); rx.try_next().unwrap();
assert_eq!(rx.meter().queue_count(), 3); assert_eq!(rx.meter().read(), Readout { sent: 4, received: 1 });
rx.try_next().unwrap(); rx.try_next().unwrap();
rx.try_next().unwrap(); rx.try_next().unwrap();
assert_eq!(rx.meter().queue_count(), 1); assert_eq!(rx.meter().read(), Readout { sent: 4, received: 3 });
rx.try_next().unwrap(); rx.try_next().unwrap();
assert_eq!(dbg!(rx.meter().queue_count()), 0); assert_eq!(dbg!(rx.meter().read()), Readout { sent: 4, received: 4 });
} }
) )
}); });
...@@ -130,21 +160,37 @@ mod tests { ...@@ -130,21 +160,37 @@ mod tests {
futures::join!( futures::join!(
async move { async move {
for i in 0..15 { for i in 0..15 {
println!("Sent #{} with a backlog of {} items", i + 1, tx.meter().queue_count()); println!("Sent #{} with a backlog of {} items", i + 1, tx.meter().read());
let msg = Msg { val: i as u8 + 1u8 }; let msg = Msg { val: i as u8 + 1u8 };
tx.send(msg).await.unwrap(); tx.send(msg).await.unwrap();
assert!(tx.meter().queue_count() > 0usize); assert!(tx.meter().read().sent > 0usize);
Delay::new(Duration::from_millis(20)).await; Delay::new(Duration::from_millis(20)).await;
} }
() ()
}, },
async move { async move {
while let Some(msg) = rx.next().await { while let Some(msg) = rx.next().await {
println!("rx'd one {} with {} backlogged", msg.val, rx.meter().queue_count()); println!("rx'd one {} with {} backlogged", msg.val, rx.meter().read());
Delay::new(Duration::from_millis(29)).await; Delay::new(Duration::from_millis(29)).await;
} }
} }
) )
}); });
} }
#[test]
fn failed_send_does_not_inc_sent() {
let (mut bounded, _) = channel::<Msg>(5, "pluto");
let (mut unbounded, _) = unbounded::<Msg>("pluto");
block_on(async move {
assert!(bounded.send(Msg::default()).await.is_err());
assert!(bounded.try_send(Msg::default()).is_err());
assert_eq!(bounded.meter().read(), Readout { sent: 0, received: 0 });
assert!(unbounded.send(Msg::default()).await.is_err());
assert!(unbounded.unbounded_send(Msg::default()).is_err());
assert_eq!(unbounded.meter().read(), Readout { sent: 0, received: 0 });
});
}
} }
...@@ -54,8 +54,7 @@ impl<T> Stream for UnboundedMeteredReceiver<T> { ...@@ -54,8 +54,7 @@ impl<T> Stream for UnboundedMeteredReceiver<T> {
fn poll_next(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Option<Self::Item>> { fn poll_next(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Option<Self::Item>> {
match mpsc::UnboundedReceiver::poll_next(Pin::new(&mut self.inner), cx) { match mpsc::UnboundedReceiver::poll_next(Pin::new(&mut self.inner), cx) {
Poll::Ready(x) => { Poll::Ready(x) => {
// always use Ordering::SeqCst to avoid underflows self.meter.note_received();
self.meter.fill.fetch_sub(1, Ordering::SeqCst);
Poll::Ready(x) Poll::Ready(x)
} }
other => other, other => other,
...@@ -78,7 +77,7 @@ impl<T> UnboundedMeteredReceiver<T> { ...@@ -78,7 +77,7 @@ impl<T> UnboundedMeteredReceiver<T> {
pub fn try_next(&mut self) -> Result<Option<T>, mpsc::TryRecvError> { pub fn try_next(&mut self) -> Result<Option<T>, mpsc::TryRecvError> {
match self.inner.try_next()? { match self.inner.try_next()? {
Some(x) => { Some(x) => {
self.meter.fill.fetch_sub(1, Ordering::SeqCst); self.meter.note_received();
Ok(Some(x)) Ok(Some(x))
} }
None => Ok(None), None => Ok(None),
...@@ -131,18 +130,23 @@ impl<T> UnboundedMeteredSender<T> { ...@@ -131,18 +130,23 @@ impl<T> UnboundedMeteredSender<T> {
where where
Self: Unpin, Self: Unpin,
{ {
self.meter.fill.fetch_add(1, Ordering::SeqCst); self.meter.note_sent();
let fut = self.inner.send(item); let fut = self.inner.send(item);
futures::pin_mut!(fut); futures::pin_mut!(fut);
fut.await fut.await.map_err(|e| {
self.meter.retract_sent();
e
})
} }
/// Attempt to send message or fail immediately. /// Attempt to send message or fail immediately.
pub fn unbounded_send(&mut self, msg: T) -> result::Result<(), mpsc::TrySendError<T>> { pub fn unbounded_send(&mut self, msg: T) -> result::Result<(), mpsc::TrySendError<T>> {
self.inner.unbounded_send(msg)?; self.meter.note_sent();
self.meter.fill.fetch_add(1, Ordering::SeqCst); self.inner.unbounded_send(msg).map_err(|e| {
Ok(()) self.meter.retract_sent();
e
})
} }
} }
...@@ -160,7 +164,6 @@ impl<T> futures::sink::Sink<T> for UnboundedMeteredSender<T> { ...@@ -160,7 +164,6 @@ impl<T> futures::sink::Sink<T> for UnboundedMeteredSender<T> {
fn poll_close(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> { fn poll_close(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
match Pin::new(&mut self.inner).poll_ready(cx) { match Pin::new(&mut self.inner).poll_ready(cx) {
val @ Poll::Ready(_)=> { val @ Poll::Ready(_)=> {
self.meter.fill.store(0, Ordering::SeqCst);
val val
} }
other => other, other => other,
...@@ -170,7 +173,7 @@ impl<T> futures::sink::Sink<T> for UnboundedMeteredSender<T> { ...@@ -170,7 +173,7 @@ impl<T> futures::sink::Sink<T> for UnboundedMeteredSender<T> {
fn poll_flush(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> { fn poll_flush(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Result<(), Self::Error>> {
match Pin::new(&mut self.inner).poll_ready(cx) { match Pin::new(&mut self.inner).poll_ready(cx) {
val @ Poll::Ready(_)=> { val @ Poll::Ready(_)=> {
self.meter.fill.fetch_add(1, Ordering::SeqCst); self.meter.note_sent();
val val
} }
other => other, other => other,
......
...@@ -1327,8 +1327,10 @@ struct MetricsInner { ...@@ -1327,8 +1327,10 @@ struct MetricsInner {
deactivated_heads_total: prometheus::Counter<prometheus::U64>, deactivated_heads_total: prometheus::Counter<prometheus::U64>,
messages_relayed_total: prometheus::Counter<prometheus::U64>, messages_relayed_total: prometheus::Counter<prometheus::U64>,
message_relay_timings: prometheus::Histogram, message_relay_timings: prometheus::Histogram,
to_overseer_channel_queue_size: prometheus::Gauge<prometheus::U64>, to_overseer_sent: prometheus::Gauge<prometheus::U64>,
from_overseer_channel_queue_size: prometheus::GaugeVec<prometheus::U64>, to_overseer_received: prometheus::Gauge<prometheus::U64>,
from_overseer_sent: prometheus::GaugeVec<prometheus::U64>,
from_overseer_received: prometheus::GaugeVec<prometheus::U64>,
} }
#[derive(Default, Clone)] #[derive(Default, Clone)]
...@@ -1360,15 +1362,21 @@ impl Metrics { ...@@ -1360,15 +1362,21 @@ impl Metrics {
fn channel_fill_level_snapshot( fn channel_fill_level_snapshot(
&self, &self,
from_overseer: AllSubsystemsSame<(&'static str, usize)>, from_overseer: AllSubsystemsSame<(&'static str, metered::Readout)>,
to_overseer: usize, to_overseer: metered::Readout,
) { ) {
self.0.as_ref().map(|metrics| { self.0.as_ref().map(|metrics| {
from_overseer.map_subsystems(|(name, queue_size): (_, usize)| { from_overseer.map_subsystems(|(name, readout): (_, metered::Readout)| {
metrics.from_overseer_channel_queue_size.with_label_values(&[name]).set(queue_size as u64); metrics.from_overseer_sent.with_label_values(&[name])
}) .set(readout.sent as u64);
metrics.from_overseer_received.with_label_values(&[name])
.set(readout.received as u64);
});
metrics.to_overseer_sent.set(to_overseer.sent as u64);
metrics.to_overseer_received.set(to_overseer.received as u64);
}); });
self.0.as_ref().map(|metrics| metrics.to_overseer_channel_queue_size.set(to_overseer as u64));
} }
} }
...@@ -1418,11 +1426,23 @@ impl metrics::Metrics for Metrics { ...@@ -1418,11 +1426,23 @@ impl metrics::Metrics for Metrics {
)?, )?,
registry, registry,
)?, )?,
from_overseer_channel_queue_size: prometheus::register( from_overseer_sent: prometheus::register(
prometheus::GaugeVec::<prometheus::U64>::new(
prometheus::Opts::new(
"parachain_from_overseer_sent",
"Number of elements sent by the overseer to subsystems",
),
&[
"subsystem_name",
],
)?,
registry,
)?,
from_overseer_received: prometheus::register(
prometheus::GaugeVec::<prometheus::U64>::new( prometheus::GaugeVec::<prometheus::U64>::new(
prometheus::Opts::new( prometheus::Opts::new(
"parachain_from_overseer_channel_queue_size", "parachain_from_overseer_received",
"Number of elements sitting in the channel from the overseer waiting to be processed.", "Number of elements received by subsystems from overseer",
), ),
&[ &[
"subsystem_name", "subsystem_name",
...@@ -1430,11 +1450,20 @@ impl metrics::Metrics for Metrics { ...@@ -1430,11 +1450,20 @@ impl metrics::Metrics for Metrics {
)?, )?,
registry, registry,
)?, )?,
to_overseer_channel_queue_size: prometheus::register( to_overseer_sent: prometheus::register(
prometheus::Gauge::<prometheus::U64>::with_opts(
prometheus::Opts::new(
"parachain_to_overseer_sent",
"Number of elements sent by subsystems to overseer",
),
)?,
registry,
)?,
to_overseer_received: prometheus::register(
prometheus::Gauge::<prometheus::U64>::with_opts( prometheus::Gauge::<prometheus::U64>::with_opts(
prometheus::Opts::new( prometheus::Opts::new(
"parachain_to_overseer_channel_queue_size", "parachain_to_overseer_received",
"Number of elements sitting in the channel to the overseer waiting to be processed.", "Number of element received by overseer from subsystems",
), ),
)?, )?,
registry, registry,
...@@ -1820,14 +1849,14 @@ where ...@@ -1820,14 +1849,14 @@ where
let metronome = Metronome::new(std::time::Duration::from_millis(950)) let metronome = Metronome::new(std::time::Duration::from_millis(950))
.for_each(move |_| { .for_each(move |_| {
let to_subsystem_counts = subsystem_meters.as_ref() let to_subsystem_counts = subsystem_meters.as_ref()
.map_subsystems(|&(name, ref meter): &(_, metered::Meter)| (name, meter.queue_count())); .map_subsystems(|&(name, ref meter): &(_, metered::Meter)| (name, meter.read()));
// We combine the amount of messages from subsystems to the overseer // We combine the amount of messages from subsystems to the overseer
// as well as the amount of messages from external sources to the overseer // as well as the amount of messages from external sources to the overseer
// into one to_overseer value. // into one to_overseer value.
metronome_metrics.channel_fill_level_snapshot( metronome_metrics.channel_fill_level_snapshot(
to_subsystem_counts, to_subsystem_counts,
meter_subsystem_to_overseer.queue_count() + meter_external_to_overseer.queue_count(), meter_subsystem_to_overseer.read() + meter_external_to_overseer.read(),
); );
async move { async move {
...@@ -2467,7 +2496,8 @@ mod tests { ...@@ -2467,7 +2496,8 @@ mod tests {
assert_eq!(gather[1].get_name(), "parachain_deactivated_heads_total"); assert_eq!(gather[1].get_name(), "parachain_deactivated_heads_total");
assert_eq!(gather[2].get_name(), "parachain_messages_relayed_total"); assert_eq!(gather[2].get_name(), "parachain_messages_relayed_total");
assert_eq!(gather[3].get_name(), "parachain_overseer_messages_relay_timings"); assert_eq!(gather[3].get_name(), "parachain_overseer_messages_relay_timings");
assert_eq!(gather[4].get_name(), "parachain_to_overseer_channel_queue_size"); assert_eq!(gather[4].get_name(), "parachain_to_overseer_received");
assert_eq!(gather[5].get_name(), "parachain_to_overseer_sent");
let activated = gather[0].get_metric()[0].get_counter().get_value() as u64; let activated = gather[0].get_metric()[0].get_counter().get_value() as u64;
let deactivated = gather[1].get_metric()[0].get_counter().get_value() as u64; let deactivated = gather[1].get_metric()[0].get_counter().get_value() as u64;
let relayed = gather[2].get_metric()[0].get_counter().get_value() as u64; let relayed = gather[2].get_metric()[0].get_counter().get_value() as u64;
......
Supports Markdown
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment