Improve smooth load generator observability (open-telemetry#2766)

lquerel · web-flow · commit 685040edd2ef · 2026-04-28T18:42:35.000Z
# Change Summary

Improves smooth load generator pacing by computing batch intervals with
nanosecond precision and skipping missed ticks. Adds smooth-mode
observability for runs that fall behind, remaining work, tick lateness,
payload generation time, and send backpressure. Also adds the performance
experiment log and diagrams documenting the methodology and conclusions.

## What issue does this PR close?

* Closes #NNN

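## How are these changes tested?

Adds unit tests for the new batch interval computation:
`test_smooth_batch_interval_uses_sub_millisecond_precision` and
`test_smooth_batch_interval_does_not_overdrive_run`.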

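## Are there any user-facing changes?

Yes. The fake data generator receiver exposes new `smooth.*` metrics, and
smooth mode now supports sub-millisecond batch intervals instead of falling
back to open mode when the interval is below 1 ms.
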
diff --git a/rust/otap-dataflow/crates/core-nodes/src/receivers/fake_data_generator/metrics.rs b/rust/otap-dataflow/crates/core-nodes/src/receivers/fake_data_generator/metrics.rs
@@ -3,7 +3,7 @@
 
 //! Metrics for the OTLP Fake Signal Receiver node.
 
-use otap_df_telemetry::instrument::Counter;
+use otap_df_telemetry::instrument::{Counter, Gauge, Mmsc};
 use otap_df_telemetry_macros::metric_set;
 
 /// Pdata-oriented metrics for the OTAP PerfExporter.
@@ -19,4 +19,40 @@ pub struct FakeSignalReceiverMetrics {
     /// Number of metrics generated.
     #[metric(unit = "{metric}")]
     pub metrics_produced: Counter<u64>,
+    /// Number of smooth-mode production runs started.
+    #[metric(name = "smooth.runs.started", unit = "{run}")]
+    pub smooth_runs_started: Counter<u64>,
+    /// Number of smooth-mode production runs that completed before the next run tick.
+    #[metric(name = "smooth.runs.completed", unit = "{run}")]
+    pub smooth_runs_completed: Counter<u64>,
+    /// Number of smooth-mode production runs that still had work at the next run tick.
+    #[metric(name = "smooth.runs.behind", unit = "{run}")]
+    pub smooth_runs_behind: Counter<u64>,
+    /// Number of batches remaining when smooth mode detects that a run is behind.
+    #[metric(name = "smooth.behind.remaining.batches", unit = "{batch}")]
+    pub smooth_behind_remaining_batches: Mmsc,
+    /// Number of signal items remaining when smooth mode detects that a run is behind.
+    #[metric(name = "smooth.behind.remaining.items", unit = "{item}")]
+    pub smooth_behind_remaining_items: Mmsc,
+    /// Smooth-mode configured batches per one-second run.
+    #[metric(name = "smooth.run.batches", unit = "{batch}")]
+    pub smooth_run_batches: Gauge<u64>,
+    /// Smooth-mode configured interval between batches.
+    #[metric(name = "smooth.batch.interval", unit = "ns")]
+    pub smooth_batch_interval_ns: Gauge<u64>,
+    /// Lateness of smooth-mode batch ticks relative to their scheduled instant.
+    #[metric(name = "smooth.batch.tick.lateness.duration", unit = "ns")]
+    pub smooth_batch_tick_lateness_duration_ns: Mmsc,
+    /// Wall-clock time spent generating or cloning one smooth-mode payload.
+    #[metric(name = "smooth.payload.generate.duration", unit = "ns")]
+    pub smooth_payload_generate_duration_ns: Mmsc,
+    /// Wall-clock time spent sending one smooth-mode payload into the downstream channel.
+    #[metric(name = "smooth.payload.send.duration", unit = "ns")]
+    pub smooth_payload_send_duration_ns: Mmsc,
+    /// Number of smooth-mode payload send attempts rejected because the downstream channel was full.
+    #[metric(name = "smooth.payload.send.full", unit = "{attempt}")]
+    pub smooth_payload_send_full: Counter<u64>,
+    /// Number of smooth-mode payloads retried after a previous full-channel send.
+    #[metric(name = "smooth.payload.send.retry", unit = "{payload}")]
+    pub smooth_payload_send_retry: Counter<u64>,
 }
diff --git a/rust/otap-dataflow/crates/core-nodes/src/receivers/fake_data_generator/mod.rs b/rust/otap-dataflow/crates/core-nodes/src/receivers/fake_data_generator/mod.rs
@@ -32,7 +32,8 @@ use otap_df_telemetry::{otel_debug, otel_info, otel_warn};
 use serde_json::Value;
 use std::collections::HashMap;
 use std::sync::Arc;
-use tokio::time::{Duration, Interval, interval};
+use std::time::Instant as StdInstant;
+use tokio::time::{Duration, Interval, MissedTickBehavior, interval};
 
 use self::producer::{GenerateError, TrafficProducer};
 
@@ -53,6 +54,8 @@ pub mod static_signal;
 /// The URN for the fake data generator receiver
 pub const OTAP_FAKE_DATA_GENERATOR_URN: &str = "urn:otel:receiver:traffic_generator";
 
+const NANOS_PER_SECOND: u128 = 1_000_000_000;
+
 /// A Receiver that generates fake OTAP data for testing purposes.
 pub struct FakeGeneratorReceiver {
     /// Configuration for the fake data generator
@@ -62,6 +65,24 @@ pub struct FakeGeneratorReceiver {
     metrics: MetricSet<FakeSignalReceiverMetrics>,
 }
 
+fn smooth_batch_interval(run_len: usize) -> Option<Duration> {
+    if run_len == 0 {
+        return None;
+    }
+
+    let run_len = run_len as u128;
+    let nanos = NANOS_PER_SECOND.div_ceil(run_len);
+    u64::try_from(nanos).ok().map(Duration::from_nanos)
+}
+
+fn duration_nanos(duration: Duration) -> f64 {
+    duration.as_secs_f64() * 1e9
+}
+
+fn elapsed_nanos(start: StdInstant) -> f64 {
+    duration_nanos(start.elapsed())
+}
+
 /// Declares the fake data generator as a local receiver factory
 ///
 /// Unsafe code is temporarily used here to allow the use of `distributed_slice` macro
@@ -117,6 +138,7 @@ impl FakeGeneratorReceiver {
         transport_headers: Option<TransportHeaders>,
     ) -> Result<TerminalState, Error> {
         let mut run_produced: u64 = 0;
+        let mut next_pdata: Option<OtapPdata> = None;
 
         loop {
             producer.record_production(run_produced);
@@ -126,6 +148,9 @@ impl FakeGeneratorReceiver {
                 return wait_for_terminal(ctrl_msg_recv, handler, &mut self.metrics).await;
             };
 
+            self.metrics.smooth_runs_started.inc();
+            let mut run_completed = false;
+
             loop {
                 tokio::select! {
                     biased;
@@ -137,29 +162,83 @@ impl FakeGeneratorReceiver {
                     }
 
                     _ = run_ticker.tick() => {
-                        if current_run.len() > 0 {
+                        let remaining_batches = current_run.len() + usize::from(next_pdata.is_some());
+                        let remaining_items = current_run.remaining_signal_count()
+                            + next_pdata.as_ref().map_or(0, |pdata| pdata.num_items() as u64);
+                        if remaining_batches > 0 {
+                            self.metrics.smooth_runs_behind.inc();
+                            self.metrics
+                                .smooth_behind_remaining_batches
+                                .record(remaining_batches as f64);
+                            self.metrics
+                                .smooth_behind_remaining_items
+                                .record(remaining_items as f64);
                             otel_warn!(
                                 "Data generator is falling behind and didn't finish the current run. For highest
                                 possible throughput, use production_mode: open",
-                                remaining=current_run.len(),
+                                remaining=remaining_batches,
+                                remaining_items,
                             );
+                        } else if !run_completed {
+                            self.metrics.smooth_runs_completed.inc();
+                            run_completed = true;
+                        }
+
+                        if next_pdata.is_some() {
+                            continue;
                         }
+
                         break;
                     }
 
-                    _ = batch_ticker.tick() => {
+                    scheduled = batch_ticker.tick() => {
+                        let tick_lateness = tokio::time::Instant::now()
+                            .saturating_duration_since(scheduled);
+                        self.metrics
+                            .smooth_batch_tick_lateness_duration_ns
+                            .record(duration_nanos(tick_lateness));
 
-                        let Some(payload) = current_run.next() else {
-                            continue;
+                        let channel_result = match next_pdata.take() {
+                            Some(pdata) => {
+                                self.metrics.smooth_payload_send_retry.inc();
+                                let send_start = StdInstant::now();
+                                let result = self.export_pdata(handler, pdata)?;
+                                self.metrics
+                                    .smooth_payload_send_duration_ns
+                                    .record(elapsed_nanos(send_start));
+                                result
+                            }
+                            None => {
+                                let generate_start = StdInstant::now();
+                                let payload = current_run.next();
+
+                                let Some(payload) = payload else {
+                                    if !run_completed {
+                                        self.metrics.smooth_runs_completed.inc();
+                                        run_completed = true;
+                                    }
+                                    continue;
+                                };
+                                self.metrics
+                                    .smooth_payload_generate_duration_ns
+                                    .record(elapsed_nanos(generate_start));
+
+                                let send_start = StdInstant::now();
+                                let result = self.handle_payload(handler, payload, &transport_headers)?;
+                                self.metrics
+                                    .smooth_payload_send_duration_ns
+                                    .record(elapsed_nanos(send_start));
+                                result
+                            }
                         };
 
-                        let channel_result = self.handle_payload(handler, payload, &transport_headers)?;
                         match channel_result {
                             Ok(count) => {
                                 run_produced += count;
                             }
-                            Err(e) => {
-                                otel_warn!("Failed to push in smooth mode, skipping tick", err=?e);
+                            Err(pdata) => {
+                                self.metrics.smooth_payload_send_full.inc();
+                                next_pdata = Some(pdata);
                             }
                         }
                     }
@@ -448,18 +527,22 @@ impl local::Receiver<OtapPdata> for FakeGeneratorReceiver {
             .await?;
 
         let run_len = producer.run_len();
-        let batch_duration_millis = 1000u64.div_euclid(run_len as u64);
 
         // We consume one tick here because it's always immediately ready and would
         // make us think we're lagging;
         let mut run_ticker = interval(Duration::from_secs(1));
+        run_ticker.set_missed_tick_behavior(MissedTickBehavior::Skip);
         _ = run_ticker.tick().await;
 
         match self.config.get_traffic_config().production_mode {
             config::ProductionMode::Smooth => {
-                if batch_duration_millis > 0 {
-                    let batch_ticker =
-                        interval(Duration::from_millis(1000u64.div_euclid(run_len as u64)));
+                if let Some(batch_duration) = smooth_batch_interval(run_len) {
+                    self.metrics.smooth_run_batches.set(run_len as u64);
+                    self.metrics
+                        .smooth_batch_interval_ns
+                        .set(batch_duration.as_nanos() as u64);
+                    let mut batch_ticker = interval(batch_duration);
+                    batch_ticker.set_missed_tick_behavior(MissedTickBehavior::Skip);
                     self.run_smooth(
                         ctrl_msg_recv,
                         &effect_handler,
@@ -470,7 +553,9 @@ impl local::Receiver<OtapPdata> for FakeGeneratorReceiver {
                     )
                     .await
                 } else {
-                    otel_warn!("Falling back to Open production mode as batch interval is sub 1ms");
+                    otel_warn!(
+                        "Falling back to Open production mode because smooth batch interval is zero"
+                    );
                     self.run_open(
                         ctrl_msg_recv,
                         &effect_handler,
@@ -533,6 +618,21 @@ mod tests {
     const MAX_SIGNALS: u64 = 3;
     const MAX_BATCH: usize = 30;
 
+    #[test]
+    fn test_smooth_batch_interval_uses_sub_millisecond_precision() {
+        let interval = smooth_batch_interval(2000).expect("interval should exist");
+
+        assert_eq!(interval, Duration::from_micros(500));
+    }
+
+    #[test]
+    fn test_smooth_batch_interval_does_not_overdrive_run() {
+        let interval = smooth_batch_interval(88).expect("interval should exist");
+
+        assert!(interval * 88 >= Duration::from_secs(1));
+        assert!(interval * 87 < Duration::from_secs(1));
+    }
+
     /// Convert OtapPdata signal to OtlpProtoMessage for testing purposes.
     fn pdata_to_otlp_message(value: OtapPdata) -> OtlpProtoMessage {
         let otlp_bytes: OtlpProtoBytes = value
diff --git a/rust/otap-dataflow/crates/core-nodes/src/receivers/fake_data_generator/producer.rs b/rust/otap-dataflow/crates/core-nodes/src/receivers/fake_data_generator/producer.rs
@@ -201,6 +201,16 @@ pub struct TrafficRun<'a> {
     idx: usize,
 }
 
+impl TrafficRun<'_> {
+    /// The number of signals remaining in the current run.
+    #[must_use]
+    pub fn remaining_signal_count(&self) -> u64 {
+        (self.idx..self.strategy.len())
+            .map(|idx| self.strategy.size_at(idx) as u64)
+            .sum()
+    }
+}
+
 impl<'a> Iterator for TrafficRun<'a> {
     type Item = GenerateResult;