200 changes: 189 additions & 11 deletions bottlecap/src/traces/stats_concentrator.rs
@@ -1,38 +1,216 @@
use crate::config::Config;
use datadog_trace_protobuf::pb;
use std::time::{SystemTime, UNIX_EPOCH};
use std::{collections::HashMap, sync::Arc};
use tracing::error;

// Event sent to the stats concentrator
#[derive(Clone)]
pub struct StatsEvent {
pub time: u64,
pub aggregation_key: AggregationKey,
pub stats: Stats,
}

#[derive(Clone, Debug, PartialEq, Eq, Hash)]
pub struct AggregationKey {
pub env: String,
pub service: String,
// e.g. "aws.lambda.load", "aws.lambda.import"
pub name: String,
// e.g. "my-lambda-function-name", "datadog_lambda.handler", "urllib.request"
pub resource: String,
// e.g. "serverless"
pub r#type: String,
}

// Aggregated stats for a time interval across all the aggregation keys.
#[derive(Default)]
struct Bucket {
data: HashMap<AggregationKey, Stats>,
}

#[derive(Clone, Debug, Default, Copy)]
pub struct Stats {
pub hits: i32,
// in nanoseconds
pub duration: i64,
// error count
pub errors: i32,
pub top_level_hits: f64,
}

pub struct StatsConcentrator {
config: Arc<Config>,
buckets: HashMap<u64, Bucket>,
}

// The number of latest buckets to hold back from flushing when force is false.
// For example, if we have buckets with timestamps 10, 20, 40, the current timestamp is 45,
// and NO_FLUSH_BUCKET_COUNT is 3, then we will flush bucket 10 but not bucket 20 or 40.
// Note that bucket 30 counts as one of the 3 latest buckets even though it has no data.
// This reduces the chance of flushing stats that are still being collected, which saves some cost.
const NO_FLUSH_BUCKET_COUNT: u64 = 2;

const S_TO_NS: u64 = 1_000_000_000;
Contributor: probably already exists somewhere?

Contributor Author: It only exists in f64:

pub const S_TO_NS: f64 = 1_000_000_000.0;

I need to define another one in u64.
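
A minimal sketch (not from the PR) of why the integer constant matters: bucket timestamps are computed with u64 modular arithmetic, which an f64 constant cannot feed without lossy casts. bucket_start below is illustrative and mirrors get_bucket_timestamp in this file.

const S_TO_NS: u64 = 1_000_000_000;
const BUCKET_DURATION_NS: u64 = 10 * S_TO_NS;

// Integer truncation to the bucket boundary; no float rounding involved.
fn bucket_start(ts_ns: u64) -> u64 {
    ts_ns - ts_ns % BUCKET_DURATION_NS
}

fn main() {
    assert_eq!(bucket_start(45 * S_TO_NS), 40 * S_TO_NS);
}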


// The duration of a bucket in nanoseconds.
const BUCKET_DURATION_NS: u64 = 10 * S_TO_NS; // 10 seconds

// Aggregates stats into buckets, which are then pulled by the stats aggregator.
impl StatsConcentrator {
#[must_use]
pub fn new(config: Arc<Config>) -> Self {
Self {
config,
buckets: HashMap::new(),
}
}

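// Add a stats event to the bucket covering its timestamp, accumulating
// counters per aggregation key.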
pub fn add(&mut self, stats_event: StatsEvent) {
let bucket_timestamp = Self::get_bucket_timestamp(stats_event.time);
let bucket = self.buckets.entry(bucket_timestamp).or_default();

let stats = bucket.data.entry(stats_event.aggregation_key).or_default();

stats.hits += stats_event.stats.hits;
stats.errors += stats_event.stats.errors;
stats.duration += stats_event.stats.duration;
stats.top_level_hits += stats_event.stats.top_level_hits;
}

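// Truncate a nanosecond timestamp down to the start of its bucket.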
fn get_bucket_timestamp(timestamp: u64) -> u64 {
timestamp - timestamp % BUCKET_DURATION_NS
}

// force: If true, flush all stats. If false, flush stats except for the few latest
// buckets, which may still be getting data.
#[must_use]
pub fn flush(&mut self, force: bool) -> Vec<pb::ClientStatsPayload> {
let current_timestamp: u64 = match SystemTime::now().duration_since(UNIX_EPOCH) {
Ok(duration) => u64::try_from(duration.as_nanos()).unwrap_or_default(),
Err(e) => {
error!("Failed to get current timestamp: {e}, skipping stats flush");
return Vec::new();
}
};

let mut ret = Vec::new();
self.buckets.retain(|&timestamp, bucket| {
if force || Self::should_flush_bucket(current_timestamp, timestamp) {
// Flush and remove this bucket
for (aggregation_key, stats) in &bucket.data {
ret.push(Self::construct_stats_payload(
&self.config,
timestamp,
aggregation_key,
*stats,
));
}
false
} else {
// Keep this bucket
true
}
});

ret
}

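// A bucket may be flushed once it is at least NO_FLUSH_BUCKET_COUNT bucket durations old.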
fn should_flush_bucket(current_timestamp: u64, bucket_timestamp: u64) -> bool {
current_timestamp - bucket_timestamp >= BUCKET_DURATION_NS * NO_FLUSH_BUCKET_COUNT
}

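// Build one ClientStatsPayload for a single (bucket timestamp, aggregation key) pair.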
#[allow(clippy::cast_possible_truncation)]
#[allow(clippy::cast_sign_loss)]
fn construct_stats_payload(
config: &Config,
timestamp: u64,
aggregation_key: &AggregationKey,
stats: Stats,
) -> pb::ClientStatsPayload {
pb::ClientStatsPayload {
// TODO: handle this
Contributor Author (@lym953, Sep 23, 2025): Marking many fields with TODO so I can keep this PR small, iterate fast, and handle them in future PRs. Some of them may need code changes, while some may just need understanding work and updating the comment.

hostname: String::new(),
env: aggregation_key.env.clone(),
// Version is not in the trace payload. Need to read it from config.
version: config.version.clone().unwrap_or_default(),
// TODO: handle this
lang: "rust".to_string(),
// TODO: handle this
tracer_version: String::new(),
// TODO: handle this
runtime_id: String::new(),
// TODO: handle this
sequence: 0,
// TODO: handle this
agent_aggregation: String::new(),
service: aggregation_key.service.clone(),
// TODO: handle this
container_id: String::new(),
// TODO: handle this
tags: vec![],
// TODO: handle this
git_commit_sha: String::new(),
// TODO: handle this
image_tag: String::new(),
stats: vec![pb::ClientStatsBucket {
start: timestamp,
duration: BUCKET_DURATION_NS,
stats: vec![pb::ClientGroupedStats {
service: aggregation_key.service.clone(),
name: aggregation_key.name.clone(),
resource: aggregation_key.resource.clone(),
// TODO: handle this
http_status_code: 0,
r#type: aggregation_key.r#type.clone(),
// TODO: handle this
db_type: String::new(),
hits: stats.hits.try_into().unwrap_or_default(),
errors: stats.errors.try_into().unwrap_or_default(),
duration: stats.duration.try_into().unwrap_or_default(),
// TODO: handle this
ok_summary: vec![],
// TODO: handle this
error_summary: vec![],
// TODO: handle this
synthetics: false,
top_level_hits: stats.top_level_hits.round() as u64,
// TODO: handle this
span_kind: String::new(),
// TODO: handle this
peer_tags: vec![],
// TODO: handle this
is_trace_root: 1,
}],
// TODO: handle this
agent_time_shift: 0,
}],
}
}
}

#[cfg(test)]
mod tests {
use super::*;

#[test]
fn test_should_flush_bucket_false_when_not_enough_time_passed() {
let bucket_timestamp = 1_000_000_000;
let current_timestamp = bucket_timestamp + BUCKET_DURATION_NS * NO_FLUSH_BUCKET_COUNT - 1;
assert!(
!StatsConcentrator::should_flush_bucket(current_timestamp, bucket_timestamp),
"Should not flush when current_timestamp is less than threshold ahead"
);
}

#[test]
fn test_should_flush_bucket_true_when_later() {
let bucket_timestamp = 1_000_000_000;
let current_timestamp = bucket_timestamp + BUCKET_DURATION_NS * NO_FLUSH_BUCKET_COUNT + 1;
assert!(
StatsConcentrator::should_flush_bucket(current_timestamp, bucket_timestamp),
"Should flush when current_timestamp is greater than threshold"
);
}
}
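
A minimal usage sketch (not from the PR): it assumes an Arc<Config> is obtained elsewhere in bottlecap, and the event values are illustrative.

fn example(config: Arc<Config>) {
    let mut concentrator = StatsConcentrator::new(config);
    concentrator.add(StatsEvent {
        time: 1_700_000_000 * S_TO_NS, // a timestamp in ns since the epoch
        aggregation_key: AggregationKey {
            env: "prod".to_string(),
            service: "my-service".to_string(),
            name: "aws.lambda.load".to_string(),
            resource: "my-lambda-function-name".to_string(),
            r#type: "serverless".to_string(),
        },
        stats: Stats { hits: 1, duration: 5_000_000, errors: 0, top_level_hits: 1.0 },
    });
    // force = true flushes even the latest buckets, e.g. at the end of an invocation.
    let payloads = concentrator.flush(true);
    assert_eq!(payloads.len(), 1);
}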
18 changes: 16 additions & 2 deletions bottlecap/src/traces/stats_generator.rs
@@ -33,8 +33,22 @@ impl StatsGenerator
for span in &chunk.spans {
let stats = StatsEvent {
time: span.start.try_into().unwrap_or_default(),
aggregation_key: AggregationKey {
env: span.meta.get("env").cloned().unwrap_or_default(),
service: span.service.clone(),
name: span.name.clone(),
resource: span.resource.clone(),
r#type: span.r#type.clone(),
},
stats: Stats {
hits: 1,
errors: span.error,
duration: span.duration,
top_level_hits: span
.metrics
.get("_dd.top_level")
.map_or(0.0, |v| *v),
},
};
if let Err(err) = self.stats_concentrator.add(stats) {
error!("Failed to send trace stats: {err}");
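
For context, a minimal illustrative sketch (not from the PR) of a span carrying the fields the generator reads above. prost-generated pb types implement Default, so the remaining fields can be defaulted; all values are made up.

use std::collections::HashMap;

let mut meta = HashMap::new();
meta.insert("env".to_string(), "prod".to_string());
let mut metrics = HashMap::new();
metrics.insert("_dd.top_level".to_string(), 1.0);

let span = pb::Span {
    service: "my-service".to_string(),
    name: "aws.lambda.load".to_string(),
    resource: "my-lambda-function-name".to_string(),
    r#type: "serverless".to_string(),
    start: 1_700_000_000_000_000_000, // ns since the epoch
    duration: 5_000_000,              // 5 ms in ns
    error: 0,
    meta,
    metrics,
    ..Default::default()
};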