From 8b799d404a8cae77bb6c9332b73b93e9fe13224c Mon Sep 17 00:00:00 2001 From: Jan-Erik Rediger Date: Fri, 24 May 2024 10:37:19 +0200 Subject: [PATCH] (Memory|Timing) Distribution: snapshot only contains non-zero buckets now **BREAKING CHANGE**: This changes the ping payload for memory/timing distributions. --- glean-core/src/histogram/functional.rs | 40 +------------------ glean-core/src/metrics/memory_distribution.rs | 2 +- glean-core/src/metrics/timing_distribution.rs | 6 +-- glean-core/tests/memory_distribution.rs | 2 - glean-core/tests/timing_distribution.rs | 2 - 5 files changed, 4 insertions(+), 48 deletions(-) diff --git a/glean-core/src/histogram/functional.rs b/glean-core/src/histogram/functional.rs index 64df9a1a4d..836c255089 100644 --- a/glean-core/src/histogram/functional.rs +++ b/glean-core/src/histogram/functional.rs @@ -85,44 +85,8 @@ impl Histogram { /// **Caution** This is a more specific implementation of `snapshot_values` on functional /// histograms. `snapshot_values` cannot be used with those, due to buckets not being /// precomputed. - pub fn snapshot(&self) -> HashMap { - if self.values.is_empty() { - return HashMap::new(); - } - - let mut min_key = None; - let mut max_key = None; - - // `Iterator#min` and `Iterator#max` would do the same job independently, - // but we want to avoid iterating the keys twice, so we loop ourselves. - for key in self.values.keys() { - let key = *key; - - // safe unwrap, we checked it's not none - if min_key.is_none() || key < min_key.unwrap() { - min_key = Some(key); - } - - // safe unwrap, we checked it's not none - if max_key.is_none() || key > max_key.unwrap() { - max_key = Some(key); - } - } - - // Non-empty values, therefore minimum/maximum exists. - // safe unwraps, we set it at least once. - let min_bucket = self.bucketing.sample_to_bucket_index(min_key.unwrap()); - let max_bucket = self.bucketing.sample_to_bucket_index(max_key.unwrap()) + 1; - - let mut values = self.values.clone(); - - for idx in min_bucket..=max_bucket { - // Fill in missing entries. - let min_bucket = self.bucketing.bucket_index_to_bucket_minimum(idx); - let _ = values.entry(min_bucket).or_insert(0); - } - - values + pub fn snapshot(&self) -> &HashMap { + &self.values } } diff --git a/glean-core/src/metrics/memory_distribution.rs b/glean-core/src/metrics/memory_distribution.rs index 7b5e5ee192..e18a934152 100644 --- a/glean-core/src/metrics/memory_distribution.rs +++ b/glean-core/src/metrics/memory_distribution.rs @@ -42,7 +42,7 @@ pub(crate) fn snapshot(hist: &Histogram) -> DistributionData { values: hist .snapshot() .into_iter() - .map(|(k, v)| (k as i64, v as i64)) + .map(|(&k, &v)| (k as i64, v as i64)) .collect(), sum: hist.sum() as i64, count: hist.count() as i64, diff --git a/glean-core/src/metrics/timing_distribution.rs b/glean-core/src/metrics/timing_distribution.rs index 28a47b1125..6ad6e51764 100644 --- a/glean-core/src/metrics/timing_distribution.rs +++ b/glean-core/src/metrics/timing_distribution.rs @@ -74,7 +74,7 @@ pub(crate) fn snapshot(hist: &Histogram) -> DistributionData { values: hist .snapshot() .into_iter() - .map(|(k, v)| (k as i64, v as i64)) + .map(|(&k, &v)| (k as i64, v as i64)) .collect(), sum: hist.sum() as i64, count: hist.count() as i64, @@ -585,7 +585,6 @@ mod test { "8": 1, "9": 1, "10": 1, - "11": 0, }, }); @@ -610,10 +609,7 @@ mod test { "values": { "1024": 2, "1116": 1, - "1217": 0, - "1327": 0, "1448": 1, - "1579": 0, }, }); diff --git a/glean-core/tests/memory_distribution.rs b/glean-core/tests/memory_distribution.rs index 83ca84ddd5..e81e7ecdbb 100644 --- a/glean-core/tests/memory_distribution.rs +++ b/glean-core/tests/memory_distribution.rs @@ -59,7 +59,6 @@ fn serializer_should_correctly_serialize_memory_distribution() { "sum": 100_000 * kb, "values": { "99108124": 1, - "103496016": 0, } }); assert_eq!( @@ -93,7 +92,6 @@ fn set_value_properly_sets_the_value_in_all_stores() { "sum": 100_000, "values": { "96785": 1, - "101070": 0, } }); for store_name in store_names { diff --git a/glean-core/tests/timing_distribution.rs b/glean-core/tests/timing_distribution.rs index 78dd53ad8b..2e87f3f5a9 100644 --- a/glean-core/tests/timing_distribution.rs +++ b/glean-core/tests/timing_distribution.rs @@ -64,7 +64,6 @@ fn serializer_should_correctly_serialize_timing_distribution() { "sum": duration, "values": { "58": 1, - "64": 0, } }); assert_eq!( @@ -102,7 +101,6 @@ fn set_value_properly_sets_the_value_in_all_stores() { "sum": 1, "values": { "1": 1, - "2": 0, } }); for store_name in store_names {