diff --git a/read_buffer/src/column/float.rs b/read_buffer/src/column/float.rs index 09f5f280ce..be4fb43abd 100644 --- a/read_buffer/src/column/float.rs +++ b/read_buffer/src/column/float.rs @@ -1,3 +1,5 @@ +use std::mem::size_of; + use arrow::{self, array::Array}; use super::encoding::{scalar::Fixed, scalar::FixedNull}; @@ -10,7 +12,7 @@ pub enum FloatEncoding { } impl FloatEncoding { - /// The total size in bytes of the store columnar data. + /// The total size in bytes of to store columnar data in memory. pub fn size(&self) -> usize { match self { Self::Fixed64(enc) => enc.size(), @@ -18,6 +20,19 @@ impl FloatEncoding { } } + /// The estimated total size in bytes of the underlying float values in the + /// column if they were stored contiguously and uncompressed. `include_nulls` + /// will effectively size each NULL value as 8b if `true`. + pub fn size_raw(&self, include_nulls: bool) -> usize { + match self { + // this will be the size of a Vec + Self::Fixed64(enc) => { + size_of::>() + (enc.num_rows() as usize * size_of::()) + } + Self::FixedNull64(enc) => enc.size_raw(include_nulls), + } + } + /// The total number of rows in the column. pub fn num_rows(&self) -> u32 { match self { @@ -212,3 +227,30 @@ impl From for FloatEncoding { Self::FixedNull64(FixedNull::::from(arr)) } } + +#[cfg(test)] +mod test { + use super::*; + + #[test] + fn size_raw() { + let enc = FloatEncoding::from(&[2.2, 22.2, 12.2, 31.2][..]); + // (4 * 8) + 24 + assert_eq!(enc.size_raw(true), 56); + assert_eq!(enc.size_raw(false), 56); + + let enc = FloatEncoding::FixedNull64(FixedNull::::from( + &[2.0, 2.02, 1.02, 3.01][..], + )); + // (4 * 8) + 24 + assert_eq!(enc.size_raw(true), 56); + assert_eq!(enc.size_raw(false), 56); + + let enc = FloatEncoding::FixedNull64(FixedNull::::from( + &[Some(2.0), Some(2.02), None, Some(1.02), Some(3.01)][..], + )); + // (5 * 8) + 24 + assert_eq!(enc.size_raw(true), 64); + assert_eq!(enc.size_raw(false), 56); + } +}