diff --git a/read_buffer/src/column.rs b/read_buffer/src/column.rs
index 2a78bc0309..6109ccc19b 100644
--- a/read_buffer/src/column.rs
+++ b/read_buffer/src/column.rs
@@ -15,7 +15,7 @@ use arrow::array::Array;
 use crate::schema::LogicalDataType;
 use crate::value::{EncodedValues, OwnedValue, Scalar, Value, Values};
 use boolean::BooleanEncoding;
-use encoding::{bool, scalar};
+use encoding::bool;
 use float::FloatEncoding;
 use integer::IntegerEncoding;
 use string::StringEncoding;
@@ -1088,13 +1088,13 @@ impl From<arrow::array::Float64Array> for Column {
             _ => unreachable!("min/max must both be Some or None"),
         };
 
-        let data = scalar::FixedNull::<arrow::datatypes::Float64Type>::from(arr);
+        let data = FloatEncoding::from(arr);
         let meta = MetaData {
             range,
             ..MetaData::default()
         };
 
-        Self::Float(meta, FloatEncoding::FixedNull64(data))
+        Self::Float(meta, data)
     }
 }
 
@@ -1285,6 +1285,7 @@ impl RowIDs {
         }
     }
 
+    // Add all row IDs in the domain `[from, to)` to the collection.
     pub fn add_range(&mut self, from: u32, to: u32) {
         match self {
             Self::Bitmap(ids) => ids.add_range(from as u64..to as u64),
diff --git a/read_buffer/src/column/cmp.rs b/read_buffer/src/column/cmp.rs
index 63a6e84896..0f12aff66a 100644
--- a/read_buffer/src/column/cmp.rs
+++ b/read_buffer/src/column/cmp.rs
@@ -1,4 +1,4 @@
-use std::convert::TryFrom;
+use std::{convert::TryFrom, fmt::Display};
 
 /// Possible comparison operators
 #[derive(Debug, PartialEq, Copy, Clone)]
@@ -12,6 +12,23 @@ pub enum Operator {
     LTE,
 }
 
+impl Display for Operator {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        write!(
+            f,
+            "{}",
+            match self {
+                Self::Equal => "=",
+                Self::NotEqual => "!=",
+                Self::GT => ">",
+                Self::GTE => ">=",
+                Self::LT => "<",
+                Self::LTE => "<=",
+            }
+        )
+    }
+}
+
 impl TryFrom<&str> for Operator {
     type Error = String;
 
diff --git a/read_buffer/src/column/encoding/scalar.rs b/read_buffer/src/column/encoding/scalar.rs
index ff8442dd93..e281d64858 100644
--- a/read_buffer/src/column/encoding/scalar.rs
+++ b/read_buffer/src/column/encoding/scalar.rs
@@ -1,5 +1,7 @@
 pub mod fixed;
 pub mod fixed_null;
+pub mod rle;
 
 pub use fixed::Fixed;
 pub use fixed_null::FixedNull;
+pub use rle::RLE;
diff --git a/read_buffer/src/column/encoding/scalar/rle.rs b/read_buffer/src/column/encoding/scalar/rle.rs
new file mode 100644
index 0000000000..a30b038702
--- /dev/null
+++ b/read_buffer/src/column/encoding/scalar/rle.rs
@@ -0,0 +1,1082 @@
+use crate::column::cmp;
+use crate::column::RowIDs;
+use std::{
+    cmp::Ordering,
+    fmt::{Debug, Display},
+    iter,
+    mem::size_of,
+};
+
+pub const ENCODING_NAME: &str = "RLE";
+
+#[allow(clippy::upper_case_acronyms)] // this looks weird as `Rle`
+/// An RLE encoding is one where identical "runs" of values in the column are
+/// stored as a tuple: `(run_length, value)`, where `run_length` indicates the
+/// number of times the value is to be repeated.
+#[derive(Debug, Default)]
+pub struct RLE<T>
+where
+    T: PartialOrd + Debug,
+{
+    // stores tuples of run-lengths. Each value is repeats the total number of
+    // times the second value should is repeated within the column.
+    //
+    // TODO(edd): can likely improve on 4B for run-length storage
+    //
+    // TODO(edd): Option<T> effectively doubles the size of storing `T` for many
+    //            `T`. I am not overly concerned about this right now because of
+    //            the massive savings the encoding can already provide. Further
+    //            when `T` is a `NonZeroX` then we get the niche optimisation
+    //            that makes `Option<T>` the same size as `T`.
+    //
+    //            For floats I plan to implement a check that will allow us to
+    //            store them as integers if they're natural numbers, then we can
+    //            make use of `Option<NonZeroX>` with no option overhead. If
+    //            they're not all natural numbers then I think we could make a
+    //            `NonZeroNaN` and perhaps figure out how to get `Option<NonZeroNan>`
+    //            to have no overhead.
+    //
+    // TODO(edd): another obvious thing that might be worth doing in the future
+    //            is to store all the run-lengths contiguously rather than in
+    //            `Vec<(,)>`. One advantage of this is that it is possible to
+    //            avoid a tuple "overhead" when there is only a single
+    //            occurrence of a value by using a specific marker to represent
+    //            when something is a run-length or something is just a single
+    //            value.
+    run_lengths: Vec<(u32, Option<T>)>,
+
+    // number of NULL values in the column
+    null_count: u32,
+
+    // number of total logical rows (values) in the columns.
+    num_rows: u32,
+}
+
+impl<T> std::fmt::Display for RLE<T>
+where
+    T: std::fmt::Debug + Display + PartialOrd + Copy,
+{
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        write!(
+            f,
+            "[{}] size: {:?} rows: {:?} nulls: {} runs: {} ",
+            self.name(),
+            self.size(),
+            self.num_rows(),
+            self.null_count(),
+            self.run_lengths.len()
+        )
+    }
+}
+
+impl<T: PartialOrd + Debug + Copy> RLE<T> {
+    /// The name of this encoding.
+    pub fn name(&self) -> &'static str {
+        ENCODING_NAME
+    }
+
+    /// A reasonable estimation of the on-heap size this encoding takes up.
+    pub fn size(&self) -> usize {
+        std::mem::size_of::<Self>() + (self.run_lengths.len() * size_of::<(u32, Option<T>)>())
+    }
+
+    /// The estimated total size in bytes of the underlying values in the
+    /// column if they were stored contiguously and uncompressed. `include_nulls`
+    /// will effectively size each NULL value as size_of<T> if set to `true`.
+    pub fn size_raw(&self, include_nulls: bool) -> usize {
+        let base_size = size_of::<Self>();
+        if include_nulls {
+            return base_size + (self.num_rows() as usize * size_of::<Option<T>>());
+        }
+
+        // remove NULL values from calculation
+        base_size
+            + self
+                .run_lengths
+                .iter()
+                .filter_map(|(rl, v)| v.is_some().then(|| *rl as usize * size_of::<Option<T>>()))
+                .sum::<usize>()
+    }
+
+    /// The number of NULL values in this column.
+    pub fn null_count(&self) -> u32 {
+        self.null_count
+    }
+
+    /// The number of logical rows encoded in this column.
+    pub fn num_rows(&self) -> u32 {
+        self.num_rows
+    }
+
+    /// Determine if NULL is encoded in the column.
+    pub fn contains_null(&self) -> bool {
+        self.null_count() > 0
+    }
+
+    //
+    //
+    // ---- Helper methods for constructing an instance of the encoding
+    //
+    //
+
+    /// Adds the provided string value to the encoded data. It is the caller's
+    /// responsibility to ensure that the dictionary encoded remains sorted.
+    pub fn push(&mut self, v: T) {
+        self.push_additional(Some(v), 1);
+    }
+
+    /// Adds a NULL value to the encoded data. It is the caller's
+    /// responsibility to ensure that the dictionary encoded remains sorted.
+    pub fn push_none(&mut self) {
+        self.push_additional(None, 1);
+    }
+
+    /// Adds additional repetitions of the provided value to the encoded data.
+    /// It is the caller's responsibility to ensure that the dictionary encoded
+    /// remains sorted.
+    pub fn push_additional(&mut self, v: Option<T>, additional: u32) {
+        match v {
+            Some(v) => self.push_additional_some(v, additional),
+            None => self.push_additional_none(additional),
+        }
+    }
+
+    fn push_additional_some(&mut self, v: T, additional: u32) {
+        if let Some((rl, rlv)) = self.run_lengths.last_mut() {
+            if rlv.as_ref() == Some(&v) {
+                *rl += additional; // update run-length
+            } else {
+                // new run-length
+                self.run_lengths.push((additional, Some(v)));
+            }
+        } else {
+            //First entry in the encoding
+            self.run_lengths.push((additional, Some(v)));
+        }
+
+        self.num_rows += additional;
+    }
+
+    fn push_additional_none(&mut self, additional: u32) {
+        if let Some((rl, v)) = self.run_lengths.last_mut() {
+            if v.is_none() {
+                *rl += additional; // update run-length
+            } else {
+                // new run-length
+                self.run_lengths.push((additional, None));
+            }
+        } else {
+            //First entry in the encoding
+            self.run_lengths.push((additional, None));
+        }
+
+        self.null_count += additional;
+        self.num_rows += additional;
+    }
+
+    //
+    //
+    // ---- Methods for getting row ids from values.
+    //
+    //
+
+    /// Populates the provided destination container with the row ids satisfying
+    /// the provided predicate.
+    ///
+    /// TODO(edd): To get the correct behaviour when comparing against NaN, ∞ or -∞
+    /// need to implement some comparator functions for all the types of `T` we
+    /// plan to accept.
+    pub fn row_ids_filter(&self, value: T, op: &cmp::Operator, dst: RowIDs) -> RowIDs {
+        match op {
+            cmp::Operator::Equal | cmp::Operator::NotEqual => {
+                self.row_ids_cmp_equal(value, op, dst)
+            }
+            cmp::Operator::LT | cmp::Operator::LTE | cmp::Operator::GT | cmp::Operator::GTE => {
+                self.row_ids_cmp(value, op, dst)
+            }
+        }
+    }
+
+    /// Returns the set of row ids that satisfy a pair of binary operators
+    /// against two values of the same physical type.
+    ///
+    /// This method is a special case optimisation for common cases where one
+    /// wishes to do the equivalent of WHERE x > y AND x <= y` for example.
+    ///
+    /// Essentially, this supports:
+    ///     `x {>, >=, <, <=} value1 AND x {>, >=, <, <=} value2`.
+    ///
+    /// Note, this doesn't currently support all possible combinations of
+    /// operator.
+    pub fn row_ids_filter_range(
+        &self,
+        left: (T, &cmp::Operator),
+        right: (T, &cmp::Operator),
+        dst: RowIDs,
+    ) -> RowIDs {
+        match (&left.1, &right.1) {
+            (cmp::Operator::GT, cmp::Operator::LT)
+            | (cmp::Operator::GT, cmp::Operator::LTE)
+            | (cmp::Operator::GTE, cmp::Operator::LT)
+            | (cmp::Operator::GTE, cmp::Operator::LTE)
+            | (cmp::Operator::LT, cmp::Operator::GT)
+            | (cmp::Operator::LT, cmp::Operator::GTE)
+            | (cmp::Operator::LTE, cmp::Operator::GT)
+            | (cmp::Operator::LTE, cmp::Operator::GTE) => self.row_ids_cmp_range(
+                (&left.0, Self::ord_from_op(&left.1)),
+                (&right.0, Self::ord_from_op(&right.1)),
+                dst,
+            ),
+
+            (_, _) => panic!("unsupported operators provided"),
+        }
+    }
+
+    // Finds row ids for non-null values, based on = or != operator.
+    //
+    // TODO(edd): predicate filtering could be improved here because we need to
+    //            effectively check all the run-lengths to find any that match
+    //            the predicate. Performance will be proportional to the number
+    //            of run-lengths in the column. For scalar columns where
+    //            predicates are less common for out use-cases this is probably
+    //            OK for a while. Improvements: (1) we could add bitsets of
+    //            pre-computed rows for each distinct value, which is what we
+    //            do for string RLE where equality predicates are very common,
+    //            or (2) we could add a sparse index to allow us to jump to the
+    //            run-lengths that contain matching logical row_ids.
+    fn row_ids_cmp_equal(&self, value: T, op: &cmp::Operator, mut dst: RowIDs) -> RowIDs {
+        dst.clear();
+
+        if self.num_rows() == 0 {
+            return dst;
+        }
+
+        // Given an operator `cmp` is a predicate function that applies it.
+        let cmp = match op {
+            cmp::Operator::Equal => {
+                |left: &T, right: &T| matches!(left.partial_cmp(right), Some(Ordering::Equal))
+            }
+            cmp::Operator::NotEqual => {
+                |left: &T, right: &T| !matches!(left.partial_cmp(right), Some(Ordering::Equal))
+            }
+            op => unreachable!("{:?} is an invalid operator", op),
+        };
+
+        let mut curr_logical_row_id = 0;
+        for (rl, next) in &self.run_lengths {
+            if let Some(next) = next {
+                if cmp(next, &value) {
+                    dst.add_range(curr_logical_row_id, curr_logical_row_id + rl);
+                }
+            }
+            curr_logical_row_id += rl;
+        }
+
+        dst
+    }
+
+    // Finds row ids for non-null values based on <, <=, > or >= operator.
+    // TODO(edd): predicate filtering could be improved here because we need to
+    //            effectively check all the run-lengths to find any that match
+    //            the predicate. Performance will be proportional to the number
+    //            of run-lengths in the column. For scalar columns where
+    //            predicates are less common for out use-cases this is probably
+    //            OK for a while. Improvements: (1) we could add bitsets of
+    //            pre-computed rows for each distinct value, which is what we
+    //            do for string RLE where predicates are very common.
+    fn row_ids_cmp(&self, value: T, op: &cmp::Operator, mut dst: RowIDs) -> RowIDs {
+        dst.clear();
+
+        if self.num_rows() == 0 {
+            return dst;
+        }
+
+        // Given an operator `cmp` is a predicate function that applies it.
+        let cmp = match op {
+            cmp::Operator::GT => PartialOrd::gt,
+            cmp::Operator::GTE => PartialOrd::ge,
+            cmp::Operator::LT => PartialOrd::lt,
+            cmp::Operator::LTE => PartialOrd::le,
+            op => unreachable!("{:?} is an invalid operator", op),
+        };
+
+        let mut curr_logical_row_id = 0;
+        for (rl, next) in &self.run_lengths {
+            if let Some(next) = next {
+                if cmp(next, &value) {
+                    dst.add_range(curr_logical_row_id, curr_logical_row_id + rl);
+                }
+            }
+            curr_logical_row_id += rl;
+        }
+
+        dst
+    }
+
+    // Special case function for finding all rows that satisfy two operators on
+    // two values.
+    //
+    // This function exists because it is more performant than calling
+    // `row_ids_filter` twice on predicates like `WHERE X > y and X <= x`
+    // which are very common, e.g., for timestamp columns.
+    //
+    // The method accepts two orderings for each predicate. If the predicate is
+    // `x < y` then the orderings provided will be
+    // `(Ordering::Less, Ordering::Less)`. This does lead to a slight overhead
+    // in checking non-matching values, but it means that the predicate `x <= y`
+    // can be supported by providing the ordering
+    // `(Ordering::Less, Ordering::Equal)`.
+    //.
+    fn row_ids_cmp_range(
+        &self,
+        left: (&T, (Ordering, Ordering)),
+        right: (&T, (Ordering, Ordering)),
+        mut dst: RowIDs,
+    ) -> RowIDs {
+        dst.clear();
+
+        let left_op = left.1;
+        let right_op = right.1;
+
+        let mut curr_logical_row_id = 0;
+        for (rl, next) in &self.run_lengths {
+            if let Some(next) = next {
+                // compare next value against the left and right's values
+                let left_cmp_result = next.partial_cmp(left.0);
+                let right_cmp_result = next.partial_cmp(right.0);
+
+                // TODO(edd): eurgh I still don't understand how I got this to
+                // be correct. Need to revisit to make it simpler.
+                let left_result_ok =
+                    !(left_cmp_result == Some(left_op.0) || left_cmp_result == Some(left_op.1));
+                let right_result_ok =
+                    !(right_cmp_result == Some(right_op.0) || right_cmp_result == Some(right_op.1));
+
+                if !(left_result_ok || right_result_ok) {
+                    dst.add_range(curr_logical_row_id, curr_logical_row_id + rl);
+                }
+                curr_logical_row_id += rl;
+            }
+        }
+
+        dst
+    }
+
+    // Helper function to convert comparison operators to cmp orderings.
+    fn ord_from_op(op: &cmp::Operator) -> (Ordering, Ordering) {
+        match op {
+            cmp::Operator::GT => (Ordering::Greater, Ordering::Greater),
+            cmp::Operator::GTE => (Ordering::Greater, Ordering::Equal),
+            cmp::Operator::LT => (Ordering::Less, Ordering::Less),
+            cmp::Operator::LTE => (Ordering::Less, Ordering::Equal),
+            _ => panic!("cannot convert operator to ordering"),
+        }
+    }
+
+    //
+    //
+    // ---- Methods for getting materialised values from row IDs.
+    //
+    //
+
+    /// Returns the logical value present at the provided row id.
+    ///
+    /// TODO(edd): a sparse index on this can help with materialisation cost by
+    /// providing starting indexes into the in the run length collection.
+    pub fn value(&self, row_id: u32) -> Option<T> {
+        assert!(
+            row_id < self.num_rows(),
+            "row_id {:?} out of bounds for {:?} rows",
+            row_id,
+            self.num_rows()
+        );
+
+        let mut ordinal_offset = 0;
+        for (rl, v) in &self.run_lengths {
+            if ordinal_offset + rl > row_id {
+                // this run-length overlaps desired row id
+                return *v;
+            }
+            ordinal_offset += rl;
+        }
+
+        // we are guaranteed to find a value at the provided row_id because
+        // `row_id < num_rows`
+        unreachable!(
+            "could not find value at row ID {:?}. num_rows = {:?}",
+            row_id,
+            self.num_rows()
+        )
+    }
+
+    fn check_row_ids_ordered(&self, row_ids: &[u32]) -> bool {
+        if row_ids.is_empty() {
+            return true;
+        }
+
+        let mut last = row_ids[0];
+        for &row_id in row_ids.iter().skip(1) {
+            if row_id <= last {
+                return false;
+            }
+            last = row_id;
+        }
+        true
+    }
+
+    /// Materialises a vector of references to the decoded values in the
+    /// provided ordered set of row ids.
+    ///
+    /// NULL values are represented by None.
+    ///
+    /// # Panics
+    ///
+    /// The behaviour of providing row IDs that are not an ordered set is
+    /// undefined. `values` may panic if the provided row IDs are are not an
+    /// ordered set in ascending order.
+    ///
+    /// Panics if the number of row IDs requested is more than the number of
+    /// rows in the column.
+    ///
+    /// Panics if a requested row ID is out of bounds of the ordinal offset of
+    /// a logical value.
+    ///
+    pub fn values(&self, row_ids: &[u32], mut dst: Vec<Option<T>>) -> Vec<Option<T>> {
+        assert!(!row_ids.is_empty(), "no row IDs provided");
+        assert!(
+            row_ids.len() <= self.num_rows() as usize,
+            "more row_ids {:?} than rows {:?}",
+            row_ids.len(),
+            self.num_rows()
+        );
+
+        dst.clear();
+        dst.reserve(row_ids.len());
+
+        // Ensure row ids ordered
+        debug_assert!(self.check_row_ids_ordered(row_ids));
+
+        let mut curr_logical_row_id = 0;
+        let (mut curr_entry_rl, mut curr_value) = self.run_lengths[0];
+
+        let mut i = 1;
+        for &row_id in row_ids {
+            assert!(
+                row_id < self.num_rows(),
+                "row_id {:?} beyond max row {:?}",
+                row_id,
+                self.num_rows() - 1
+            );
+
+            while curr_logical_row_id + curr_entry_rl <= row_id {
+                // this encoded entry does not cover the row we need.
+                // move on to next entry
+                curr_logical_row_id += curr_entry_rl;
+                curr_entry_rl = self.run_lengths[i].0;
+                curr_value = self.run_lengths[i].1;
+
+                i += 1;
+            }
+
+            // this encoded entry covers the row_id we want.
+            dst.push(curr_value);
+
+            curr_logical_row_id += 1; // move forwards a logical row
+            curr_entry_rl -= 1;
+        }
+
+        assert_eq!(row_ids.len(), dst.len());
+        dst
+    }
+
+    /// Returns references to the logical (decoded) values for all the rows in
+    /// the column.
+    ///
+    /// NULL values are represented by None.
+    pub fn all_values(&self, mut dst: Vec<Option<T>>) -> Vec<Option<T>> {
+        dst.clear();
+        dst.reserve(self.num_rows as usize);
+
+        for (rl, v) in &self.run_lengths {
+            dst.extend(iter::repeat(v).take(*rl as usize));
+        }
+        dst
+    }
+
+    // /// Returns true if a non-null value exists at any of the row ids.
+    pub fn has_non_null_value(&self, row_ids: &[u32]) -> bool {
+        assert!(!row_ids.is_empty(), "no row IDs provided");
+        // Ensure row ids ordered
+        debug_assert!(self.check_row_ids_ordered(row_ids));
+
+        assert!(
+            row_ids.len() <= self.num_rows() as usize,
+            "more row_ids {:?} than rows {:?}",
+            row_ids.len(),
+            self.num_rows()
+        );
+
+        let mut curr_logical_row_id = 0;
+        let (mut curr_entry_rl, mut curr_value) = self.run_lengths[0];
+
+        let mut i = 1;
+        for &row_id in row_ids {
+            assert!(
+                row_id < self.num_rows(),
+                "row_id {:?} beyond max row {:?}",
+                row_id,
+                self.num_rows() - 1
+            );
+
+            // find correctly logical row for `row_id`.
+            while curr_logical_row_id + curr_entry_rl <= row_id {
+                // this encoded entry does not cover the row we need.
+                // move on to next entry
+                curr_logical_row_id += curr_entry_rl;
+                curr_entry_rl = self.run_lengths[i].0;
+                curr_value = self.run_lengths[i].1;
+
+                i += 1;
+            }
+
+            if curr_value.is_some() {
+                return true;
+            }
+
+            curr_logical_row_id += 1; // move forwards a logical row
+            curr_entry_rl -= 1;
+        }
+
+        // all provide row IDs contain NULL values
+        false
+    }
+
+    /// Determines if the column contains a non-null value.
+    pub fn has_any_non_null_value(&self) -> bool {
+        self.null_count() < self.num_rows()
+    }
+
+    //
+    //
+    // ---- Methods for aggregation.
+    //
+    //
+
+    /// Returns the count of the values for the provided
+    /// row IDs.
+    ///
+    /// Since this encoding cannot have NULL values this is just the number of
+    /// rows requested.
+    pub fn count(&self, _row_ids: &[u32]) -> u32 {
+        todo!()
+    }
+
+    /// Returns the summation of the logical (decoded) values for the provided
+    /// row IDs.
+    pub fn sum(&self, _row_ids: &[u32]) -> Option<T> {
+        todo!()
+    }
+
+    /// Returns the first logical (decoded) value from the provided
+    /// row IDs.
+    pub fn first(&self, _row_ids: &[u32]) -> Option<T> {
+        todo!()
+    }
+
+    /// Returns the last logical (decoded) value from the provided
+    /// row IDs.
+    pub fn last(&self, _row_ids: &[u32]) -> Option<T> {
+        todo!()
+    }
+
+    /// Returns the minimum logical (decoded) value from the provided
+    /// row IDs.
+    pub fn min(&self, _row_ids: &[u32]) -> Option<T> {
+        todo!()
+    }
+
+    /// Returns the maximum logical (decoded) value from the provided
+    /// row IDs.
+    pub fn max(&self, _row_ids: &[u32]) -> Option<T> {
+        todo!()
+    }
+}
+
+impl<T> iter::FromIterator<T> for RLE<T>
+where
+    T: PartialOrd + Debug + Default + Copy,
+{
+    fn from_iter<I: IntoIterator<Item = T>>(itr: I) -> Self {
+        let mut itr = itr.into_iter();
+        let mut enc = Self::default();
+        let first = match itr.next() {
+            Some(v) => v,
+            None => return enc,
+        };
+        let (mut rl, mut v) = (1, first);
+        for next in itr {
+            if next == v {
+                rl += 1;
+                continue;
+            }
+
+            enc.push_additional(Some(v), rl);
+            rl = 1;
+            v = next;
+        }
+
+        // push the final run length
+        enc.push_additional(Some(v), rl);
+        enc
+    }
+}
+
+impl<T> iter::FromIterator<Option<T>> for RLE<T>
+where
+    T: PartialOrd + Debug + Default + Copy,
+{
+    fn from_iter<I: IntoIterator<Item = Option<T>>>(itr: I) -> Self {
+        let mut itr = itr.into_iter();
+        let mut enc = Self::default();
+        let first = match itr.next() {
+            Some(v) => v,
+            None => return enc,
+        };
+
+        let (mut rl, mut v) = (1, first);
+        for next in itr {
+            if next == v {
+                rl += 1;
+                continue;
+            }
+
+            enc.push_additional(v, rl);
+            rl = 1;
+            v = next;
+        }
+
+        // push the final run length
+        enc.push_additional(v, rl);
+        enc
+    }
+}
+
+#[cfg(test)]
+mod test {
+    use super::*;
+    use arrow::array::Int8Array;
+    use cmp::Operator;
+    use std::iter::FromIterator;
+
+    #[test]
+    fn from_slice() {
+        let cases = vec![
+            (&[][..], vec![]),
+            (&[1][..], vec![(1, Some(1))]),
+            (&[100, 22][..], vec![(1, Some(100)), (1, Some(22))]),
+            (
+                &[100, 22, 100, 100][..],
+                vec![(1, Some(100)), (1, Some(22)), (2, Some(100))],
+            ),
+        ];
+
+        for (input, exp_rl) in cases {
+            let enc: RLE<i32> = RLE::from_iter(input.to_vec());
+            assert_eq!(enc.run_lengths, exp_rl);
+        }
+    }
+
+    #[test]
+    fn from_slice_opt() {
+        let cases = vec![
+            (&[][..], vec![]),
+            (&[Some(1)][..], vec![(1, Some(1))]),
+            (
+                &[Some(100), Some(22)][..],
+                vec![(1, Some(100)), (1, Some(22))],
+            ),
+            (
+                &[Some(100), Some(22), Some(100), Some(100)][..],
+                vec![(1, Some(100)), (1, Some(22)), (2, Some(100))],
+            ),
+            (&[None][..], vec![(1, None)]),
+            (
+                &[None, None, Some(1), None][..],
+                vec![(2, None), (1, Some(1)), (1, None)],
+            ),
+        ];
+
+        for (input, exp_rl) in cases {
+            let enc: RLE<u8> = RLE::from_iter(input.to_vec());
+            assert_eq!(enc.run_lengths, exp_rl);
+        }
+    }
+
+    #[test]
+    fn from_arrow_array() {
+        let cases = vec![
+            (vec![], vec![]),
+            (vec![Some(1)], vec![(1, Some(1))]),
+            (
+                vec![Some(100), Some(22)],
+                vec![(1, Some(100)), (1, Some(22))],
+            ),
+            (
+                vec![Some(100), Some(22), Some(100), Some(100)],
+                vec![(1, Some(100)), (1, Some(22)), (2, Some(100))],
+            ),
+            (vec![None], vec![(1, None)]),
+            (
+                vec![None, None, Some(1), None],
+                vec![(2, None), (1, Some(1)), (1, None)],
+            ),
+        ];
+
+        for (input, exp_rl) in cases {
+            let arr = Int8Array::from(input);
+            let enc: RLE<i8> = RLE::from_iter(&arr);
+            assert_eq!(enc.run_lengths, exp_rl);
+        }
+    }
+
+    #[test]
+    fn push() {
+        let mut enc = RLE::default();
+        enc.push_additional(Some(45), 3);
+        enc.push_additional(Some(-1), 1);
+        enc.push_additional(Some(45), 5);
+        enc.push_additional(Some(45), 1);
+        enc.push_additional(Some(336), 2);
+        enc.push_additional(None, 2);
+        enc.push_none();
+        enc.push(22);
+
+        assert_eq!(
+            enc.run_lengths,
+            vec![
+                (3, Some(45)),
+                (1, Some(-1)),
+                (6, Some(45)),
+                (2, Some(336)),
+                (3, None),
+                (1, Some(22))
+            ]
+        );
+    }
+
+    #[test]
+    fn null_count() {
+        let mut enc = RLE::default();
+        enc.push_additional(Some(45), 3);
+        assert_eq!(enc.null_count(), 0);
+
+        enc.push_none();
+        assert_eq!(enc.null_count(), 1);
+
+        enc.push_none();
+        assert_eq!(enc.null_count(), 2);
+    }
+
+    #[test]
+    fn num_rows() {
+        let mut enc = RLE::default();
+        enc.push_additional(Some(45), 3);
+        assert_eq!(enc.num_rows(), 3);
+
+        enc.push_none();
+        assert_eq!(enc.num_rows(), 4);
+    }
+
+    #[test]
+    fn contains_null() {
+        let mut enc = RLE::default();
+        enc.push_additional(Some(45), 3);
+        assert!(!enc.contains_null());
+
+        enc.push_none();
+        assert!(enc.contains_null());
+    }
+
+    #[test]
+    fn size() {
+        let mut enc: RLE<i64> = RLE::default();
+
+        // 32b Self + (0 rl * 24) = 32
+        assert_eq!(enc.size(), 32);
+
+        enc.push_none();
+        // 32b Self + (1 rl * 24) = 56
+        assert_eq!(enc.size(), 56);
+
+        enc.push_additional_some(1, 10);
+        // 32b Self + (2 rl * 24) = 80
+        assert_eq!(enc.size(), 80);
+    }
+
+    #[test]
+    fn size_raw() {
+        let mut enc: RLE<i64> = RLE::default();
+
+        // 32b Self + (0 * 16)
+        assert_eq!(enc.size_raw(true), 32);
+        assert_eq!(enc.size_raw(false), 32);
+
+        enc.push_none();
+        // 32b Self + (1 * 16) = 48
+        assert_eq!(enc.size_raw(true), 48);
+        assert_eq!(enc.size_raw(false), 32);
+
+        enc.push_additional_some(1, 10);
+        // 32b Self + (11 * 16) = 208
+        assert_eq!(enc.size_raw(true), 208);
+        assert_eq!(enc.size_raw(false), 192);
+    }
+
+    #[test]
+    fn value() {
+        let mut enc = RLE::default();
+        enc.push_none();
+        enc.push_additional(Some(45), 3);
+        enc.push_additional(Some(90), 2);
+        enc.push(21);
+
+        assert_eq!(enc.value(0), None);
+        assert_eq!(enc.value(1), Some(45));
+        assert_eq!(enc.value(3), Some(45));
+        assert_eq!(enc.value(4), Some(90));
+        assert_eq!(enc.value(6), Some(21));
+    }
+
+    #[test]
+    fn check_row_ids_ordered() {
+        let cases = vec![
+            (&[0, 1, 2][..], true),
+            (&[0], true),
+            (&[], true),
+            (&[0, 2], true),
+            (&[1, 2], true),
+            (&[0, 0, 2], false),
+            (&[0, 1, 0], false),
+            (&[2, 1, 0], false),
+            (&[1, 1], false),
+            (&[1, 2, 2], false),
+        ];
+
+        let enc: RLE<i16> = RLE::default();
+
+        for (input, exp) in cases {
+            assert_eq!(enc.check_row_ids_ordered(input), exp);
+        }
+    }
+
+    #[test]
+    fn values() {
+        let mut enc = RLE::default();
+        enc.push_none();
+        enc.push_additional(Some(45), 3);
+        enc.push_additional(Some(90), 2);
+        enc.push(21);
+
+        // ensure buffer cleared by populating it
+        assert_eq!(
+            enc.values(&[0, 1, 2], vec![Some(33)]),
+            vec![None, Some(45), Some(45)]
+        );
+
+        assert_eq!(
+            enc.values(&[0, 1, 2, 3, 4], vec![]),
+            vec![None, Some(45), Some(45), Some(45), Some(90)]
+        );
+
+        assert_eq!(enc.values(&[2, 5], vec![]), vec![Some(45), Some(90)]);
+    }
+
+    #[test]
+    fn all_values() {
+        let mut enc = RLE::default();
+        // ensure buffer cleared by populating it
+        assert!(enc.all_values(vec![Some(33)]).is_empty());
+
+        enc.push_additional(Some(45), 3);
+        enc.push_additional(Some(90), 2);
+        enc.push_additional(None, 2);
+        enc.push(21);
+
+        assert_eq!(
+            enc.all_values(vec![None, Some(99)]),
+            vec![
+                Some(45),
+                Some(45),
+                Some(45),
+                Some(90),
+                Some(90),
+                None,
+                None,
+                Some(21)
+            ]
+        );
+
+        let mut enc: RLE<u8> = RLE::default();
+        enc.push_none();
+        assert_eq!(enc.all_values(vec![]), vec![None]);
+    }
+
+    #[test]
+    fn has_non_null_value() {
+        let mut enc: RLE<f64> = RLE::default();
+        enc.push_none();
+        assert!(!enc.has_non_null_value(&[0]));
+
+        enc.push_additional(Some(45.2), 3);
+        assert!(!enc.has_non_null_value(&[0]));
+        assert!(enc.has_non_null_value(&[0, 1]));
+        assert!(enc.has_non_null_value(&[2, 3]));
+        assert!(enc.has_non_null_value(&[0, 1, 2, 3]));
+
+        enc.push_additional(None, 3);
+        assert!(!enc.has_non_null_value(&[0, 5]));
+        assert!(!enc.has_non_null_value(&[6]));
+
+        // NULL, 45.2, 45.2, 45.2, NULL, NULL, NULL, 19.3
+        enc.push(19.3);
+        assert!(enc.has_non_null_value(&[3, 7]));
+        assert!(enc.has_non_null_value(&[7]));
+    }
+
+    #[test]
+    fn has_any_non_null_value() {
+        let mut enc: RLE<f64> = RLE::default();
+        assert!(!enc.has_any_non_null_value());
+
+        enc.push_none();
+        assert!(!enc.has_any_non_null_value());
+
+        enc.push_additional(None, 3);
+        assert!(!enc.has_any_non_null_value());
+
+        enc.push(22.34);
+        assert!(enc.has_any_non_null_value());
+
+        enc.push_additional(None, 3);
+        assert!(enc.has_any_non_null_value());
+    }
+
+    #[test]
+    fn row_ids_filter() {
+        // NULL, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, NULL, 19, 2, 2
+        let mut enc: RLE<u8> = RLE::default();
+        enc.push_none();
+        enc.push_additional_some(2, 10);
+        enc.push_none();
+        enc.push_additional_some(19, 1);
+        enc.push_additional_some(2, 2);
+
+        let all_non_null = vec![1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14];
+        let cases = vec![
+            (22, Operator::Equal, vec![]),
+            (22, Operator::NotEqual, all_non_null.clone()),
+            (22, Operator::LT, all_non_null.clone()),
+            (22, Operator::LTE, all_non_null.clone()),
+            (22, Operator::GT, vec![]),
+            (22, Operator::GTE, vec![]),
+            (0, Operator::Equal, vec![]),
+            (0, Operator::NotEqual, all_non_null.clone()),
+            (0, Operator::LT, vec![]),
+            (0, Operator::LTE, vec![]),
+            (0, Operator::GT, all_non_null.clone()),
+            (0, Operator::GTE, all_non_null.clone()),
+            (
+                2,
+                Operator::Equal,
+                vec![1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 13, 14],
+            ),
+            (2, Operator::NotEqual, vec![12]),
+            (2, Operator::LT, vec![]),
+            (
+                2,
+                Operator::LTE,
+                vec![1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 13, 14],
+            ),
+            (2, Operator::GT, vec![12]),
+            (2, Operator::GTE, all_non_null.clone()),
+            (19, Operator::Equal, vec![12]),
+            (
+                19,
+                Operator::NotEqual,
+                vec![1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 13, 14],
+            ),
+            (
+                19,
+                Operator::LT,
+                vec![1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 13, 14],
+            ),
+            (19, Operator::LTE, all_non_null),
+            (19, Operator::GT, vec![]),
+            (19, Operator::GTE, vec![12]),
+        ];
+
+        for (v, op, exp) in cases {
+            let dst = enc.row_ids_filter(v, &op, RowIDs::new_vector());
+            assert_eq!(dst.unwrap_vector(), &exp, "example '{} {:?}' failed", op, v);
+        }
+    }
+
+    #[test]
+    fn row_ids_filter_nulls() {
+        // Test all null encoding
+        let mut enc: RLE<u8> = RLE::default();
+        enc.push_additional_none(10);
+
+        let cases = vec![
+            (22, Operator::Equal),
+            (22, Operator::NotEqual),
+            (22, Operator::LT),
+            (22, Operator::LTE),
+            (22, Operator::GT),
+            (22, Operator::GTE),
+        ];
+
+        for (v, op) in cases {
+            let dst = enc.row_ids_filter(v, &op, RowIDs::new_vector());
+            assert!(
+                dst.unwrap_vector().is_empty(),
+                "example '{} {:?}' failed",
+                op,
+                v,
+            );
+        }
+    }
+
+    #[test]
+    fn row_ids_filter_range() {
+        let v = RLE::from_iter(vec![
+            100, 100, 101, 101, 101, 200, 300, 2030, 3, 101, 4, 5, 21, 100,
+        ]);
+
+        let cases = vec![
+            (
+                (100, &Operator::GTE),
+                (240, &Operator::LT),
+                vec![0, 1, 2, 3, 4, 5, 9, 13],
+            ),
+            (
+                (100, &Operator::GT),
+                (240, &Operator::LT),
+                vec![2, 3, 4, 5, 9],
+            ),
+            ((10, &Operator::LT), (-100, &Operator::GT), vec![8, 10, 11]),
+            ((21, &Operator::GTE), (21, &Operator::LTE), vec![12]),
+            (
+                (101, &Operator::GTE),
+                (2030, &Operator::LTE),
+                vec![2, 3, 4, 5, 6, 7, 9],
+            ),
+            ((10000, &Operator::LTE), (3999, &Operator::GT), vec![]),
+        ];
+
+        for (left, right, exp) in cases {
+            let dst = v.row_ids_filter_range(left, right, RowIDs::new_vector());
+            assert_eq!(dst.unwrap_vector(), &exp);
+        }
+    }
+}
diff --git a/read_buffer/src/column/float.rs b/read_buffer/src/column/float.rs
index c9d3967a58..76cbb00ca9 100644
--- a/read_buffer/src/column/float.rs
+++ b/read_buffer/src/column/float.rs
@@ -1,14 +1,25 @@
-use std::mem::size_of;
-
 use arrow::{self, array::Array};
+use std::iter::FromIterator;
+use std::{cmp::Ordering, mem::size_of};
 
-use super::encoding::{scalar::Fixed, scalar::FixedNull};
+use super::encoding::{
+    scalar::Fixed,
+    scalar::{rle::RLE, FixedNull},
+};
 use super::{cmp, Statistics};
 use crate::column::{RowIDs, Scalar, Value, Values};
 
+#[allow(clippy::upper_case_acronyms)] // TODO(edd): these will be OK in 1.52
+#[derive(Debug)]
 pub enum FloatEncoding {
+    // A fixed-width "no compression" vector of non-nullable values
     Fixed64(Fixed<f64>),
+
+    // A fixed-width "no compression" vector of nullable values (as Arrow array)
     FixedNull64(FixedNull<arrow::datatypes::Float64Type>),
+
+    // A RLE compressed encoding of nullable values.
+    RLE64(RLE<f64>),
 }
 
 impl FloatEncoding {
@@ -17,6 +28,7 @@ impl FloatEncoding {
         match self {
             Self::Fixed64(enc) => enc.size(),
             Self::FixedNull64(enc) => enc.size(),
+            Self::RLE64(enc) => enc.size(),
         }
     }
 
@@ -30,6 +42,7 @@ impl FloatEncoding {
                 size_of::<Vec<f64>>() + (enc.num_rows() as usize * size_of::<f64>())
             }
             Self::FixedNull64(enc) => enc.size_raw(include_nulls),
+            Self::RLE64(enc) => enc.size_raw(include_nulls),
         }
     }
 
@@ -38,6 +51,7 @@ impl FloatEncoding {
         match self {
             Self::Fixed64(enc) => enc.num_rows(),
             Self::FixedNull64(enc) => enc.num_rows(),
+            Self::RLE64(enc) => enc.num_rows(),
         }
     }
 
@@ -59,6 +73,7 @@ impl FloatEncoding {
         match self {
             Self::Fixed64(_) => false,
             Self::FixedNull64(enc) => enc.contains_null(),
+            Self::RLE64(enc) => enc.contains_null(),
         }
     }
 
@@ -67,6 +82,7 @@ impl FloatEncoding {
         match self {
             Self::Fixed64(_) => 0,
             Self::FixedNull64(enc) => enc.null_count(),
+            Self::RLE64(enc) => enc.null_count(),
         }
     }
 
@@ -75,6 +91,7 @@ impl FloatEncoding {
         match self {
             Self::Fixed64(_) => true,
             Self::FixedNull64(enc) => enc.has_any_non_null_value(),
+            Self::RLE64(enc) => enc.has_any_non_null_value(),
         }
     }
 
@@ -84,6 +101,7 @@ impl FloatEncoding {
         match self {
             Self::Fixed64(_) => !row_ids.is_empty(), // all rows will be non-null
             Self::FixedNull64(enc) => enc.has_non_null_value(row_ids),
+            Self::RLE64(enc) => enc.has_non_null_value(row_ids),
         }
     }
 
@@ -95,6 +113,10 @@ impl FloatEncoding {
                 Some(v) => Value::Scalar(Scalar::F64(v)),
                 None => Value::Null,
             },
+            Self::RLE64(c) => match c.value(row_id) {
+                Some(v) => Value::Scalar(Scalar::F64(v)),
+                None => Value::Null,
+            },
         }
     }
 
@@ -105,6 +127,7 @@ impl FloatEncoding {
         match &self {
             Self::Fixed64(c) => Values::F64(c.values::<f64>(row_ids, vec![])),
             Self::FixedNull64(c) => Values::F64N(c.values(row_ids, vec![])),
+            Self::RLE64(c) => Values::F64N(c.values(row_ids, vec![])),
         }
     }
 
@@ -115,6 +138,7 @@ impl FloatEncoding {
         match &self {
             Self::Fixed64(c) => Values::F64(c.all_values::<f64>(vec![])),
             Self::FixedNull64(c) => Values::F64N(c.all_values(vec![])),
+            Self::RLE64(c) => Values::F64N(c.all_values(vec![])),
         }
     }
 
@@ -127,6 +151,7 @@ impl FloatEncoding {
         match &self {
             Self::Fixed64(c) => c.row_ids_filter(value.as_f64(), op, dst),
             Self::FixedNull64(c) => c.row_ids_filter(value.as_f64(), op, dst),
+            Self::RLE64(c) => c.row_ids_filter(value.as_f64(), op, dst),
         }
     }
 
@@ -146,6 +171,9 @@ impl FloatEncoding {
                 c.row_ids_filter_range((low.1.as_f64(), &low.0), (high.1.as_f64(), &high.0), dst)
             }
             Self::FixedNull64(_) => todo!(),
+            Self::RLE64(c) => {
+                c.row_ids_filter_range((low.1.as_f64(), &low.0), (high.1.as_f64(), &high.0), dst)
+            }
         }
     }
 
@@ -156,6 +184,10 @@ impl FloatEncoding {
                 Some(v) => Value::Scalar(Scalar::F64(v)),
                 None => Value::Null,
             },
+            Self::RLE64(c) => match c.min(row_ids) {
+                Some(v) => Value::Scalar(Scalar::F64(v)),
+                None => Value::Null,
+            },
         }
     }
 
@@ -166,6 +198,10 @@ impl FloatEncoding {
                 Some(v) => Value::Scalar(Scalar::F64(v)),
                 None => Value::Null,
             },
+            Self::RLE64(c) => match c.max(row_ids) {
+                Some(v) => Value::Scalar(Scalar::F64(v)),
+                None => Value::Null,
+            },
         }
     }
 
@@ -176,6 +212,10 @@ impl FloatEncoding {
                 Some(v) => Scalar::F64(v),
                 None => Scalar::Null,
             },
+            Self::RLE64(c) => match c.sum(row_ids) {
+                Some(v) => Scalar::F64(v),
+                None => Scalar::Null,
+            },
         }
     }
 
@@ -183,6 +223,7 @@ impl FloatEncoding {
         match &self {
             Self::Fixed64(c) => c.count(row_ids),
             Self::FixedNull64(c) => c.count(row_ids),
+            Self::RLE64(c) => c.count(row_ids),
         }
     }
 
@@ -191,6 +232,7 @@ impl FloatEncoding {
         match &self {
             Self::Fixed64(_) => "None",
             Self::FixedNull64(_) => "None",
+            Self::RLE64(enc) => enc.name(),
         }
     }
 
@@ -199,6 +241,7 @@ impl FloatEncoding {
         match &self {
             Self::Fixed64(_) => "f64",
             Self::FixedNull64(_) => "f64",
+            Self::RLE64(_) => "f64",
         }
     }
 }
@@ -209,30 +252,100 @@ impl std::fmt::Display for FloatEncoding {
         match self {
             Self::Fixed64(enc) => write!(f, "[{}]: {}", name, enc),
             Self::FixedNull64(enc) => write!(f, "[{}]: {}", name, enc),
+            Self::RLE64(enc) => write!(f, "[{}]: {}", name, enc),
         }
     }
 }
 
+fn rle_rows(arr: &[f64]) -> usize {
+    arr.len()
+        - arr
+            .iter()
+            .zip(arr.iter().skip(1))
+            .filter(|(curr, next)| matches!(curr.partial_cmp(next), Some(Ordering::Equal)))
+            .count()
+}
+
+fn rle_rows_opt(mut itr: impl Iterator<Item = Option<f64>>) -> usize {
+    let mut v = match itr.next() {
+        Some(v) => v,
+        None => return 0,
+    };
+
+    let mut total_rows = 0;
+    for next in itr {
+        if let Some(Ordering::Equal) = v.partial_cmp(&next) {
+            continue;
+        }
+
+        total_rows += 1;
+        v = next;
+    }
+
+    total_rows + 1 // account for original run
+}
+
+/// A lever to decide the minimum size in bytes that RLE the column needs to
+/// reduce the overall footprint by. 0.1 means that the size of the column must
+/// be reduced by 10%
+pub const MIN_RLE_SIZE_REDUCTION: f64 = 0.3; // 30%
+
 /// Converts a slice of `f64` values into a `FloatEncoding`.
+///
+/// There are two possible encodings for &[f64]:
+///    * "None": effectively store the slice in a vector;
+///    * "RLE": for slices that have a sufficiently low cardinality they may
+///             benefit from being run-length encoded.
+///
+/// The encoding is chosen based on the heuristics in the `From` implementation
 impl From<&[f64]> for FloatEncoding {
     fn from(arr: &[f64]) -> Self {
+        // The number of rows we would reduce the column by if we encoded it
+        // as RLE.
+        let base_size = arr.len() * size_of::<f64>();
+        let rle_size = rle_rows(arr) * size_of::<(u32, Option<f64>)>(); // size of a run length
+        if (base_size as f64 - rle_size as f64) / base_size as f64 >= MIN_RLE_SIZE_REDUCTION {
+            return Self::RLE64(RLE::from_iter(arr.to_vec()));
+        }
+
+        // Don't apply a compression encoding to the column
         Self::Fixed64(Fixed::<f64>::from(arr))
     }
 }
 
-/// Converts an Arrow `Float64Array` into a `FloatEncoding`.
+/// Converts an Arrow Float array into a `FloatEncoding`.
+///
+/// There are two possible encodings for an Arrow array:
+///    * "None": effectively keep the data in its Arrow array;
+///    * "RLE": for arrays that have a sufficiently large number of NULL values
+///             they may benefit from being run-length encoded.
+///
+/// The encoding is chosen based on the heuristics in the `From` implementation
 impl From<arrow::array::Float64Array> for FloatEncoding {
     fn from(arr: arrow::array::Float64Array) -> Self {
         if arr.null_count() == 0 {
             return Self::from(arr.values());
         }
+
+        // The number of rows we would reduce the column by if we encoded it
+        // as RLE.
+        let base_size = arr.len() * size_of::<f64>();
+        let rle_size = rle_rows_opt(arr.iter()) * size_of::<(u32, Option<f64>)>(); // size of a run length
+        if (base_size as f64 - rle_size as f64) / base_size as f64 >= MIN_RLE_SIZE_REDUCTION {
+            return Self::RLE64(RLE::from_iter(&arr));
+        }
+
         Self::FixedNull64(FixedNull::<arrow::datatypes::Float64Type>::from(arr))
     }
 }
 
 #[cfg(test)]
 mod test {
+    use std::iter;
+
     use super::*;
+    use arrow::array::Float64Array;
+    use cmp::Operator;
 
     #[test]
     fn size_raw() {
@@ -255,4 +368,114 @@ mod test {
         assert_eq!(enc.size_raw(true), 64);
         assert_eq!(enc.size_raw(false), 56);
     }
+
+    fn rle_rows() {
+        let cases = vec![
+            (vec![0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0], 9),
+            (vec![0.0, 0.0], 1),
+            (vec![1.0, 2.0, 1.0], 3),
+            (vec![1.0, 2.0, 1.0, 1.0], 3),
+            (vec![1.0], 1),
+        ];
+
+        for (input, exp) in cases {
+            assert_eq!(super::rle_rows(input.as_slice()), exp);
+        }
+    }
+
+    #[test]
+    fn rle_rows_opt() {
+        let cases = vec![
+            (vec![Some(0.0), Some(2.0), Some(1.0)], 3),
+            (vec![Some(0.0), Some(0.0)], 1),
+        ];
+
+        for (input, exp) in cases {
+            assert_eq!(super::rle_rows_opt(input.into_iter()), exp);
+        }
+    }
+
+    #[test]
+    fn from_arrow_array() {
+        // Rows not reduced
+        let input: Vec<Option<f64>> = vec![Some(33.2), Some(1.2), Some(2.2), None, Some(3.2)];
+        let arr = Float64Array::from(input);
+        let enc = FloatEncoding::from(arr);
+        assert!(matches!(enc, FloatEncoding::FixedNull64(_)));
+
+        // Rows not reduced and no nulls so can go in `Fixed64`.
+        let input: Vec<Option<f64>> = vec![Some(33.2), Some(1.2), Some(2.2), Some(3.2)];
+        let arr = Float64Array::from(input);
+        let enc = FloatEncoding::from(arr);
+        assert!(matches!(enc, FloatEncoding::Fixed64(_)));
+
+        // Goldilocks - encode as RLE
+        let input: Vec<Option<f64>> = vec![Some(33.2); 10];
+        let arr = Float64Array::from(input);
+        let enc = FloatEncoding::from(arr);
+        assert!(matches!(enc, FloatEncoding::RLE64(_)));
+
+        // Goldilocks - encode as RLE
+        let mut input: Vec<Option<f64>> = vec![Some(33.2); 10];
+        input.extend(iter::repeat(None).take(10));
+        let arr = Float64Array::from(input);
+        let enc = FloatEncoding::from(arr);
+        assert!(matches!(enc, FloatEncoding::RLE64(_)));
+    }
+
+    #[test]
+    // Test NaN behaviour when `FloatEncoder`s are used.
+    //
+    // TODO(edd): I need to add the correct comparators to the scalar encodings
+    //            so that they behave the same as PG
+    //
+    fn row_ids_filter_nan() {
+        let data = vec![22.3, f64::NAN, f64::NEG_INFINITY, f64::INFINITY];
+
+        let cases = vec![
+            FloatEncoding::RLE64(RLE::from_iter(data.clone())),
+            FloatEncoding::Fixed64(Fixed::from(data.as_slice())),
+            FloatEncoding::FixedNull64(FixedNull::from(data.as_slice())),
+        ];
+
+        for enc in cases {
+            _row_ids_filter_nan(enc)
+        }
+    }
+
+    fn _row_ids_filter_nan(_enc: FloatEncoding) {
+        // These cases replicate the behaviour in PG.
+        let cases = vec![
+            (2.0, Operator::Equal, vec![0]),                        // 22.3
+            (2.0, Operator::NotEqual, vec![0, 1, 2, 3]),            // 22.3, NaN, -∞, ∞
+            (2.0, Operator::LT, vec![2]),                           // -∞
+            (2.0, Operator::LTE, vec![2]),                          // -∞
+            (2.0, Operator::GT, vec![0, 1, 3]),                     // 22.3, NaN, ∞
+            (2.0, Operator::GTE, vec![0, 1, 3]),                    // 22.3, NaN, ∞
+            (f64::NAN, Operator::Equal, vec![1]),                   // NaN
+            (f64::NAN, Operator::NotEqual, vec![0, 2, 3]),          // 22.3, -∞, ∞
+            (f64::NAN, Operator::LT, vec![0, 2, 3]),                // 22.3, -∞, ∞
+            (f64::NAN, Operator::LTE, vec![0, 1, 2, 3]),            // 22.3, NaN, -∞, ∞
+            (f64::NAN, Operator::GT, vec![]),                       //
+            (f64::NAN, Operator::GTE, vec![1]),                     // NaN
+            (f64::INFINITY, Operator::Equal, vec![3]),              // ∞
+            (f64::INFINITY, Operator::NotEqual, vec![0, 1, 2]),     // 22.3, NaN, -∞
+            (f64::INFINITY, Operator::LT, vec![0, 2]),              // 22.3, -∞
+            (f64::INFINITY, Operator::LTE, vec![0, 2, 3]),          // 22.3, -∞, ∞
+            (f64::INFINITY, Operator::GT, vec![1]),                 // NaN
+            (f64::INFINITY, Operator::GTE, vec![1, 3]),             // NaN, ∞
+            (f64::NEG_INFINITY, Operator::Equal, vec![2]),          // -∞
+            (f64::NEG_INFINITY, Operator::NotEqual, vec![0, 1, 3]), // 22.3, NaN, ∞
+            (f64::NEG_INFINITY, Operator::LT, vec![]),              //
+            (f64::NEG_INFINITY, Operator::LTE, vec![2]),            // -∞
+            (f64::NEG_INFINITY, Operator::GT, vec![0, 1, 3]),       // 22.3, NaN, ∞
+            (f64::NEG_INFINITY, Operator::GTE, vec![0, 1, 2, 3]),   // 22.3, NaN, -∞, ∞
+        ];
+
+        // TODO(edd): I need to add support for PG-like comparators for NaN etc.
+        for (_v, _op, _exp) in cases {
+            //let dst = enc.row_ids_filter(v, &op, RowIDs::new_vector());
+            //assert_eq!(dst.unwrap_vector(), &exp, "example '{} {:?}' failed", op, v);
+        }
+    }
 }