test: add read_filter benchmark

pull/24376/head
Edd Robinson 2021-04-29 22:44:27 +01:00
parent 4e766d7085
commit b7b87c1c96
3 changed files with 328 additions and 4 deletions


@@ -1,8 +1,9 @@
-mod read_group;
-
 use criterion::{criterion_group, criterion_main};
 
+mod read_filter;
+mod read_group;
+use read_filter::read_filter;
 use read_group::read_group;
 
-criterion_group!(benches, read_group);
+criterion_group!(benches, read_filter, read_group);
 criterion_main!(benches);
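
For context, this hunk is standard criterion harness wiring: each benchmark module exposes an entry point that registers benchmarks, and the group macros generate the binary's `main`. A minimal, self-contained sketch of the same pattern (the `example_bench` name and its label are illustrative, not part of this commit):

use criterion::{criterion_group, criterion_main, Criterion};

// Each entry point takes `&mut Criterion` and registers one or more
// benchmarks on it, just like `read_filter` and `read_group` above.
fn example_bench(c: &mut Criterion) {
    c.bench_function("example", |b| b.iter(|| 2 + 2));
}

// `criterion_group!` bundles entry points into a group; `criterion_main!`
// expands to a `main` function that runs every registered group.
criterion_group!(benches, example_bench);
criterion_main!(benches);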


@@ -0,0 +1,314 @@
use criterion::{BenchmarkId, Criterion, Throughput};
use rand::distributions::Alphanumeric;
use rand::prelude::*;
use rand::Rng;
use rand_distr::{Distribution, Normal};

use internal_types::selection::Selection;
use packers::{sorter, Packers};
use read_buffer::{
    benchmarks::{Column, ColumnType, RowGroup},
    Chunk,
};
use read_buffer::{BinaryExpr, Predicate};

const ONE_MS: i64 = 1_000_000;

pub fn read_filter(c: &mut Criterion) {
    let mut rng = rand::thread_rng();

    let mut chunk = Chunk::new(22, read_buffer::ChunkMetrics::new_unregistered());
    let row_group = generate_row_group(200_000, &mut rng);
    read_buffer::benchmarks::upsert_table_with_row_group(&mut chunk, "table", row_group);

    read_filter_no_pred_vary_proj(c, &chunk);
    read_filter_with_pred_vary_proj(c, &chunk);
}
// These benchmarks track the performance of read_filter without any predicate
// but with a varying projection (number and cardinality of columns requested).
fn read_filter_no_pred_vary_proj(c: &mut Criterion, chunk: &Chunk) {
    let mut group = c.benchmark_group("read_filter/no_pred");

    // All of these projections return the same number of rows, but the
    // projected columns have varying cardinalities.
    let projections = vec![
        (Selection::Some(&["user_id"]), 200_000),
        (Selection::Some(&["node_id"]), 2_000),
        (Selection::Some(&["cluster"]), 200),
        (Selection::Some(&["env"]), 2),
    ];

    for (projection, exp_card) in projections {
        // The benchmark measures the throughput of materialising the results;
        // criterion reports it in rows (elements) per second.
        group.throughput(Throughput::Elements(200_000));
        group.bench_with_input(
            BenchmarkId::from_parameter(format!("cardinality_{:?}_rows_{:?}", exp_card, 200_000)),
            &exp_card,
            |b, _| {
                b.iter(|| {
                    let result = chunk
                        .read_filter("table", Predicate::default(), projection)
                        .unwrap();
                    let rbs = result.collect::<Vec<_>>();
                    assert_eq!(rbs.len(), 1);
                    assert_eq!(rbs[0].num_rows(), 200_000);
                    assert_eq!(rbs[0].num_columns(), 1);
                });
            },
        );
    }
    group.finish();
}
// These benchmarks track the performance of read_filter with different
// predicates.
fn read_filter_with_pred_vary_proj(c: &mut Criterion, chunk: &Chunk) {
    let mut group = c.benchmark_group("read_filter/with_pred");

    // These predicates vary the number of rows returned.
    let predicates = vec![(
        Predicate::with_time_range(
            &[BinaryExpr::from(("env", "=", "env-1"))],
            i64::MIN,
            i64::MAX,
        ),
        100_000,
    )];

    for (predicate, exp_rows) in predicates {
        // The benchmark measures the throughput of materialising the results;
        // criterion reports it in rows (elements) per second.
        group.throughput(Throughput::Elements(exp_rows as u64));
        group.bench_with_input(
            BenchmarkId::from_parameter(format!("rows_{:?}", exp_rows)),
            &exp_rows,
            |b, _| {
                b.iter(|| {
                    let result = chunk
                        .read_filter("table", predicate.clone(), Selection::All)
                        .unwrap();
                    let rbs = result.collect::<Vec<_>>();
                    assert_eq!(rbs.len(), 1);
                    // Data is randomly generated, so the exact row count varies.
                    assert!(rbs[0].num_rows() > 0);
                    assert_eq!(rbs[0].num_columns(), 11);
                });
            },
        );
    }
    group.finish();
}
// TODO(edd): figure out how to DRY this into a single place in the `benches`
// "crate".
//
// This generates a `RowGroup` with a known schema, ~known column cardinalities
// and a variable number of rows.
//
// The schema and cardinalities are in line with a tracing data use-case.
fn generate_row_group(rows: usize, rng: &mut ThreadRng) -> RowGroup {
    let mut timestamp = 1351700038292387000_i64;
    let spans_per_trace = 10;

    let mut column_packers: Vec<Packers> = vec![
        Packers::from(Vec::<Option<String>>::with_capacity(rows)), // env (card 2)
        Packers::from(Vec::<Option<String>>::with_capacity(rows)), // data_centre (card 20)
        Packers::from(Vec::<Option<String>>::with_capacity(rows)), // cluster (card 200)
        Packers::from(Vec::<Option<String>>::with_capacity(rows)), // user_id (card 200,000)
        Packers::from(Vec::<Option<String>>::with_capacity(rows)), // request_id (card 2,000,000)
        Packers::from(Vec::<Option<String>>::with_capacity(rows)), // node_id (card 2,000)
        Packers::from(Vec::<Option<String>>::with_capacity(rows)), // pod_id (card 20,000)
        Packers::from(Vec::<Option<String>>::with_capacity(rows)), // trace_id (card "rows / 10")
        Packers::from(Vec::<Option<String>>::with_capacity(rows)), // span_id (card "rows")
        Packers::from(Vec::<Option<i64>>::with_capacity(rows)),    // duration
        Packers::from(Vec::<Option<i64>>::with_capacity(rows)),    // time
    ];
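    // Nine tag columns plus the `duration` field and the `time` column: 11
    // columns in total, matching the `num_columns()` assertion in the
    // predicate benchmark above.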
    let n = rows / spans_per_trace;
    for _ in 0..n {
        column_packers =
            generate_trace_for_row_group(spans_per_trace, timestamp, column_packers, rng);

        // The next trace is ~10 seconds in the future.
        timestamp += 10_000 * ONE_MS;
    }

    // Sort the packers from lowest to highest cardinality, excluding columns
    // that are likely to be unique.
    //
    // - env, data_centre, cluster, node_id, pod_id, user_id, request_id, time
    sorter::sort(&mut column_packers, &[0, 1, 2, 5, 6, 3, 4, 10]).unwrap();
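    // Note: sorting the lowest-cardinality columns first produces long runs
    // of repeated values, which should (presumably) benefit the read buffer's
    // dictionary/run-length string encodings and mirror how production data
    // would be laid out.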
    // Create the columns from the packed data.
    let columns = vec![
        (
            "env".to_string(),
            ColumnType::Tag(Column::from(column_packers[0].str_packer().values())),
        ),
        (
            "data_centre".to_string(),
            ColumnType::Tag(Column::from(column_packers[1].str_packer().values())),
        ),
        (
            "cluster".to_string(),
            ColumnType::Tag(Column::from(column_packers[2].str_packer().values())),
        ),
        (
            "user_id".to_string(),
            ColumnType::Tag(Column::from(column_packers[3].str_packer().values())),
        ),
        (
            "request_id".to_string(),
            ColumnType::Tag(Column::from(column_packers[4].str_packer().values())),
        ),
        (
            "node_id".to_string(),
            ColumnType::Tag(Column::from(column_packers[5].str_packer().values())),
        ),
        (
            "pod_id".to_string(),
            ColumnType::Tag(Column::from(column_packers[6].str_packer().values())),
        ),
        (
            "trace_id".to_string(),
            ColumnType::Tag(Column::from(column_packers[7].str_packer().values())),
        ),
        (
            "span_id".to_string(),
            ColumnType::Tag(Column::from(column_packers[8].str_packer().values())),
        ),
        (
            "duration".to_string(),
            ColumnType::Field(Column::from(
                column_packers[9].i64_packer().some_values().as_slice(),
            )),
        ),
        (
            "time".to_string(),
            ColumnType::Time(Column::from(
                column_packers[10].i64_packer().some_values().as_slice(),
            )),
        ),
    ];

    RowGroup::new(rows as u32, columns)
}
fn generate_trace_for_row_group(
    spans_per_trace: usize,
    timestamp: i64,
    mut column_packers: Vec<Packers>,
    rng: &mut ThreadRng,
) -> Vec<Packers> {
    let env_idx = 0;
    let data_centre_idx = 1;
    let cluster_idx = 2;
    let user_id_idx = 3;
    let request_id_idx = 4;
    let node_id_idx = 5;
    let pod_id_idx = 6;
    let trace_id_idx = 7;
    let span_id_idx = 8;
    let duration_idx = 9;
    let time_idx = 10;

    let env_value = rng.gen_range(0_u8..2);
    let env = format!("env-{:?}", env_value); // cardinality of 2.

    let data_centre_value = rng.gen_range(0_u8..10);
    let data_centre = format!("data_centre-{:?}-{:?}", env_value, data_centre_value); // cardinality of 2 * 10 = 20

    let cluster_value = rng.gen_range(0_u8..10);
    let cluster = format!(
        "cluster-{:?}-{:?}-{:?}",
        env_value,
        data_centre_value,
        cluster_value // cardinality of 2 * 10 * 10 = 200
    );

    // The user id is dependent on the cluster.
    let user_id_value = rng.gen_range(0_u32..1000);
    let user_id = format!(
        "uid-{:?}-{:?}-{:?}-{:?}",
        env_value,
        data_centre_value,
        cluster_value,
        user_id_value // cardinality of 2 * 10 * 10 * 1000 = 200,000
    );

    let request_id_value = rng.gen_range(0_u32..10);
    let request_id = format!(
        "rid-{:?}-{:?}-{:?}-{:?}-{:?}",
        env_value,
        data_centre_value,
        cluster_value,
        user_id_value,
        request_id_value // cardinality of 2 * 10 * 10 * 1000 * 10 = 2,000,000
    );

    let trace_id = rng
        .sample_iter(&Alphanumeric)
        .map(char::from)
        .take(8)
        .collect::<String>();

    // The trace should move across hosts, which in this setup means across
    // nodes and pods.
    let normal = Normal::new(10.0, 5.0).unwrap();
    let node_id_prefix = format!("{}-{}-{}", env_value, data_centre_value, cluster_value);

    for _ in 0..spans_per_trace {
        // These values differ for each span, so they need to be generated
        // per iteration.
        let node_id = rng.gen_range(0..10); // cardinality is 2 * 10 * 10 * 10 = 2,000

        column_packers[pod_id_idx].str_packer_mut().push(format!(
            "pod_id-{}-{}-{}",
            node_id_prefix,
            node_id,
            rng.gen_range(0..10) // cardinality is 2 * 10 * 10 * 10 * 10 = 20,000
        ));

        column_packers[node_id_idx]
            .str_packer_mut()
            .push(format!("node_id-{}-{}", node_id_prefix, node_id));

        // Randomly generate a span_id.
        column_packers[span_id_idx].str_packer_mut().push(
            rng.sample_iter(&Alphanumeric)
                .map(char::from)
                .take(8)
                .collect::<String>(),
        );

        // Randomly generate span durations: ~N(10ms, 5ms), stored in
        // nanoseconds.
        column_packers[duration_idx].i64_packer_mut().push(
            (normal.sample(rng) * ONE_MS as f64)
                .max(ONE_MS as f64) // minimum duration is 1ms
                .round() as i64,
        );
    }

    // These values are the same for every span in the trace.
    column_packers[env_idx]
        .str_packer_mut()
        .fill_with(env, spans_per_trace);
    column_packers[data_centre_idx]
        .str_packer_mut()
        .fill_with(data_centre, spans_per_trace);
    column_packers[cluster_idx]
        .str_packer_mut()
        .fill_with(cluster, spans_per_trace);
    column_packers[user_id_idx]
        .str_packer_mut()
        .fill_with(user_id, spans_per_trace);
    column_packers[request_id_idx]
        .str_packer_mut()
        .fill_with(request_id, spans_per_trace);
    column_packers[trace_id_idx]
        .str_packer_mut()
        .fill_with(trace_id, spans_per_trace);
    column_packers[time_idx]
        .i64_packer_mut()
        .fill_with(timestamp, spans_per_trace);

    column_packers
}
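
Taken together, the helpers above are enough to drive `read_filter` by hand outside the bench harness. A minimal sketch reusing the same calls as `read_filter()` at the top of the file (the row count and predicate value here are illustrative):

// Build a chunk exactly as the benchmark setup does, then run one predicate
// query and inspect the materialised results.
let mut rng = rand::thread_rng();
let mut chunk = Chunk::new(22, read_buffer::ChunkMetrics::new_unregistered());
read_buffer::benchmarks::upsert_table_with_row_group(
    &mut chunk,
    "table",
    generate_row_group(10_000, &mut rng),
);

let predicate = Predicate::with_time_range(
    &[BinaryExpr::from(("env", "=", "env-0"))],
    i64::MIN,
    i64::MAX,
);
for batch in chunk.read_filter("table", predicate, Selection::All).unwrap() {
    println!("{} rows x {} columns", batch.num_rows(), batch.num_columns());
}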


@@ -25,6 +25,15 @@ pub mod benchmarks {
         cmp::Operator, encoding::scalar::Fixed, encoding::scalar::FixedNull, encoding::string,
         Column, RowIDs,
     };
     pub use crate::row_group::{ColumnType, RowGroup};
+    use crate::Chunk;
+
+    // Allow external benchmarks to use this crate-only test method.
+    pub fn upsert_table_with_row_group(
+        chunk: &mut Chunk,
+        table_name: impl Into<String>,
+        row_group: RowGroup,
+    ) {
+        chunk.upsert_table_with_row_group(table_name, row_group)
+    }
 }
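
The pattern in this last hunk is worth noting: benchmark targets under `benches/` compile as separate crates, so they cannot call crate-private methods directly; the public `benchmarks` module re-exports internals behind a thin wrapper instead. A minimal sketch of the pattern in isolation (the `table` module and its names are illustrative, not from this commit):

mod table {
    pub struct Table;

    impl Table {
        // Crate-private: visible inside the library, but not to `benches/`.
        pub(crate) fn row_count(&self) -> usize {
            0
        }
    }
}

// Public, benchmark-facing surface that forwards to the crate-only method.
pub mod benchmarks {
    pub use crate::table::Table;

    pub fn table_row_count(table: &Table) -> usize {
        table.row_count()
    }
}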