test(bench): ingester2 write benchmarks
Adds single-line and batched write request benchmarks to ingester2. When using the WAL, a floor of 10ms is added to all writes (the WAL linger time, which is configurable). With the WAL disabled in code, benchmarked writes complete in less than a millisecond: single row/write time: [1.9138 µs 1.9168 µs 1.9197 µs] thrpt: [520.92 Kelem/s 521.70 Kelem/s 522.51 Kelem/s] batched/write/1000 time: [129.15 µs 129.97 µs 131.28 µs] thrpt: [7.6173 Melem/s 7.6941 Melem/s 7.7429 Melem/s] Note these benchmarks exclude network I/O, and measure single-threaded, synchronous write client performance.
pull/24376/head
parent
02c7ec0727
commit
dd92459c41
|
@@ -75,3 +75,8 @@ name = "wal"
harness = false
# Require some internal types be made visible for benchmark code.
required-features = ["benches"]

[[bench]]
name = "write"
harness = false
# Require some internal types be made visible for benchmark code.
|
@ -0,0 +1,140 @@
|
|||
use std::sync::Arc;
|
||||
|
||||
use criterion::{criterion_group, criterion_main, BenchmarkId, Criterion, Throughput};
|
||||
use data_types::{PartitionKey, Sequence, SequenceNumber, ShardIndex};
|
||||
use dml::{DmlMeta, DmlWrite};
|
||||
use futures::{stream::FuturesUnordered, StreamExt};
|
||||
use generated_types::influxdata::{
|
||||
iox::ingester::v1::write_service_server::WriteService, pbdata::v1::DatabaseBatch,
|
||||
};
|
||||
use influxdb_iox_client::ingester::generated_types::WriteRequest;
|
||||
use ingester2::IngesterRpcInterface;
|
||||
use ingester2_test_ctx::{TestContext, TestContextBuilder};
|
||||
use iox_time::TimeProvider;
|
||||
use mutable_batch_lp::lines_to_batches;
|
||||
use mutable_batch_pb::encode::encode_write;
|
||||
|
||||
// Namespace that all benchmark writes target.
const TEST_NAMESPACE: &str = "bananas";
|
||||
// Partition key applied to all benchmark writes.
const PARTITION_KEY: &str = "platanos";
|
||||
|
||||
/// Return an initialised and pre-warmed ingester instance backed by a catalog
|
||||
/// correctly populated to accept writes of `lp`.
|
||||
async fn init(lp: impl AsRef<str>) -> (TestContext<impl IngesterRpcInterface>, DatabaseBatch) {
|
||||
let lp = lp.as_ref();
|
||||
|
||||
let mut ctx = TestContextBuilder::default()
|
||||
// Don't stop ingest during benchmarks
|
||||
.with_max_persist_queue_depth(10_000_000)
|
||||
.with_persist_hot_partition_cost(10_000_000_000)
|
||||
.build()
|
||||
.await;
|
||||
|
||||
// Ensure the namespace exists in the catalog.
|
||||
let ns = ctx.ensure_namespace(TEST_NAMESPACE, None).await;
|
||||
|
||||
// Perform a write to drive table / schema population in the catalog.
|
||||
ctx.write_lp(TEST_NAMESPACE, lp, PartitionKey::from(PARTITION_KEY), 42)
|
||||
.await;
|
||||
|
||||
// Construct the write request once, and reuse it for each iteration.
|
||||
let batches = lines_to_batches(lp, 0).unwrap();
|
||||
|
||||
// Build the TableId -> Batch map, resolving the tables IDs from the catalog
|
||||
// in the process.
|
||||
let batches_by_ids = batches
|
||||
.into_iter()
|
||||
.map(|(table_name, batch)| {
|
||||
let catalog = Arc::clone(&ctx.catalog());
|
||||
async move {
|
||||
let id = catalog
|
||||
.repositories()
|
||||
.await
|
||||
.tables()
|
||||
.create_or_get(table_name.as_str(), ns.id)
|
||||
.await
|
||||
.expect("table should create OK")
|
||||
.id;
|
||||
|
||||
(id, batch)
|
||||
}
|
||||
})
|
||||
.collect::<FuturesUnordered<_>>()
|
||||
.collect::<hashbrown::HashMap<_, _>>()
|
||||
.await;
|
||||
|
||||
let op = DmlWrite::new(
|
||||
ns.id,
|
||||
batches_by_ids,
|
||||
PartitionKey::from(PARTITION_KEY),
|
||||
DmlMeta::sequenced(
|
||||
Sequence::new(ShardIndex::new(42), SequenceNumber::new(42)),
|
||||
iox_time::SystemProvider::new().now(),
|
||||
None,
|
||||
50,
|
||||
),
|
||||
);
|
||||
|
||||
(ctx, encode_write(ns.id.get(), &op))
|
||||
}
|
||||
|
||||
/// Benchmark writes containing varying volumes of line protocol.
|
||||
///
|
||||
/// This is definitely a more "macro" benchmark than micro, as it covers the
|
||||
/// entire ingester write process (RPC request handler, RPC message
|
||||
/// deserialisation, WAL commit, buffering write, RPC response, etc) but does
|
||||
/// not include transport overhead (measuring only the processing time, not
|
||||
/// including the network read time).
|
||||
///
|
||||
/// Note that this benchmark covers the single threaded / uncontended case - as
|
||||
/// the number of parallel writes increases, so does the lock contention on the
|
||||
/// underlying buffer tree.
|
||||
fn bench_write(c: &mut Criterion) {
|
||||
let runtime = tokio::runtime::Builder::new_multi_thread()
|
||||
.enable_all()
|
||||
.build()
|
||||
.expect("failed to initialise tokio runtime for benchmark");
|
||||
|
||||
{
|
||||
let (ctx, op) = runtime.block_on(init("bananas greatness=\"unbounded\" 42"));
|
||||
let rpc = ctx.rpc();
|
||||
|
||||
let mut group = c.benchmark_group("single row");
|
||||
group.throughput(Throughput::Elements(1));
|
||||
group.bench_function("write", |b| {
|
||||
b.to_async(&runtime).iter(|| {
|
||||
let op = op.clone();
|
||||
async move {
|
||||
rpc.write_service()
|
||||
.write(tonic::Request::new(WriteRequest { payload: Some(op) }))
|
||||
.await
|
||||
.unwrap();
|
||||
}
|
||||
});
|
||||
});
|
||||
}
|
||||
|
||||
{
|
||||
let lp = std::fs::read_to_string("../test_fixtures/lineproto/metrics.lp").unwrap();
|
||||
let line_count = lp.lines().count() as u64;
|
||||
|
||||
let (ctx, op) = runtime.block_on(init(lp));
|
||||
let rpc = ctx.rpc();
|
||||
|
||||
let mut group = c.benchmark_group("batched");
|
||||
group.throughput(Throughput::Elements(line_count));
|
||||
group.bench_function(BenchmarkId::new("write", line_count), |b| {
|
||||
b.to_async(&runtime).iter(|| {
|
||||
let op = op.clone();
|
||||
async move {
|
||||
rpc.write_service()
|
||||
.write(tonic::Request::new(WriteRequest { payload: Some(op) }))
|
||||
.await
|
||||
.unwrap();
|
||||
}
|
||||
});
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
// Register the write benchmark with criterion's harness.
criterion_group!(benches, bench_write);
|
||||
// Generate the main() entry point (the bench target sets `harness = false`).
criterion_main!(benches);
|
Loading…
Reference in New Issue