influxdb/wal/tests/end_to_end.rs

use data_types::{NamespaceId, SequenceNumber, TableId};
use dml::DmlWrite;
use generated_types::influxdata::{
    iox::wal::v1::sequenced_wal_op::Op as WalOp,
    pbdata::v1::{DatabaseBatch, TableBatch},
};
use mutable_batch_lp::lines_to_batches;
use tokio::sync::watch;
use wal::{SequencedWalOp, WriteResult, WriteSummary};

/// Walks a single segment through its whole lifecycle: two writes into the open segment, a
/// rotation that closes it, reading both entries back, and finally deleting the segment.
#[tokio::test]
async fn crud() {
    let dir = test_helpers::tmp_dir().unwrap();
    let wal = wal::Wal::new(dir.path()).await.unwrap();

    // A brand-new WAL must not report any closed segments.
    let closed = wal.closed_segments();
    assert!(
        closed.is_empty(),
        "Expected empty closed segments; got {closed:?}"
    );

    // The first write goes to the open segment.
    let first_write = unwrap_summary(wal.write_op(arbitrary_sequenced_wal_op([42, 43]))).await;
    assert_eq!(first_write.total_bytes, 140);
    assert_eq!(first_write.bytes_written, 124);

    // The second write is the same size, and the running total grows by exactly that amount.
    let second_write = unwrap_summary(wal.write_op(arbitrary_sequenced_wal_op([44, 45]))).await;
    assert_eq!(second_write.total_bytes, 264);
    assert_eq!(second_write.bytes_written, 124);

    // Writing alone never closes a segment.
    let closed = wal.closed_segments();
    assert!(
        closed.is_empty(),
        "Expected empty closed segments; got {closed:?}"
    );

    // Entries in the open segment are not readable; rotating closes it and reports the
    // sequence numbers it contained.
    let (closed_segment_details, ids) = wal.rotate().unwrap();
    assert_eq!(closed_segment_details.size(), 264);
    assert_eq!(
        ids.iter().collect::<Vec<_>>(),
        [42, 43, 44, 45].map(SequenceNumber::new)
    );

    // Exactly one closed segment exists now: the one just rotated out.
    let closed = wal.closed_segments();
    let closed_segment_ids: Vec<_> = closed.iter().map(|c| c.id()).collect();
    assert_eq!(closed_segment_ids, &[closed_segment_details.id()]);

    // Each read yields one batch of ops; the first op of each batch must carry the per-table
    // sequence numbers it was written with. The map's value order is unspecified, so sort
    // before comparing.
    let mut reader = wal.reader_for_segment(closed_segment_details.id()).unwrap();
    for expected in [vec![42_u64, 43], vec![44, 45]] {
        let mut ops = reader.next().unwrap().unwrap();
        let mut got_sequence_numbers: Vec<_> = ops
            .remove(0)
            .table_write_sequence_numbers
            .into_values()
            .collect();
        got_sequence_numbers.sort();
        assert_eq!(got_sequence_numbers, expected);
    }

    // Deleting the segment brings the WAL back to having no closed segments.
    wal.delete(closed_segment_details.id()).await.unwrap();
    let closed = wal.closed_segments();
    assert!(
        closed.is_empty(),
        "Expected empty closed segments; got {closed:?}"
    );
}

/// Verifies that a WAL re-opened on an existing directory exposes every file found there
/// (including the segment that was still open when the previous instance was dropped) as a
/// closed segment with its entries intact.
#[tokio::test]
async fn replay() {
    let dir = test_helpers::tmp_dir().unwrap();

    // First WAL instance: one entry in a segment that gets rotated (closed), then one more
    // entry in the new open segment. The instance is dropped at the end of this scope.
    {
        let wal = wal::Wal::new(dir.path()).await.unwrap();
        let _ = unwrap_summary(wal.write_op(arbitrary_sequenced_wal_op([42]))).await;
        wal.rotate().unwrap();
        let _ = unwrap_summary(wal.write_op(arbitrary_sequenced_wal_op([43, 44]))).await;
    }

    // Second WAL instance over the same directory replays from the files on disk.
    let wal = wal::Wal::new(dir.path()).await.unwrap();

    // Both the previously closed and the previously open segment show up as closed: after a
    // restart nothing is writing to either file any more.
    let closed = wal.closed_segments();
    let closed_segment_ids: Vec<_> = closed.iter().map(|c| c.id()).collect();
    assert_eq!(closed_segment_ids.len(), 2);

    // Segment 0 is the one that was rotated, segment 1 the one that was still open. The first
    // op read from each must carry the per-table sequence numbers it was written with.
    let expectations = [
        (closed_segment_ids[0], vec![42_u64]),
        (closed_segment_ids[1], vec![43, 44]),
    ];
    for (segment_id, expected) in expectations {
        let mut reader = wal.reader_for_segment(segment_id).unwrap();
        let mut ops = reader.next().unwrap().unwrap();
        let mut got_sequence_numbers: Vec<_> = ops
            .remove(0)
            .table_write_sequence_numbers
            .into_values()
            .collect();
        // Map value order is unspecified; normalise before comparing.
        got_sequence_numbers.sort();
        assert_eq!(got_sequence_numbers, expected);
    }
}

/// Verifies that segment ids reflect creation order across a restart, and that segments
/// created after replay continue the numbering rather than reusing earlier ids.
#[tokio::test]
async fn ordering() {
    let dir = test_helpers::tmp_dir().unwrap();

    // First WAL instance: two rotated (closed) segments plus an open one, each holding an
    // entry. The instance is dropped at the end of this scope.
    {
        let wal = wal::Wal::new(dir.path()).await.unwrap();

        let _ = unwrap_summary(wal.write_op(arbitrary_sequenced_wal_op([42, 43]))).await;
        let (_, ids) = wal.rotate().unwrap();
        assert_eq!(
            ids.iter().collect::<Vec<_>>(),
            [42, 43].map(SequenceNumber::new)
        );

        let _ = unwrap_summary(wal.write_op(arbitrary_sequenced_wal_op([44]))).await;
        let (_, ids) = wal.rotate().unwrap();
        assert_eq!(ids.iter().collect::<Vec<_>>(), [SequenceNumber::new(44)]);

        let _ = unwrap_summary(wal.write_op(arbitrary_sequenced_wal_op([45]))).await;
    }

    // Second WAL instance over the same directory replays from the files on disk.
    let wal = wal::Wal::new(dir.path()).await.unwrap();

    // All three files (two closed, one formerly open) are reported, in creation order.
    let closed = wal.closed_segments();
    let closed_segment_ids: Vec<_> = closed.iter().map(|c| c.id().get()).collect();
    assert_eq!(closed_segment_ids, &[0, 1, 2]);

    // The segment opened by the replayed WAL takes the next id (3), and every segment created
    // afterwards keeps counting up (4). Nothing was written to either, so both rotate out
    // with an empty set of sequence numbers.
    for expected_id in [3, 4] {
        let (closed_segment_details, ids) = wal.rotate().unwrap();
        assert_eq!(closed_segment_details.id().get(), expected_id);
        assert!(ids.is_empty());
    }
}

/// Builds a [`SequencedWalOp`] holding a write with one line of line protocol per entry in
/// `sequence_numbers`.
///
/// Line `idx` targets its own measurement (`m0`, `m1`, ...), so the resulting write is expected
/// to contain one table batch per sequence number. The table batches, which [`test_data`]
/// returns sorted by table id, are paired positionally with the sequence numbers to form the
/// `table_write_sequence_numbers` map.
fn arbitrary_sequenced_wal_op<I: IntoIterator<Item = u64>>(sequence_numbers: I) -> SequencedWalOp {
    let sequence_numbers = sequence_numbers.into_iter().collect::<Vec<_>>();

    // Only the position of each sequence number matters for the line protocol text, so
    // generate the lines from the index range and collect them straight into one `String`.
    let lp = (0..sequence_numbers.len())
        .map(|idx| format!("m{},t=foo v=1i 1\n", idx))
        .collect::<String>();
    let w = test_data(&lp);

    // Built before `w` is moved into the op below. `zip` stops at the shorter side, so a
    // mismatch between table count and sequence-number count silently drops the excess.
    let table_write_sequence_numbers = w
        .table_batches
        .iter()
        .zip(&sequence_numbers)
        .map(|(table_batch, &id)| (TableId::new(table_batch.table_id), id))
        .collect();

    SequencedWalOp {
        table_write_sequence_numbers,
        op: WalOp::Write(w),
    }
}

/// Parses `lp` as line protocol and encodes it as a [`DatabaseBatch`] with a deterministic
/// layout: table batches ordered by table id and, within each table, columns ordered by name.
///
/// Table ids are synthetic: each parsed batch receives its position in the iteration order of
/// the `lines_to_batches` output as its id. Panics if `lp` cannot be parsed.
fn test_data(lp: &str) -> DatabaseBatch {
    let batches = lines_to_batches(lp, 0)
        .unwrap()
        .into_iter()
        .enumerate()
        .map(|(i, (_table_name, batch))| (TableId::new(i as _), batch))
        .collect();

    let write = DmlWrite::new(
        NamespaceId::new(42),
        batches,
        "bananas".into(),
        Default::default(),
    );

    // `encode_write` makes no promise about the order of tables or columns, so both are
    // sorted below to keep the tests deterministic.
    let DatabaseBatch {
        database_id,
        partition_key,
        mut table_batches,
    } = mutable_batch_pb::encode::encode_write(42, &write);

    for table_batch in &mut table_batches {
        table_batch
            .columns
            .sort_by(|a, b| a.column_name.cmp(&b.column_name));
    }
    table_batches.sort_by_key(|t| t.table_id);

    DatabaseBatch {
        database_id,
        partition_key,
        table_batches,
    }
}

/// Waits for the write result to be published on `res` and returns its [`WriteSummary`].
///
/// # Panics
///
/// Panics if waiting on the channel fails, if the published value is still `None`, or if the
/// write itself reported an error.
async fn unwrap_summary(mut res: watch::Receiver<Option<WriteResult>>) -> WriteSummary {
    res.changed().await.unwrap();

    // Clone the value out of the channel so the borrow is released before matching on it.
    let outcome = res.borrow().clone().unwrap();
    match outcome {
        WriteResult::Err(err) => panic!("error getting write summary: {err}"),
        WriteResult::Ok(summary) => summary,
    }
}