influxdb/tests/end_to_end_cases/write_api.rs

353 lines
11 KiB
Rust

use influxdb_iox_client::write::WriteError;
use test_helpers::assert_contains;
use crate::common::server_fixture::ServerFixture;
use super::scenario::{create_readable_database, rand_name};
use arrow_deps::assert_batches_sorted_eq;
use generated_types::influxdata::iox::management::v1::{
node_group::Node, HashRing, Matcher, MatcherToShard, NodeGroup, ShardConfig,
};
use influxdb_line_protocol::parse_lines;
use internal_types::entry::lines_to_sharded_entries;
use internal_types::entry::test_helpers::{partitioner, sharder};
use std::collections::HashMap;
use std::num::NonZeroU32;
#[tokio::test]
async fn test_write() {
let fixture = ServerFixture::create_shared().await;
let mut write_client = fixture.write_client();
let db_name = rand_name();
create_readable_database(&db_name, fixture.grpc_channel()).await;
// ---- test successful writes ----
let lp_lines = vec![
"cpu,region=west user=23.2 100",
"cpu,region=west user=21.0 150",
"disk,region=east bytes=99i 200",
];
let num_lines_written = write_client
.write(&db_name, lp_lines.join("\n"))
.await
.expect("cannot write");
assert_eq!(num_lines_written, 3);
// ---- test bad data ----
let err = write_client
.write(&db_name, "XXX")
.await
.expect_err("expected write to fail");
assert_contains!(
err.to_string(),
r#"Client specified an invalid argument: Violation for field "lp_data": Invalid Line Protocol: A generic parsing error occurred"#
);
assert!(matches!(dbg!(err), WriteError::ServerError(_)));
// ---- test non existent database ----
let err = write_client
.write("Non_existent_database", lp_lines.join("\n"))
.await
.expect_err("expected write to fail");
assert_contains!(
err.to_string(),
r#"Unexpected server error: Some requested entity was not found: Resource database/Non_existent_database not found"#
);
assert!(matches!(dbg!(err), WriteError::ServerError(_)));
// ---- test hard limit ----
// stream data until limit is reached
let mut maybe_err = None;
for i in 0..1_000 {
let lp_lines: Vec<_> = (0..1_000)
.map(|j| format!("flood,tag1={},tag2={} x={},y={} 0", i, j, i, j))
.collect();
if let Err(err) = write_client.write(&db_name, lp_lines.join("\n")).await {
maybe_err = Some(err);
break;
}
}
assert!(maybe_err.is_some());
let err = maybe_err.unwrap();
let WriteError::ServerError(status) = dbg!(err);
assert_eq!(status.code(), tonic::Code::ResourceExhausted);
// IMPORTANT: At this point, the database is flooded and pretty much
// useless. Don't append any tests after the "hard limit" test!
}
#[tokio::test]
async fn test_write_entry() {
let fixture = ServerFixture::create_shared().await;
let mut write_client = fixture.write_client();
let db_name = rand_name();
create_readable_database(&db_name, fixture.grpc_channel()).await;
let lp_data = vec!["cpu bar=1 10", "cpu bar=2 20"].join("\n");
let lines: Vec<_> = parse_lines(&lp_data).map(|l| l.unwrap()).collect();
let sharded_entries =
lines_to_sharded_entries(&lines, sharder(1).as_ref(), &partitioner(1)).unwrap();
let entry: Vec<u8> = sharded_entries.into_iter().next().unwrap().entry.into();
write_client.write_entry(&db_name, entry).await.unwrap();
let mut query_results = fixture
.flight_client()
.perform_query(&db_name, "select * from cpu")
.await
.unwrap();
let mut batches = Vec::new();
while let Some(data) = query_results.next().await.unwrap() {
batches.push(data);
}
let expected = vec![
"+-----+-------------------------------+",
"| bar | time |",
"+-----+-------------------------------+",
"| 1 | 1970-01-01 00:00:00.000000010 |",
"| 2 | 1970-01-01 00:00:00.000000020 |",
"+-----+-------------------------------+",
];
assert_batches_sorted_eq!(&expected, &batches);
}
#[tokio::test]
async fn test_write_routed() {
const TEST_ROUTER_ID: NonZeroU32 = unsafe { NonZeroU32::new_unchecked(1) };
const TEST_TARGET_ID_1: NonZeroU32 = unsafe { NonZeroU32::new_unchecked(2) };
const TEST_TARGET_ID_2: NonZeroU32 = unsafe { NonZeroU32::new_unchecked(3) };
const TEST_REMOTE_ID_1: u32 = 2;
const TEST_REMOTE_ID_2: u32 = 3;
const TEST_SHARD_ID_1: u32 = 42;
const TEST_SHARD_ID_2: u32 = 43;
let router = ServerFixture::create_single_use().await;
let mut router_mgmt = router.management_client();
router_mgmt
.update_writer_id(TEST_ROUTER_ID)
.await
.expect("set ID failed");
let target_1 = ServerFixture::create_single_use().await;
let mut target_1_mgmt = target_1.management_client();
target_1_mgmt
.update_writer_id(TEST_TARGET_ID_1)
.await
.expect("set ID failed");
router_mgmt
.update_remote(TEST_REMOTE_ID_1, target_1.grpc_base())
.await
.expect("set remote failed");
let target_2 = ServerFixture::create_single_use().await;
let mut target_2_mgmt = target_2.management_client();
target_2_mgmt
.update_writer_id(TEST_TARGET_ID_2)
.await
.expect("set ID failed");
router_mgmt
.update_remote(TEST_REMOTE_ID_2, target_2.grpc_base())
.await
.expect("set remote failed");
let db_name = rand_name();
create_readable_database(&db_name, router.grpc_channel()).await;
create_readable_database(&db_name, target_1.grpc_channel()).await;
create_readable_database(&db_name, target_2.grpc_channel()).await;
// Set sharding rules on the router:
let mut router_db_rules = router_mgmt
.get_database(&db_name)
.await
.expect("cannot get database on router");
router_db_rules.shard_config = Some(ShardConfig {
specific_targets: Some(MatcherToShard {
matcher: Some(Matcher {
table_name_regex: "^cpu$".to_string(),
..Default::default()
}),
shard: TEST_SHARD_ID_1,
}),
hash_ring: Some(HashRing {
table_name: true,
shards: vec![TEST_SHARD_ID_2],
..Default::default()
}),
shards: vec![
(
TEST_SHARD_ID_1,
NodeGroup {
nodes: vec![Node {
id: TEST_REMOTE_ID_1,
}],
},
),
(
TEST_SHARD_ID_2,
NodeGroup {
nodes: vec![Node {
id: TEST_REMOTE_ID_2,
}],
},
),
]
.into_iter()
.collect::<HashMap<_, _>>(),
..Default::default()
});
router_mgmt
.update_database(router_db_rules)
.await
.expect("cannot update router db rules");
// Write some data
let mut write_client = router.write_client();
let lp_lines = vec!["cpu bar=1 100", "cpu bar=2 200", "disk bar=3 300"];
let num_lines_written = write_client
.write(&db_name, lp_lines.join("\n"))
.await
.expect("cannot write");
assert_eq!(num_lines_written, 3);
// The router will have split the write request by table name into two shards.
// Target 1 will have received only the "cpu" table.
// Target 2 will have received only the "disk" table.
let mut query_results = target_1
.flight_client()
.perform_query(&db_name, "select * from cpu")
.await
.expect("failed to query target 1");
let mut batches = Vec::new();
while let Some(data) = query_results.next().await.unwrap() {
batches.push(data);
}
let expected = vec![
"+-----+-------------------------------+",
"| bar | time |",
"+-----+-------------------------------+",
"| 1 | 1970-01-01 00:00:00.000000100 |",
"| 2 | 1970-01-01 00:00:00.000000200 |",
"+-----+-------------------------------+",
];
assert_batches_sorted_eq!(&expected, &batches);
assert!(target_1
.flight_client()
.perform_query(&db_name, "select * from disk")
.await
.unwrap_err()
.to_string()
.contains("Table or CTE with name \\\'disk\\\' not found\""));
let mut query_results = target_2
.flight_client()
.perform_query(&db_name, "select * from disk")
.await
.expect("failed to query target 2");
let mut batches = Vec::new();
while let Some(data) = query_results.next().await.unwrap() {
batches.push(data);
}
let expected = vec![
"+-----+-------------------------------+",
"| bar | time |",
"+-----+-------------------------------+",
"| 3 | 1970-01-01 00:00:00.000000300 |",
"+-----+-------------------------------+",
];
assert_batches_sorted_eq!(&expected, &batches);
assert!(target_2
.flight_client()
.perform_query(&db_name, "select * from cpu")
.await
.unwrap_err()
.to_string()
.contains("Table or CTE with name \\\'cpu\\\' not found\""));
}
#[tokio::test]
async fn test_write_routed_errors() {
const TEST_ROUTER_ID: NonZeroU32 = unsafe { NonZeroU32::new_unchecked(1) };
const TEST_REMOTE_ID: u32 = 2;
const TEST_SHARD_ID: u32 = 42;
let router = ServerFixture::create_single_use().await;
let mut router_mgmt = router.management_client();
router_mgmt
.update_writer_id(TEST_ROUTER_ID)
.await
.expect("set ID failed");
let db_name = rand_name();
create_readable_database(&db_name, router.grpc_channel()).await;
// Set sharding rules on the router:
let mut router_db_rules = router_mgmt
.get_database(&db_name)
.await
.expect("cannot get database on router");
router_db_rules.shard_config = Some(ShardConfig {
specific_targets: Some(MatcherToShard {
matcher: Some(Matcher {
table_name_regex: "^cpu$".to_string(),
..Default::default()
}),
shard: TEST_SHARD_ID,
}),
shards: vec![(
TEST_SHARD_ID,
NodeGroup {
nodes: vec![Node { id: TEST_REMOTE_ID }],
},
)]
.into_iter()
.collect::<HashMap<_, _>>(),
..Default::default()
});
router_mgmt
.update_database(router_db_rules)
.await
.expect("cannot update router db rules");
// We intentionally omit to configure the "remotes" name resolution on the
// router server.
let mut write_client = router.write_client();
let lp_lines = vec!["cpu bar=1 100", "cpu bar=2 200"];
let err = write_client
.write(&db_name, lp_lines.join("\n"))
.await
.unwrap_err();
assert_eq!(
err.to_string(),
format!(
"Unexpected server error: Some requested entity was not found: Resource remote/[{}] not found",
TEST_REMOTE_ID
)
);
// TODO(mkm): check connection error and successful communication with a
// target that replies with an error...
}