feat: Set up CLI for compactor generate

pull/24376/head
Carol (Nichols || Goulding) 2022-09-21 14:22:52 -04:00
parent da697815ff
commit d2dd38c2cf
No known key found for this signature in database
GPG Key ID: E907EE5A736F87D4
3 changed files with 114 additions and 1 deletions

View File

@ -1,3 +1,4 @@
use clap::ValueEnum;
use clap_blocks::{ use clap_blocks::{
catalog_dsn::CatalogDsnConfig, catalog_dsn::CatalogDsnConfig,
compactor::CompactorOnceConfig, compactor::CompactorOnceConfig,
@ -9,7 +10,7 @@ use ioxd_compactor::build_compactor_from_config;
use object_store::DynObjectStore; use object_store::DynObjectStore;
use object_store_metrics::ObjectStoreMetrics; use object_store_metrics::ObjectStoreMetrics;
use snafu::prelude::*; use snafu::prelude::*;
use std::sync::Arc; use std::{num::NonZeroUsize, sync::Arc};
#[derive(Debug, clap::Parser)] #[derive(Debug, clap::Parser)]
pub struct Config { pub struct Config {
@ -39,6 +40,74 @@ pub enum Command {
)] )]
query_exec_thread_count: usize, query_exec_thread_count: usize,
}, },
/// Generate Parquet files and catalog entries with different characteristics for the purposes
/// of investigating how the compactor handles them.
Generate {
#[clap(flatten)]
object_store_config: ObjectStoreConfig,
#[clap(flatten)]
catalog_dsn: CatalogDsnConfig,
/// The type of compaction to be done on the files. If `hot` is specified, the generated
/// files will have compaction level 0. If `cold` is specified, the generated files will
/// have compaction level 1 and will be marked that they were created at least 8 hours ago.
#[clap(
arg_enum,
value_parser,
long = "--compaction-type",
env = "INFLUXDB_IOX_COMPACTOR_GENERATE_TYPE",
default_value = "hot",
action
)]
compaction_type: CompactionType,
/// The number of IOx partitions to generate files for. Each partition will have the number
/// of files specified by `--num-files` generated.
#[clap(
long = "--num-partitions",
env = "INFLUXDB_IOX_COMPACTOR_GENERATE_NUM_PARTITIONS",
default_value = "1",
action
)]
num_partitions: NonZeroUsize,
/// The number of parquet files to generate per partition.
#[clap(
long = "--num-files",
env = "INFLUXDB_IOX_COMPACTOR_GENERATE_NUM_FILES",
default_value = "1",
action
)]
num_files: NonZeroUsize,
/// The number of columns to generate in each file. One column will always be the
/// timestamp. Additional columns will be given a type in I64, F64, U64, String, Bool, and
/// Tag in equal proportion.
#[clap(
long = "--num-cols",
env = "INFLUXDB_IOX_COMPACTOR_GENERATE_NUM_COLS",
default_value = "7",
action
)]
num_columns: NonZeroUsize,
/// The number of rows to generate in each file.
#[clap(
long = "--num-rows",
env = "INFLUXDB_IOX_COMPACTOR_GENERATE_NUM_ROWS",
default_value = "1",
action
)]
num_rows: NonZeroUsize,
},
}
#[derive(Debug, Copy, Clone, PartialEq, Eq, PartialOrd, Ord, ValueEnum)]
pub enum CompactionType {
Hot,
Cold,
} }
pub async fn command(config: Config) -> Result<()> { pub async fn command(config: Config) -> Result<()> {
@ -82,6 +151,7 @@ pub async fn command(config: Config) -> Result<()> {
compactor::handler::run_compactor_once(compactor).await; compactor::handler::run_compactor_once(compactor).await;
} }
Command::Generate { .. } => {}
} }
Ok(()) Ok(())

View File

@ -0,0 +1,42 @@
use assert_cmd::Command;
use predicates::prelude::*;
use test_helpers_end_to_end::maybe_skip_integration;
#[tokio::test]
async fn compactor_generate_has_defaults() {
let database_url = maybe_skip_integration!();
Command::cargo_bin("influxdb_iox")
.unwrap()
.arg("compactor")
.arg("generate")
.arg("--catalog-dsn")
.arg(database_url)
.assert()
.success();
}
#[tokio::test]
async fn compactor_generate_zeroes_are_invalid() {
let database_url = maybe_skip_integration!();
Command::cargo_bin("influxdb_iox")
.unwrap()
.arg("compactor")
.arg("generate")
.arg("--catalog-dsn")
.arg(database_url)
.arg("--num-partitions")
.arg("0")
.arg("--num-files")
.arg("0")
.arg("--num-cols")
.arg("0")
.arg("--num-rows")
.arg("0")
.assert()
.failure()
.stderr(predicate::str::contains(
"number would be zero for non-zero type",
));
}

View File

@ -3,6 +3,7 @@ mod all_in_one;
// loading shared libraries: libjemalloc.so.2: cannot open shared object file: No such file or directory" // loading shared libraries: libjemalloc.so.2: cannot open shared object file: No such file or directory"
#[cfg(not(feature = "heappy"))] #[cfg(not(feature = "heappy"))]
mod cli; mod cli;
mod compactor;
mod debug; mod debug;
mod error; mod error;
mod ingester; mod ingester;