397 lines
12 KiB
Rust
397 lines
12 KiB
Rust
use std::fs;
|
|
use std::fs::File;
|
|
use std::io::{BufReader, Read};
|
|
use std::path::Path;
|
|
|
|
use assert_cmd::assert::Assert;
|
|
use assert_cmd::Command;
|
|
use predicates::prelude::*;
|
|
|
|
/// Validates that p is a valid parquet file
|
|
fn validate_parquet_file(p: &Path) {
|
|
// Verify file extension is parquet
|
|
let file_extension = p
|
|
.extension()
|
|
.map_or(String::from(""), |ext| ext.to_string_lossy().to_string());
|
|
assert_eq!(file_extension, "parquet");
|
|
|
|
// TODO: verify we can decode the contents of the parquet file and
|
|
// it is as expected. For now, just use a check against the magic
|
|
// `PAR1` bytes all parquet files start with.
|
|
let mut reader = BufReader::new(File::open(p).expect("Error reading file"));
|
|
|
|
let mut first_four = [0; 4];
|
|
reader
|
|
.read_exact(&mut first_four)
|
|
.expect("Error reading first four bytes");
|
|
assert_eq!(&first_four, b"PAR1");
|
|
}
|
|
|
|
#[test]
|
|
fn convert_bad_input_filename() {
|
|
let mut cmd = Command::cargo_bin("influxdb_iox").unwrap();
|
|
let assert = cmd
|
|
.arg("-v")
|
|
.arg("convert")
|
|
.arg("non_existent_input.lp")
|
|
.arg("non_existent_output")
|
|
.assert();
|
|
|
|
assert
|
|
.failure()
|
|
.code(1)
|
|
.stderr(predicate::str::contains(
|
|
"Error opening non_existent_input.lp",
|
|
))
|
|
.stderr(predicate::str::contains("No such file or directory"));
|
|
}
|
|
|
|
#[test]
|
|
fn convert_bad_compression_level() {
|
|
let mut cmd = Command::cargo_bin("influxdb_iox").unwrap();
|
|
let assert = cmd
|
|
.arg("-v")
|
|
.arg("convert")
|
|
.arg("--compression-level")
|
|
.arg("maxxx")
|
|
.arg("tests/fixtures/lineproto/temperature.lp")
|
|
.arg("/tmp")
|
|
.assert();
|
|
|
|
assert.failure().code(1).stderr(predicate::str::contains(
|
|
"error: 'maxxx' isn't a valid value for '--compression-level <compression_level>",
|
|
));
|
|
}
|
|
|
|
#[test]
|
|
fn convert_line_protocol_good_input_filename() {
|
|
let mut cmd = Command::cargo_bin("influxdb_iox").unwrap();
|
|
|
|
let parquet_path = test_helpers::tempfile::Builder::new()
|
|
.prefix("convert_e2e")
|
|
.suffix(".parquet")
|
|
.tempfile()
|
|
.expect("error creating temp file")
|
|
.into_temp_path();
|
|
let parquet_filename_string = parquet_path.to_string_lossy().to_string();
|
|
|
|
let assert = cmd
|
|
.arg("-v")
|
|
.arg("convert")
|
|
.arg("--compression-level")
|
|
.arg("compatibility")
|
|
.arg("tests/fixtures/lineproto/temperature.lp")
|
|
.arg(&parquet_filename_string)
|
|
.assert();
|
|
|
|
let expected_success_string = format!(
|
|
"Completing writing to {} successfully",
|
|
parquet_filename_string
|
|
);
|
|
|
|
assert
|
|
.success()
|
|
.stderr(predicate::str::contains("convert starting"))
|
|
.stderr(predicate::str::contains(
|
|
"Writing output for measurement h2o_temperature",
|
|
))
|
|
.stderr(predicate::str::contains(expected_success_string));
|
|
|
|
validate_parquet_file(&parquet_path);
|
|
}
|
|
|
|
#[test]
|
|
fn convert_tsm_good_input_filename() {
|
|
//
|
|
// TODO: this needs to work for a temp directory...
|
|
//
|
|
|
|
// let mut cmd = Command::cargo_bin("influxdb_iox").unwrap();
|
|
|
|
// let tmp_dir = test_helpers::tmp_dir();
|
|
// let parquet_path = tmp_dir.unwrap().into_path().to_str().unwrap();
|
|
|
|
// // ::Builder::new()
|
|
// // .prefix("dstool_e2e_tsm")
|
|
// // .suffix(".parquet")
|
|
// // .tempfile()
|
|
// // .expect("error creating temp file")
|
|
// // .into_temp_path();
|
|
// // let parquet_filename_string =
|
|
// parquet_path.to_string_lossy().to_string();
|
|
|
|
// let assert = cmd
|
|
// .arg("convert")
|
|
// .arg("tests/fixtures/cpu_usage.tsm")
|
|
// .arg(&parquet_path)
|
|
// .assert();
|
|
|
|
// // TODO this should succeed when TSM -> parquet conversion is
|
|
// implemented. // assert
|
|
// // .failure()
|
|
// // .code(1)
|
|
// // .stderr(predicate::str::contains("Conversion failed"))
|
|
// // .stderr(predicate::str::contains(
|
|
// // "Not implemented: TSM Conversion not supported yet",
|
|
// // ));
|
|
|
|
// // TODO add better success expectations
|
|
|
|
// // let expected_success_string = format!(
|
|
// // "Completing writing to {} successfully",
|
|
// // parquet_filename_string
|
|
// // );
|
|
|
|
// // assert
|
|
// // .success()
|
|
// // .stderr(predicate::str::contains("dstool convert starting"))
|
|
// // .stderr(predicate::str::contains(
|
|
// // "Writing output for measurement h2o_temperature",
|
|
// // ))
|
|
// // .stderr(predicate::str::contains(expected_success_string));
|
|
|
|
// // validate_parquet_file(&parquet_path);
|
|
}
|
|
|
|
#[test]
|
|
fn convert_multiple_measurements() {
|
|
let mut cmd = Command::cargo_bin("influxdb_iox").unwrap();
|
|
|
|
// Create a directory
|
|
let parquet_output_path = test_helpers::tempfile::Builder::new()
|
|
.prefix("convert_multiple_e2e")
|
|
.tempdir()
|
|
.expect("error creating temp directory");
|
|
|
|
let parquet_output_dir_path = parquet_output_path.path().to_string_lossy().to_string();
|
|
|
|
let assert = cmd
|
|
.arg("-v")
|
|
.arg("convert")
|
|
.arg("tests/fixtures/lineproto/air_and_water.lp")
|
|
.arg(&parquet_output_dir_path)
|
|
.assert();
|
|
|
|
let expected_success_string = format!(
|
|
"Completing writing to {} successfully",
|
|
parquet_output_dir_path
|
|
);
|
|
|
|
assert
|
|
.success()
|
|
.stderr(predicate::str::contains("convert starting"))
|
|
.stderr(predicate::str::contains("Writing to output directory"))
|
|
.stderr(predicate::str::contains(
|
|
"Writing output for measurement h2o_temperature",
|
|
))
|
|
.stderr(predicate::str::contains(
|
|
"Writing output for measurement air_temperature",
|
|
))
|
|
.stderr(predicate::str::contains(expected_success_string));
|
|
|
|
// check that the two files have been written successfully
|
|
let mut output_files: Vec<_> = fs::read_dir(parquet_output_path.path())
|
|
.expect("reading directory")
|
|
.map(|dir_ent| {
|
|
let dir_ent = dir_ent.expect("error reading dir entry");
|
|
validate_parquet_file(&dir_ent.path());
|
|
dir_ent.file_name().to_string_lossy().to_string()
|
|
})
|
|
.collect();
|
|
|
|
// Ensure the order is consistent before comparing them
|
|
output_files.sort();
|
|
assert_eq!(
|
|
output_files,
|
|
vec!["air_temperature.parquet", "h2o_temperature.parquet"]
|
|
);
|
|
}
|
|
|
|
#[test]
|
|
fn meta_bad_input_filename() {
|
|
let mut cmd = Command::cargo_bin("influxdb_iox").unwrap();
|
|
let assert = cmd.arg("meta").arg("non_existent_input").assert();
|
|
|
|
assert
|
|
.failure()
|
|
.code(2)
|
|
.stderr(predicate::str::contains("Metadata dump failed"))
|
|
.stderr(predicate::str::contains(
|
|
"Metadata dump failed: Error opening input Unknown input type: non_existent_input has an unknown input extension",
|
|
));
|
|
}
|
|
|
|
#[test]
|
|
fn meta_non_existent_input_filename() {
|
|
let mut cmd = Command::cargo_bin("influxdb_iox").unwrap();
|
|
let assert = cmd.arg("meta").arg("non_existent_input.tsm").assert();
|
|
|
|
assert
|
|
.failure()
|
|
.code(2)
|
|
.stderr(predicate::str::contains("Metadata dump failed"))
|
|
.stderr(predicate::str::contains(
|
|
"Metadata dump failed: Error opening input Error opening non_existent_input.tsm",
|
|
));
|
|
}
|
|
|
|
#[test]
|
|
fn meta_bad_input_filename_gz() {
|
|
let mut cmd = Command::cargo_bin("influxdb_iox").unwrap();
|
|
let assert = cmd.arg("meta").arg("non_existent_input.gz").assert();
|
|
|
|
assert
|
|
.failure()
|
|
.code(2)
|
|
.stderr(predicate::str::contains("Metadata dump failed"))
|
|
.stderr(predicate::str::contains(
|
|
"Metadata dump failed: Error opening input Unknown input type: non_existent_input.gz has an unknown input extension before .gz",
|
|
));
|
|
}
|
|
|
|
// gunzip's the contents of the file at input_path into a temporary path
|
|
fn uncompress_gz(input_path: &str, output_extension: &str) -> test_helpers::tempfile::TempPath {
|
|
let gz_file = File::open(input_path).expect("Error opening input");
|
|
|
|
let output_path = test_helpers::tempfile::Builder::new()
|
|
.prefix("decompressed_e2e")
|
|
.suffix(output_extension)
|
|
.tempfile()
|
|
.expect("error creating temp file")
|
|
.into_temp_path();
|
|
|
|
let mut output_file = File::create(&output_path).expect("error opening output");
|
|
let mut decoder = flate2::read::GzDecoder::new(gz_file);
|
|
std::io::copy(&mut decoder, &mut output_file).expect("error copying stream");
|
|
output_path
|
|
}
|
|
|
|
/// Validates some of the metadata output content for this tsm file
|
|
fn assert_meta_000000000000005_000000002_tsm(assert: Assert) {
|
|
assert
|
|
.success()
|
|
.stdout(predicate::str::contains("TSM Metadata Report"))
|
|
.stdout(predicate::str::contains(
|
|
"(05c19117091a1000, 05c19117091a1001) 2159 index entries, 2159 total records",
|
|
))
|
|
.stdout(predicate::str::contains(
|
|
"task_scheduler_total_schedule_fails",
|
|
));
|
|
}
|
|
|
|
#[test]
|
|
fn meta_000000000000005_000000002_tsm() {
|
|
let input_tsm = uncompress_gz("tests/fixtures/000000000000005-000000002.tsm.gz", ".tsm");
|
|
let mut cmd = Command::cargo_bin("influxdb_iox").unwrap();
|
|
let assert = cmd
|
|
.arg("meta")
|
|
.arg(input_tsm.to_string_lossy().to_string())
|
|
.assert();
|
|
assert_meta_000000000000005_000000002_tsm(assert);
|
|
}
|
|
|
|
#[test]
|
|
fn meta_000000000000005_000000002_tsm_gz() {
|
|
let mut cmd = Command::cargo_bin("influxdb_iox").unwrap();
|
|
let assert = cmd
|
|
.arg("meta")
|
|
.arg("tests/fixtures/000000000000005-000000002.tsm.gz")
|
|
.assert();
|
|
|
|
assert_meta_000000000000005_000000002_tsm(assert);
|
|
}
|
|
|
|
/// Validates some of the metadata output content for this tsm file
|
|
fn assert_meta_cpu_usage_tsm(assert: Assert) {
|
|
assert
|
|
.success()
|
|
.stdout(predicate::str::contains("TSM Metadata Report"))
|
|
.stdout(predicate::str::contains(
|
|
"(05b4927b3fe38000, 05b4927b3fe38001) 2735 index entries, 2735 total records",
|
|
))
|
|
.stdout(predicate::str::contains(
|
|
"task_scheduler_total_schedule_fails",
|
|
));
|
|
}
|
|
|
|
#[test]
|
|
fn meta_cpu_usage_tsm() {
|
|
let input_tsm = uncompress_gz("tests/fixtures/cpu_usage.tsm.gz", ".tsm");
|
|
let mut cmd = Command::cargo_bin("influxdb_iox").unwrap();
|
|
let assert = cmd
|
|
.arg("meta")
|
|
.arg(input_tsm.to_string_lossy().to_string())
|
|
.assert();
|
|
|
|
assert_meta_cpu_usage_tsm(assert);
|
|
}
|
|
|
|
#[test]
|
|
fn meta_cpu_usage_tsm_gz() {
|
|
let mut cmd = Command::cargo_bin("influxdb_iox").unwrap();
|
|
let assert = cmd
|
|
.arg("meta")
|
|
.arg("tests/fixtures/cpu_usage.tsm.gz")
|
|
.assert();
|
|
|
|
assert_meta_cpu_usage_tsm(assert);
|
|
}
|
|
|
|
/// Validates some of the metadata output content for this tsm file
|
|
fn assert_meta_temperature_parquet(assert: Assert) {
|
|
assert
|
|
.success()
|
|
.stdout(predicate::str::contains("Parquet file metadata:"))
|
|
.stdout(predicate::str::contains(r#"created by: "Delorean""#))
|
|
.stdout(predicate::str::contains(
|
|
r#"Column Chunk [3]:
|
|
file_offset: 595
|
|
column_type: DOUBLE
|
|
column_path: bottom_degrees
|
|
num_values: 6
|
|
encodings: [PLAIN, RLE_DICTIONARY, RLE]
|
|
compression: GZIP
|
|
compressed_size: 125
|
|
uncompressed_size: 90
|
|
data_page_offset: 547
|
|
has_index_page: false
|
|
has_dictionary_page: true
|
|
dictionary_page_offset: 470
|
|
NO STATISTICS"#,
|
|
));
|
|
}
|
|
|
|
#[test]
|
|
fn meta_temperature_parquet() {
|
|
let mut cmd = Command::cargo_bin("influxdb_iox").unwrap();
|
|
let assert = cmd
|
|
.arg("meta")
|
|
.arg("tests/fixtures/parquet/temperature.parquet")
|
|
.assert();
|
|
|
|
assert_meta_temperature_parquet(assert);
|
|
}
|
|
|
|
#[test]
|
|
fn stats_temperature_parquet() {
|
|
let mut cmd = Command::cargo_bin("influxdb_iox").unwrap();
|
|
let assert = cmd
|
|
.arg("stats")
|
|
.arg("--per-column")
|
|
.arg("--per-file")
|
|
.arg("tests/fixtures/parquet/temperature.parquet")
|
|
.assert();
|
|
|
|
assert
|
|
.success()
|
|
.stdout(predicate::str::contains("Storage statistics:"))
|
|
.stdout(predicate::str::contains(
|
|
r#"Column Stats 'state' [1]
|
|
Total rows: 6.00 (6), DataType: Utf8, Compression: {"Enc: Dictionary, Comp: GZIP"}
|
|
Compressed/Uncompressed Bytes : 90.00 / 52.00 ( 90 / 52) 120.0000 bits per row
|
|
"#))
|
|
.stdout(predicate::str::contains(
|
|
"temperature.parquet: total columns ( 5), rows: 6.00 ( 6), size: 1.13 k ( 1128), bits per row: 1504.0000"
|
|
));
|
|
}
|