refactor: clean up querier code base (#6404)
* refactor: `s/QuerierChunk/QuerierParquetChunk/g`
* refactor: isolate parquet chunk creation code
* refactor: fuse `chunk` and `chunk_parts`
* refactor: pass catalog cache instead of chunk adapter to state reconciler
* refactor: move parquet chunks creation into its own method

Co-authored-by: kodiakhq[bot] <49736102+kodiakhq[bot]@users.noreply.github.com>
parent be45889be1
commit ffe8b98f47

@@ -1,7 +1,7 @@
 //! Cache for schema projections.
 //!
 //! While this is technically NOT caching catalog requests (i.e. CPU and IO work), it heavily reduced memory when
-//! creating [`QuerierChunk`](crate::chunk::QuerierChunk)s.
+//! creating [`QuerierParquetChunk`](crate::parquet::QuerierParquetChunk)s.
 use std::{
     collections::HashMap,
     mem::{size_of, size_of_val},

@@ -1,8 +1,8 @@
 //! Database for the querier that contains all namespaces.
 
 use crate::{
-    cache::CatalogCache, chunk::ChunkAdapter, ingester::IngesterConnection,
-    namespace::QuerierNamespace, query_log::QueryLog, table::PruneMetrics,
+    cache::CatalogCache, ingester::IngesterConnection, namespace::QuerierNamespace,
+    parquet::ChunkAdapter, query_log::QueryLog, table::PruneMetrics,
 };
 use async_trait::async_trait;
 use backoff::{Backoff, BackoffConfig};

@@ -12,11 +12,11 @@
 )]
 
 mod cache;
-mod chunk;
 mod database;
 mod handler;
 mod ingester;
 mod namespace;
+mod parquet;
 mod poison;
 mod query_log;
 mod server;

@@ -2,8 +2,8 @@
 
 use crate::{
     cache::{namespace::CachedNamespace, CatalogCache},
-    chunk::ChunkAdapter,
     ingester::IngesterConnection,
+    parquet::ChunkAdapter,
     query_log::QueryLog,
     table::{PruneMetrics, QuerierTable, QuerierTableArgs},
 };

@@ -0,0 +1,235 @@
+use std::{collections::HashSet, sync::Arc};
+
+use data_types::{ChunkId, ChunkOrder, ColumnId, ParquetFile, TimestampMinMax};
+use futures::StreamExt;
+use iox_catalog::interface::Catalog;
+use iox_query::{pruning::prune_summaries, util::create_basic_summary};
+use observability_deps::tracing::debug;
+use parquet_file::chunk::ParquetChunk;
+use predicate::Predicate;
+use rand::{rngs::StdRng, seq::SliceRandom, SeedableRng};
+use schema::sort::SortKey;
+use trace::span::{Span, SpanRecorder};
+use uuid::Uuid;
+
+use crate::{
+    cache::{namespace::CachedTable, CatalogCache},
+    parquet::QuerierParquetChunkMeta,
+    table::MetricPruningObserver,
+};
+
+use super::QuerierParquetChunk;
+
+/// Number of concurrent chunk creation jobs.
+///
+/// This is mostly to fetch per-partition data concurrently.
+const CONCURRENT_CHUNK_CREATION_JOBS: usize = 100;
+
+/// Adapter that can create chunks.
+#[derive(Debug)]
+pub struct ChunkAdapter {
+    /// Cache
+    catalog_cache: Arc<CatalogCache>,
+
+    /// Metric registry.
+    metric_registry: Arc<metric::Registry>,
+}
+
+impl ChunkAdapter {
+    /// Create new adapter with empty cache.
+    pub fn new(catalog_cache: Arc<CatalogCache>, metric_registry: Arc<metric::Registry>) -> Self {
+        Self {
+            catalog_cache,
+            metric_registry,
+        }
+    }
+
+    /// Metric registry getter.
+    pub fn metric_registry(&self) -> Arc<metric::Registry> {
+        Arc::clone(&self.metric_registry)
+    }
+
+    /// Get underlying catalog cache.
+    pub fn catalog_cache(&self) -> &Arc<CatalogCache> {
+        &self.catalog_cache
+    }
+
+    /// Get underlying catalog.
+    pub fn catalog(&self) -> Arc<dyn Catalog> {
+        self.catalog_cache.catalog()
+    }
+
+    pub(crate) async fn new_chunks(
+        &self,
+        cached_table: Arc<CachedTable>,
+        files: Arc<Vec<Arc<ParquetFile>>>,
+        predicate: &Predicate,
+        early_pruning_observer: MetricPruningObserver,
+        span: Option<Span>,
+    ) -> Vec<QuerierParquetChunk> {
+        let span_recorder = SpanRecorder::new(span);
+
+        let basic_summaries: Vec<_> = files
+            .iter()
+            .map(|p| {
+                Arc::new(create_basic_summary(
+                    p.row_count as u64,
+                    &cached_table.schema,
+                    TimestampMinMax {
+                        min: p.min_time.get(),
+                        max: p.max_time.get(),
+                    },
+                ))
+            })
+            .collect();
+
+        // Prune on the most basic summary data (timestamps and column names) before trying to fully load the chunks
+        let keeps = match prune_summaries(
+            Arc::clone(&cached_table.schema),
+            &basic_summaries,
+            predicate,
+        ) {
+            Ok(keeps) => keeps,
+            Err(reason) => {
+                // Ignore pruning failures here - the chunk pruner should have already logged them.
+                // Just skip pruning and gather all the metadata. We have another chance to prune them
+                // once all the metadata is available
+                debug!(?reason, "Could not prune before metadata fetch");
+                vec![true; basic_summaries.len()]
+            }
+        };
+
+        // Remove any unused parquet files up front to maximize the
+        // concurrent catalog requests that could be outstanding
+        let mut parquet_files = files
+            .iter()
+            .zip(keeps)
+            .filter_map(|(pf, keep)| {
+                if keep {
+                    Some(Arc::clone(pf))
+                } else {
+                    early_pruning_observer
+                        .was_pruned_early(pf.row_count as u64, pf.file_size_bytes as u64);
+                    None
+                }
+            })
+            .collect::<Vec<_>>();
+
+        // de-correlate parquet files so that subsequent items likely don't block/wait on the same cache lookup
+        // (they are likely ordered by partition)
+        let mut rng = StdRng::seed_from_u64(cached_table.id.get() as u64);
+        parquet_files.shuffle(&mut rng);
+
+        futures::stream::iter(parquet_files)
+            .map(|cached_parquet_file| {
+                let span_recorder = &span_recorder;
+                let cached_table = Arc::clone(&cached_table);
+                async move {
+                    let span = span_recorder.child_span("new_chunk");
+                    self.new_chunk(cached_table, cached_parquet_file, span)
+                        .await
+                }
+            })
+            .buffer_unordered(CONCURRENT_CHUNK_CREATION_JOBS)
+            .filter_map(|x| async { x })
+            .collect()
+            .await
+    }
+
+    async fn new_chunk(
+        &self,
+        cached_table: Arc<CachedTable>,
+        parquet_file: Arc<ParquetFile>,
+        span: Option<Span>,
+    ) -> Option<QuerierParquetChunk> {
+        let span_recorder = SpanRecorder::new(span);
+
+        let parquet_file_cols: HashSet<ColumnId> =
+            parquet_file.column_set.iter().copied().collect();
+
+        // relevant_pk_columns is everything from the primary key for the table, that is actually in this parquet file
+        let relevant_pk_columns: Vec<_> = cached_table
+            .primary_key_column_ids
+            .iter()
+            .filter(|c| parquet_file_cols.contains(c))
+            .copied()
+            .collect();
+        let partition_sort_key = self
+            .catalog_cache
+            .partition()
+            .sort_key(
+                Arc::clone(&cached_table),
+                parquet_file.partition_id,
+                &relevant_pk_columns,
+                span_recorder.child_span("cache GET partition sort key"),
+            )
+            .await
+            .expect("partition sort key should be set when a parquet file exists");
+
+        // NOTE: Because we've looked up the sort key AFTER the namespace schema, it may contain columns for which we
+        //       don't have any schema information yet. This is OK because we've ensured that all file columns are known
+        //       withing the schema and if a column is NOT part of the file, it will also not be part of the chunk sort
+        //       key, so we have consistency here.
+
+        // calculate schema
+        // IMPORTANT: Do NOT use the sort key to list columns because the sort key only contains primary-key columns.
+        // NOTE: The schema that we calculate here may have a different column order than the actual parquet file. This
+        //       is OK because the IOx parquet reader can deal with that (see #4921).
+        let column_ids: Vec<_> = cached_table
+            .column_id_map
+            .keys()
+            .filter(|id| parquet_file_cols.contains(id))
+            .copied()
+            .collect();
+        let schema = self
+            .catalog_cache
+            .projected_schema()
+            .get(
+                Arc::clone(&cached_table),
+                column_ids,
+                span_recorder.child_span("cache GET projected schema"),
+            )
+            .await;
+
+        // calculate sort key
+        let sort_key = SortKey::from_columns(
+            partition_sort_key
+                .column_order
+                .iter()
+                .filter(|c_id| parquet_file_cols.contains(c_id))
+                .filter_map(|c_id| cached_table.column_id_map.get(c_id))
+                .cloned(),
+        );
+        assert!(
+            !sort_key.is_empty(),
+            "Sort key can never be empty because there should at least be a time column",
+        );
+
+        let chunk_id = ChunkId::from(Uuid::from_u128(parquet_file.id.get() as _));
+
+        let order = ChunkOrder::new(parquet_file.max_sequence_number.get());
+
+        let meta = Arc::new(QuerierParquetChunkMeta {
+            parquet_file_id: parquet_file.id,
+            chunk_id,
+            order,
+            sort_key: Some(sort_key),
+            shard_id: parquet_file.shard_id,
+            partition_id: parquet_file.partition_id,
+            max_sequence_number: parquet_file.max_sequence_number,
+            compaction_level: parquet_file.compaction_level,
+        });
+
+        let parquet_chunk = Arc::new(ParquetChunk::new(
+            parquet_file,
+            schema,
+            self.catalog_cache.parquet_store(),
+        ));
+
+        Some(QuerierParquetChunk::new(
+            parquet_chunk,
+            meta,
+            Some(Arc::clone(&partition_sort_key.sort_key)),
+        ))
+    }
+}
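
The `new_chunks` method added above combines two techniques: a seeded shuffle so that neighboring files (which tend to arrive ordered by partition) do not all wait on the same cache entry, and a stream driven through `buffer_unordered` to cap how many chunk-creation futures run at once. The following is a minimal, self-contained sketch of that pattern, not the IOx code itself; `fetch_one`, the item type, and the job count are illustrative stand-ins, and it assumes the `futures`, `rand`, and `tokio` crates are available.

```rust
use futures::StreamExt;
use rand::{rngs::StdRng, seq::SliceRandom, SeedableRng};

/// Upper bound on in-flight jobs, mirroring the role of `CONCURRENT_CHUNK_CREATION_JOBS`.
const MAX_IN_FLIGHT: usize = 100;

/// Hypothetical per-item work; stands in for the expensive per-file chunk creation.
async fn fetch_one(id: u64) -> Option<u64> {
    // A real implementation would hit caches / object storage here.
    Some(id * 2)
}

#[tokio::main]
async fn main() {
    let mut ids: Vec<u64> = (0..1_000).collect();

    // De-correlate neighboring items with a deterministic (seeded) shuffle:
    // reruns shuffle identically, but adjacent items no longer share a cache key.
    let mut rng = StdRng::seed_from_u64(42);
    ids.shuffle(&mut rng);

    // Run at most MAX_IN_FLIGHT futures concurrently, drop the `None`s,
    // and collect results in completion order.
    let results: Vec<u64> = futures::stream::iter(ids)
        .map(fetch_one)
        .buffer_unordered(MAX_IN_FLIGHT)
        .filter_map(|x| async move { x })
        .collect()
        .await;

    println!("fetched {} items", results.len());
}
```

The design choice worth noting is that `buffer_unordered` yields results as they finish, so slow partitions do not stall faster ones; ordering, if needed, has to be restored afterwards.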

@@ -1,24 +1,22 @@
 //! Querier Chunks
 
-use crate::cache::namespace::CachedTable;
-use crate::cache::CatalogCache;
 use data_types::{
-    ChunkId, ChunkOrder, ColumnId, CompactionLevel, DeletePredicate, ParquetFile, ParquetFileId,
-    PartitionId, SequenceNumber, ShardId, TableSummary,
+    ChunkId, ChunkOrder, CompactionLevel, DeletePredicate, ParquetFileId, PartitionId,
+    SequenceNumber, ShardId, TableSummary,
 };
-use iox_catalog::interface::Catalog;
 use iox_query::util::create_basic_summary;
 use parquet_file::chunk::ParquetChunk;
 use schema::{sort::SortKey, Schema};
-use std::{collections::HashSet, sync::Arc};
-use trace::span::{Span, SpanRecorder};
-use uuid::Uuid;
+use std::sync::Arc;
 
+mod creation;
 mod query_access;
 
-/// Immutable metadata attached to a [`QuerierChunk`].
+pub use creation::ChunkAdapter;
+
+/// Immutable metadata attached to a [`QuerierParquetChunk`].
 #[derive(Debug)]
-pub struct ChunkMeta {
+pub struct QuerierParquetChunkMeta {
     /// ID of the Parquet file of the chunk
     parquet_file_id: ParquetFileId,

@@ -44,7 +42,7 @@ pub struct ChunkMeta {
     compaction_level: CompactionLevel,
 }
 
-impl ChunkMeta {
+impl QuerierParquetChunkMeta {
     /// ID of the Parquet file of the chunk
     pub fn parquet_file_id(&self) -> ParquetFileId {
         self.parquet_file_id

@@ -82,9 +80,9 @@ impl ChunkMeta {
 }
 
 #[derive(Debug)]
-pub struct QuerierChunk {
+pub struct QuerierParquetChunk {
     /// Immutable chunk metadata
-    meta: Arc<ChunkMeta>,
+    meta: Arc<QuerierParquetChunkMeta>,
 
     /// Schema of the chunk
     schema: Arc<Schema>,

@@ -102,11 +100,11 @@ pub struct QuerierChunk {
     table_summary: Arc<TableSummary>,
 }
 
-impl QuerierChunk {
+impl QuerierParquetChunk {
     /// Create new parquet-backed chunk (object store data).
     pub fn new(
         parquet_chunk: Arc<ParquetChunk>,
-        meta: Arc<ChunkMeta>,
+        meta: Arc<QuerierParquetChunkMeta>,
         partition_sort_key: Option<Arc<SortKey>>,
     ) -> Self {
         let schema = parquet_chunk.schema();

@@ -136,7 +134,7 @@ impl QuerierChunk {
     }
 
     /// Get metadata attached to the given chunk.
-    pub fn meta(&self) -> &ChunkMeta {
+    pub fn meta(&self) -> &QuerierParquetChunkMeta {
         self.meta.as_ref()
     }
 

@@ -165,180 +163,24 @@ impl QuerierChunk {
     }
 }
 
-/// Adapter that can create chunks.
-#[derive(Debug)]
-pub struct ChunkAdapter {
-    /// Cache
-    catalog_cache: Arc<CatalogCache>,
-
-    /// Metric registry.
-    metric_registry: Arc<metric::Registry>,
-}
-
-impl ChunkAdapter {
-    /// Create new adapter with empty cache.
-    pub fn new(catalog_cache: Arc<CatalogCache>, metric_registry: Arc<metric::Registry>) -> Self {
-        Self {
-            catalog_cache,
-            metric_registry,
-        }
-    }
-
-    /// Metric registry getter.
-    pub fn metric_registry(&self) -> Arc<metric::Registry> {
-        Arc::clone(&self.metric_registry)
-    }
-
-    /// Get underlying catalog cache.
-    pub fn catalog_cache(&self) -> &Arc<CatalogCache> {
-        &self.catalog_cache
-    }
-
-    /// Get underlying catalog.
-    pub fn catalog(&self) -> Arc<dyn Catalog> {
-        self.catalog_cache.catalog()
-    }
-
-    pub async fn new_chunk(
-        &self,
-        cached_table: Arc<CachedTable>,
-        parquet_file: Arc<ParquetFile>,
-        span: Option<Span>,
-    ) -> Option<QuerierChunk> {
-        let span_recorder = SpanRecorder::new(span);
-        let parts = self
-            .chunk_parts(
-                cached_table,
-                Arc::clone(&parquet_file),
-                span_recorder.child_span("chunk_parts"),
-            )
-            .await?;
-
-        let parquet_chunk = Arc::new(ParquetChunk::new(
-            parquet_file,
-            parts.schema,
-            self.catalog_cache.parquet_store(),
-        ));
-
-        Some(QuerierChunk::new(
-            parquet_chunk,
-            parts.meta,
-            parts.partition_sort_key,
-        ))
-    }
-
-    async fn chunk_parts(
-        &self,
-        cached_table: Arc<CachedTable>,
-        parquet_file: Arc<ParquetFile>,
-        span: Option<Span>,
-    ) -> Option<ChunkParts> {
-        let span_recorder = SpanRecorder::new(span);
-
-        let parquet_file_cols: HashSet<ColumnId> =
-            parquet_file.column_set.iter().copied().collect();
-
-        // relevant_pk_columns is everything from the primary key for the table, that is actually in this parquet file
-        let relevant_pk_columns: Vec<_> = cached_table
-            .primary_key_column_ids
-            .iter()
-            .filter(|c| parquet_file_cols.contains(c))
-            .copied()
-            .collect();
-        let partition_sort_key = self
-            .catalog_cache
-            .partition()
-            .sort_key(
-                Arc::clone(&cached_table),
-                parquet_file.partition_id,
-                &relevant_pk_columns,
-                span_recorder.child_span("cache GET partition sort key"),
-            )
-            .await
-            .expect("partition sort key should be set when a parquet file exists");
-
-        // NOTE: Because we've looked up the sort key AFTER the namespace schema, it may contain columns for which we
-        //       don't have any schema information yet. This is OK because we've ensured that all file columns are known
-        //       withing the schema and if a column is NOT part of the file, it will also not be part of the chunk sort
-        //       key, so we have consistency here.
-
-        // calculate schema
-        // IMPORTANT: Do NOT use the sort key to list columns because the sort key only contains primary-key columns.
-        // NOTE: The schema that we calculate here may have a different column order than the actual parquet file. This
-        //       is OK because the IOx parquet reader can deal with that (see #4921).
-        let column_ids: Vec<_> = cached_table
-            .column_id_map
-            .keys()
-            .filter(|id| parquet_file_cols.contains(id))
-            .copied()
-            .collect();
-        let schema = self
-            .catalog_cache
-            .projected_schema()
-            .get(
-                Arc::clone(&cached_table),
-                column_ids,
-                span_recorder.child_span("cache GET projected schema"),
-            )
-            .await;
-
-        // calculate sort key
-        let sort_key = SortKey::from_columns(
-            partition_sort_key
-                .column_order
-                .iter()
-                .filter(|c_id| parquet_file_cols.contains(c_id))
-                .filter_map(|c_id| cached_table.column_id_map.get(c_id))
-                .cloned(),
-        );
-        assert!(
-            !sort_key.is_empty(),
-            "Sort key can never be empty because there should at least be a time column",
-        );
-
-        let chunk_id = ChunkId::from(Uuid::from_u128(parquet_file.id.get() as _));
-
-        let order = ChunkOrder::new(parquet_file.max_sequence_number.get());
-
-        let meta = Arc::new(ChunkMeta {
-            parquet_file_id: parquet_file.id,
-            chunk_id,
-            order,
-            sort_key: Some(sort_key),
-            shard_id: parquet_file.shard_id,
-            partition_id: parquet_file.partition_id,
-            max_sequence_number: parquet_file.max_sequence_number,
-            compaction_level: parquet_file.compaction_level,
-        });
-
-        Some(ChunkParts {
-            meta,
-            schema,
-            partition_sort_key: Some(Arc::clone(&partition_sort_key.sort_key)),
-        })
-    }
-}
-
-struct ChunkParts {
-    meta: Arc<ChunkMeta>,
-    schema: Arc<Schema>,
-    partition_sort_key: Option<Arc<SortKey>>,
-}
-
 #[cfg(test)]
 pub mod tests {
-    use crate::cache::namespace::CachedNamespace;
+    use crate::{
+        cache::{namespace::CachedNamespace, CatalogCache},
+        table::MetricPruningObserver,
+    };
 
     use super::*;
     use arrow::{datatypes::DataType, record_batch::RecordBatch};
     use arrow_util::assert_batches_eq;
-    use data_types::{ColumnType, NamespaceSchema};
+    use data_types::{ColumnType, NamespaceSchema, ParquetFile};
     use iox_query::{
         exec::{ExecutorType, IOxSessionContext},
         QueryChunk, QueryChunkMeta,
     };
     use iox_tests::util::{TestCatalog, TestNamespace, TestParquetFileBuilder};
     use metric::{Attributes, Observation, RawReporter};
     use predicate::Predicate;
     use schema::{builder::SchemaBuilder, sort::SortKeyBuilder};
     use test_helpers::maybe_start_logging;
     use tokio::runtime::Handle;

@@ -449,17 +291,19 @@ pub mod tests {
             }
         }
 
-        async fn chunk(&self, namespace_schema: Arc<NamespaceSchema>) -> QuerierChunk {
+        async fn chunk(&self, namespace_schema: Arc<NamespaceSchema>) -> QuerierParquetChunk {
             let cached_namespace: CachedNamespace = namespace_schema.as_ref().clone().into();
             let cached_table = cached_namespace.tables.get("table").expect("table exists");
             self.adapter
-                .new_chunk(
+                .new_chunks(
                     Arc::clone(cached_table),
-                    Arc::clone(&self.parquet_file),
+                    Arc::new(vec![Arc::clone(&self.parquet_file)]),
+                    &Predicate::new(),
+                    MetricPruningObserver::new_unregistered(),
                     None,
                 )
                 .await
-                .unwrap()
+                .remove(0)
         }
 
         /// get catalog access metrics from metric registry

@@ -488,7 +332,7 @@ pub mod tests {
         }
     }
 
-    fn assert_schema(chunk: &QuerierChunk) {
+    fn assert_schema(chunk: &QuerierParquetChunk) {
        let expected_schema = SchemaBuilder::new()
            .field("field_int", DataType::Int64)
            .unwrap()

@@ -500,7 +344,7 @@ pub mod tests {
         assert_eq!(actual_schema.as_ref(), &expected_schema);
     }
 
-    fn assert_sort_key(chunk: &QuerierChunk) {
+    fn assert_sort_key(chunk: &QuerierParquetChunk) {
        let expected_sort_key = SortKeyBuilder::new()
            .with_col("tag1")
            .with_col("time")

@@ -509,9 +353,9 @@ pub mod tests {
         assert_eq!(actual_sort_key, &expected_sort_key);
     }
 
-    async fn assert_content(chunk: &QuerierChunk, test_data: &TestData) {
+    async fn assert_content(chunk: &QuerierParquetChunk, test_data: &TestData) {
        let ctx = test_data.catalog.exec.new_context(ExecutorType::Query);
-        let parquet_store = test_data.adapter.catalog_cache.parquet_store();
+        let parquet_store = test_data.adapter.catalog_cache().parquet_store();
        ctx.inner().runtime_env().register_object_store(
            "iox",
            parquet_store.id(),

@@ -1,4 +1,4 @@
-use crate::chunk::QuerierChunk;
+use crate::parquet::QuerierParquetChunk;
 use data_types::{ChunkId, ChunkOrder, DeletePredicate, PartitionId, TableSummary};
 use datafusion::error::DataFusionError;
 use iox_query::{

@@ -9,7 +9,7 @@ use predicate::Predicate;
 use schema::{sort::SortKey, Projection, Schema};
 use std::{any::Any, sync::Arc};
 
-impl QueryChunkMeta for QuerierChunk {
+impl QueryChunkMeta for QuerierParquetChunk {
     fn summary(&self) -> Arc<TableSummary> {
         Arc::clone(&self.table_summary)
     }

@@ -35,7 +35,7 @@ impl QueryChunkMeta for QuerierChunk {
     }
 }
 
-impl QueryChunk for QuerierChunk {
+impl QueryChunk for QuerierParquetChunk {
     fn id(&self) -> ChunkId {
         self.meta().chunk_id
     }

@@ -1,24 +1,16 @@
 use self::query_access::QuerierTableChunkPruner;
 use self::state_reconciler::Reconciler;
-use crate::table::query_access::MetricPruningObserver;
 use crate::{
-    chunk::ChunkAdapter,
     ingester::{self, IngesterPartition},
+    parquet::ChunkAdapter,
     IngesterConnection,
 };
-use data_types::{
-    ColumnId, DeletePredicate, NamespaceId, PartitionId, ShardIndex, TableId, TimestampMinMax,
-};
+use data_types::{ColumnId, DeletePredicate, NamespaceId, PartitionId, ShardIndex, TableId};
 use datafusion::error::DataFusionError;
-use futures::{join, StreamExt};
-use iox_query::pruning::prune_summaries;
-use iox_query::util::create_basic_summary;
+use futures::join;
 use iox_query::{exec::Executor, provider, provider::ChunkPruner, QueryChunk};
 use observability_deps::tracing::{debug, trace};
 use predicate::Predicate;
-use rand::rngs::StdRng;
-use rand::seq::SliceRandom;
-use rand::SeedableRng;
 use schema::Schema;
 use sharder::JumpHash;
 use snafu::{ResultExt, Snafu};

@@ -33,6 +25,7 @@ use trace::span::{Span, SpanRecorder};
 use uuid::Uuid;
 
 pub use self::query_access::metrics::PruneMetrics;
+pub(crate) use self::query_access::MetricPruningObserver;
 
 mod query_access;
 mod state_reconciler;

@@ -40,11 +33,6 @@ mod state_reconciler;
 #[cfg(test)]
 mod test_util;
 
-/// Number of concurrent chunk creation jobs.
-///
-/// This is mostly to fetch per-partition data concurrently.
-const CONCURRENT_CHUNK_CREATION_JOBS: usize = 100;
-
 #[derive(Debug, Snafu)]
 #[allow(clippy::large_enum_variant)]
 pub enum Error {

@@ -348,86 +336,20 @@ impl QuerierTable {
         let reconciler = Reconciler::new(
             Arc::clone(&self.table_name),
             Arc::clone(&self.namespace_name),
-            Arc::clone(&self.chunk_adapter),
+            Arc::clone(self.chunk_adapter.catalog_cache()),
         );
 
         // create parquet files
-        let parquet_files: Vec<_> = {
-            // use nested scope because we span many child scopes here and it's easier to
-            // aggregate / collapse in the UI
-            let span_recorder = span_recorder.child("parquet chunks");
-
-            let basic_summaries: Vec<_> = parquet_files
-                .files
-                .iter()
-                .map(|p| {
-                    Arc::new(create_basic_summary(
-                        p.row_count as u64,
-                        &cached_table.schema,
-                        TimestampMinMax {
-                            min: p.min_time.get(),
-                            max: p.max_time.get(),
-                        },
-                    ))
-                })
-                .collect();
-
-            // Prune on the most basic summary data (timestamps and column names) before trying to fully load the chunks
-            let keeps = match prune_summaries(
-                Arc::clone(&cached_table.schema),
-                &basic_summaries,
+        let parquet_files = self
+            .chunk_adapter
+            .new_chunks(
+                Arc::clone(cached_table),
+                Arc::clone(&parquet_files.files),
                 &predicate,
-            ) {
-                Ok(keeps) => keeps,
-                Err(reason) => {
-                    // Ignore pruning failures here - the chunk pruner should have already logged them.
-                    // Just skip pruning and gather all the metadata. We have another chance to prune them
-                    // once all the metadata is available
-                    debug!(?reason, "Could not prune before metadata fetch");
-                    vec![true; basic_summaries.len()]
-                }
-            };
-
-            let early_pruning_observer =
-                &MetricPruningObserver::new(Arc::clone(&self.prune_metrics));
-
-            // Remove any unused parquet files up front to maximize the
-            // concurrent catalog requests that could be outstanding
-            let mut parquet_files = parquet_files
-                .files
-                .iter()
-                .zip(keeps)
-                .filter_map(|(pf, keep)| {
-                    if keep {
-                        Some(Arc::clone(pf))
-                    } else {
-                        early_pruning_observer
-                            .was_pruned_early(pf.row_count as u64, pf.file_size_bytes as u64);
-                        None
-                    }
-                })
-                .collect::<Vec<_>>();
-
-            // de-correlate parquet files so that subsequent items likely don't block/wait on the same cache lookup
-            // (they are likely ordered by partition)
-            let mut rng = StdRng::seed_from_u64(self.id().get() as u64);
-            parquet_files.shuffle(&mut rng);
-
-            futures::stream::iter(parquet_files)
-                .map(|cached_parquet_file| {
-                    let span_recorder = &span_recorder;
-                    async move {
-                        let span = span_recorder.child_span("new_chunk");
-                        self.chunk_adapter
-                            .new_chunk(Arc::clone(cached_table), cached_parquet_file, span)
-                            .await
-                    }
-                })
-                .buffer_unordered(CONCURRENT_CHUNK_CREATION_JOBS)
-                .filter_map(|x| async { x })
-                .collect()
-                .await
-        };
+                MetricPruningObserver::new(Arc::clone(&self.prune_metrics)),
+                span_recorder.child_span("new_chunks"),
+            )
+            .await;
 
         let chunks = reconciler
             .reconcile(
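
Both the block removed above and its new home in `ChunkAdapter::new_chunks` rely on the same keep-mask idea: compute a `Vec<bool>` from cheap summaries, zip it against the file list, keep only the entries marked `true`, and report the rest as pruned early. Below is a small standalone sketch of just that filtering step; `FileMeta` and `report_pruned` are hypothetical stand-ins for the catalog file type and `MetricPruningObserver`, and the mask is hard-coded instead of coming from `prune_summaries`.

```rust
use std::sync::Arc;

/// Hypothetical stand-in for a parquet file's catalog entry.
#[derive(Debug)]
struct FileMeta {
    row_count: u64,
    file_size_bytes: u64,
}

/// Hypothetical stand-in for `MetricPruningObserver::was_pruned_early`.
fn report_pruned(row_count: u64, size: u64) {
    println!("pruned early: {row_count} rows, {size} bytes");
}

/// Keep only the files whose mask entry is `true`; report the others as pruned.
fn apply_keep_mask(files: &[Arc<FileMeta>], keeps: Vec<bool>) -> Vec<Arc<FileMeta>> {
    files
        .iter()
        .zip(keeps)
        .filter_map(|(f, keep)| {
            if keep {
                Some(Arc::clone(f))
            } else {
                report_pruned(f.row_count, f.file_size_bytes);
                None
            }
        })
        .collect()
}

fn main() {
    let files = vec![
        Arc::new(FileMeta { row_count: 10, file_size_bytes: 1_000 }),
        Arc::new(FileMeta { row_count: 20, file_size_bytes: 2_000 }),
    ];
    // In IOx the mask comes from pruning on basic summaries; here it is fixed.
    let kept = apply_keep_mask(&files, vec![true, false]);
    assert_eq!(kept.len(), 1);
}
```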

@@ -124,4 +124,9 @@ impl PruneMetrics {
             could_not_prune_df,
         }
     }
+
+    #[cfg(test)]
+    pub(crate) fn new_unregistered() -> Self {
+        Self::new(&metric::Registry::new())
+    }
 }

@@ -19,7 +19,7 @@ use iox_query::{
 use predicate::Predicate;
 use schema::Schema;
 
-use crate::{chunk::QuerierChunk, ingester::IngesterChunk};
+use crate::{ingester::IngesterChunk, parquet::QuerierParquetChunk};
 
 use self::metrics::PruneMetrics;
 

@@ -152,6 +152,11 @@ impl MetricPruningObserver {
         Self { metrics }
     }
 
+    #[cfg(test)]
+    pub(crate) fn new_unregistered() -> Self {
+        Self::new(Arc::new(PruneMetrics::new_unregistered()))
+    }
+
     /// Called when pruning a chunk before fully creating the chunk structure
     pub(crate) fn was_pruned_early(&self, row_count: u64, size_estimate: u64) {
         self.metrics.pruned_early.inc(1, row_count, size_estimate);
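
The `new_unregistered` constructors added in the two hunks above follow a common pattern: production code takes a shared registry so the metrics are actually exported, while tests get a `#[cfg(test)]`-gated constructor that wires up a throwaway one. The sketch below illustrates the pattern with a placeholder `Registry` and an atomic counter rather than the real `metric` crate types, which are assumptions of this example only.

```rust
use std::sync::{
    atomic::{AtomicU64, Ordering},
    Arc,
};

/// Placeholder for a metric registry; the real code uses `metric::Registry`.
#[derive(Debug, Default)]
struct Registry {
    pruned_early: Arc<AtomicU64>,
}

#[derive(Debug)]
struct PruneMetrics {
    pruned_early: Arc<AtomicU64>,
}

impl PruneMetrics {
    /// Production constructor: metrics are tied to the shared registry.
    fn new(registry: &Registry) -> Self {
        Self {
            pruned_early: Arc::clone(&registry.pruned_early),
        }
    }

    /// Test-only constructor: a fresh, unobserved registry per test.
    #[cfg(test)]
    fn new_unregistered() -> Self {
        Self::new(&Registry::default())
    }

    fn inc(&self) {
        self.pruned_early.fetch_add(1, Ordering::Relaxed);
    }
}

fn main() {
    let registry = Registry::default();
    let metrics = PruneMetrics::new(&registry);
    metrics.inc();
    assert_eq!(registry.pruned_early.load(Ordering::Relaxed), 1);
}
```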

@@ -197,7 +202,7 @@ fn chunk_estimate_size(chunk: &dyn QueryChunk) -> usize {
 
     if let Some(chunk) = chunk.downcast_ref::<IngesterChunk>() {
         chunk.estimate_size()
-    } else if let Some(chunk) = chunk.downcast_ref::<QuerierChunk>() {
+    } else if let Some(chunk) = chunk.downcast_ref::<QuerierParquetChunk>() {
         chunk.estimate_size()
     } else {
         panic!("Unknown chunk type")

@@ -207,7 +212,7 @@ fn chunk_estimate_size(chunk: &dyn QueryChunk) -> usize {
 fn chunk_rows(chunk: &dyn QueryChunk) -> usize {
     let chunk = chunk.as_any();
 
-    if let Some(chunk) = chunk.downcast_ref::<QuerierChunk>() {
+    if let Some(chunk) = chunk.downcast_ref::<QuerierParquetChunk>() {
         chunk.rows()
     } else if let Some(chunk) = chunk.downcast_ref::<IngesterChunk>() {
         chunk.rows()
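
`chunk_estimate_size` and `chunk_rows` above dispatch on the concrete chunk type by downcasting the trait object through `Any`. A minimal sketch of that dispatch style with two placeholder chunk types follows; the trait and type names are illustrative, not the IOx ones.

```rust
use std::any::Any;

/// Placeholder trait; the real code dispatches on `dyn QueryChunk`.
trait Chunk {
    fn as_any(&self) -> &dyn Any;
}

struct ParquetBacked {
    rows: usize,
}
struct IngesterBacked {
    rows: usize,
}

impl Chunk for ParquetBacked {
    fn as_any(&self) -> &dyn Any {
        self
    }
}
impl Chunk for IngesterBacked {
    fn as_any(&self) -> &dyn Any {
        self
    }
}

/// Mirror of `chunk_rows`: try each known concrete type in turn.
fn chunk_rows(chunk: &dyn Chunk) -> usize {
    let any = chunk.as_any();
    if let Some(c) = any.downcast_ref::<ParquetBacked>() {
        c.rows
    } else if let Some(c) = any.downcast_ref::<IngesterBacked>() {
        c.rows
    } else {
        panic!("Unknown chunk type")
    }
}

fn main() {
    let p = ParquetBacked { rows: 3 };
    let i = IngesterBacked { rows: 5 };
    assert_eq!(chunk_rows(&p), 3);
    assert_eq!(chunk_rows(&i), 5);
    println!("ok");
}
```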

@@ -14,10 +14,8 @@ use std::{
 use trace::span::{Span, SpanRecorder};
 
 use crate::{
-    chunk::{ChunkAdapter, QuerierChunk},
-    ingester::IngesterChunk,
-    tombstone::QuerierTombstone,
-    IngesterPartition,
+    cache::CatalogCache, ingester::IngesterChunk, parquet::QuerierParquetChunk,
+    tombstone::QuerierTombstone, IngesterPartition,
 };
 
 use self::interface::{IngesterPartitionInfo, ParquetFileInfo, TombstoneInfo};

@@ -34,19 +32,19 @@ pub enum ReconcileError {
 pub struct Reconciler {
     table_name: Arc<str>,
     namespace_name: Arc<str>,
-    chunk_adapter: Arc<ChunkAdapter>,
+    catalog_cache: Arc<CatalogCache>,
 }
 
 impl Reconciler {
     pub(crate) fn new(
         table_name: Arc<str>,
         namespace_name: Arc<str>,
-        chunk_adapter: Arc<ChunkAdapter>,
+        catalog_cache: Arc<CatalogCache>,
     ) -> Self {
         Self {
             table_name,
             namespace_name,
-            chunk_adapter,
+            catalog_cache,
         }
     }
 

@@ -57,7 +55,7 @@ impl Reconciler {
         ingester_partitions: Vec<IngesterPartition>,
         tombstones: Vec<Arc<Tombstone>>,
         retention_delete_pred: Option<DeletePredicate>,
-        parquet_files: Vec<QuerierChunk>,
+        parquet_files: Vec<QuerierParquetChunk>,
         span: Option<Span>,
     ) -> Result<Vec<Arc<dyn QueryChunk>>, ReconcileError> {
         let span_recorder = SpanRecorder::new(span);

@@ -88,7 +86,7 @@ impl Reconciler {
         ingester_partitions: &[IngesterPartition],
         tombstones: Vec<Arc<Tombstone>>,
         retention_delete_pred: Option<DeletePredicate>,
-        parquet_files: Vec<QuerierChunk>,
+        parquet_files: Vec<QuerierParquetChunk>,
         span: Option<Span>,
     ) -> Result<Vec<Box<dyn UpdatableQuerierChunk>>, ReconcileError> {
         let span_recorder = SpanRecorder::new(span);

@@ -180,8 +178,7 @@ impl Reconciler {
 
             // check if tombstone is marked as processed
             if self
-                .chunk_adapter
-                .catalog_cache()
+                .catalog_cache
                 .processed_tombstones()
                 .exists(
                     chunk.meta().parquet_file_id(),

@@ -281,7 +278,7 @@ trait UpdatableQuerierChunk: QueryChunk {
     fn upcast_to_querier_chunk(self: Box<Self>) -> Box<dyn QueryChunk>;
 }
 
-impl UpdatableQuerierChunk for QuerierChunk {
+impl UpdatableQuerierChunk for QuerierParquetChunk {
     fn partition_sort_key_arc(&self) -> Option<Arc<SortKey>> {
         self.partition_sort_key_arc()
     }

@@ -1,6 +1,6 @@
 //! Interface for reconciling Ingester and catalog state
 
-use crate::{chunk::QuerierChunk, ingester::IngesterPartition};
+use crate::{ingester::IngesterPartition, parquet::QuerierParquetChunk};
 use data_types::{
     CompactionLevel, ParquetFile, PartitionId, SequenceNumber, ShardId, Tombstone, TombstoneId,
 };

@@ -78,7 +78,7 @@ impl ParquetFileInfo for Arc<ParquetFile> {
     }
 }
 
-impl ParquetFileInfo for QuerierChunk {
+impl ParquetFileInfo for QuerierParquetChunk {
     fn partition_id(&self) -> PartitionId {
         self.meta().partition_id()
     }

@@ -1,6 +1,6 @@
 use super::{PruneMetrics, QuerierTable, QuerierTableArgs};
 use crate::{
-    cache::CatalogCache, chunk::ChunkAdapter, create_ingester_connection_for_testing,
+    cache::CatalogCache, create_ingester_connection_for_testing, parquet::ChunkAdapter,
     IngesterPartition,
 };
 use arrow::record_batch::RecordBatch;