diff --git a/.github/workflows/parquet.yml b/.github/workflows/parquet.yml
index 9ae7d47eddc6..a0d8495170eb 100644
--- a/.github/workflows/parquet.yml
+++ b/.github/workflows/parquet.yml
@@ -175,8 +175,8 @@ jobs:
           rustup default ${{ matrix.rust }}
       - name: Install binary for checking
         run: |
-          cargo install --path parquet --bin parquet-show-bloom-filter --features=cli
-          cargo install --path parquet --bin parquet-fromcsv --features=arrow,cli
+          cargo install --path parquet --bin parquet-show-bloom-filter --features=cli --locked
+          cargo install --path parquet --bin parquet-fromcsv --features=arrow,cli --locked
       - name: Run pytest
         run: |
           cd parquet/pytest
diff --git a/parquet/benches/arrow_reader_row_filter.rs b/parquet/benches/arrow_reader_row_filter.rs
index 2b5a09eebcb3..cb26443fa3b0 100644
--- a/parquet/benches/arrow_reader_row_filter.rs
+++ b/parquet/benches/arrow_reader_row_filter.rs
@@ -35,37 +35,46 @@
 //!
 //! [Efficient Filter Pushdown in Parquet]: https://datafusion.apache.org/blog/2025/03/21/parquet-pushdown/
 //!
-//! The benchmark creates an in-memory Parquet file with 100K rows and ten columns.
-//! The first four columns are:
-//!   - int64: random integers (range: 0..100) generated with a fixed seed.
-//!   - float64: random floating-point values (range: 0.0..100.0) generated with a fixed seed.
-//!   - utf8View: random strings with some empty values and occasional constant "const" values.
-//!   - ts: sequential timestamps in milliseconds.
-//!
-//! The following six columns (for filtering) are generated to mimic different
-//! filter selectivity and clustering patterns:
-//!   - pt: for Point Lookup – exactly one row is set to "unique_point", all others are random strings.
-//!   - sel: for Selective Unclustered – exactly 1% of rows (those with i % 100 == 0) are "selected".
-//!   - mod_clustered: for Moderately Selective Clustered – in each 10K-row block, the first 10 rows are "mod_clustered".
-//!   - mod_unclustered: for Moderately Selective Unclustered – exactly 10% of rows (those with i % 10 == 1) are "mod_unclustered".
-//!   - unsel_unclustered: for Unselective Unclustered – exactly 99% of rows (those with i % 100 != 0) are "unsel_unclustered".
-//!   - unsel_clustered: for Unselective Clustered – in each 10K-row block, rows with an offset >= 1000 are "unsel_clustered".
+//! The benchmark creates an in-memory Parquet file with 500K rows and four root
+//! columns:
+//! - `int64`: random integers with an injected point-lookup value.
+//! - `float64`: random floating-point values used for sparse and dense filters.
+//! - `utf8View`: ClickBench-like string values with sparse sentinel values.
+//! - `ts`: sequential timestamps used for clustered filters.
 //!
+//! The benchmark groups cover a few distinct reader-level questions:
+//! - `arrow_reader_row_filter`: baseline filter/projection combinations.
+//! - `arrow_reader_row_filter_{async_,}strategy_matrix`: full post-filtering
+//!   versus row-filter pushdown with `Auto`, forced `Selectors`, and forced
+//!   `Mask`.
+//! - `arrow_reader_row_filter_async_auto_policy_focus`: focused synthetic shapes
+//!   derived from ClickBench and TPC-DS regressions, including sparse and dense
+//!   filters, clustered and fragmented selections, variable-width predicates,
+//!   projected predicate columns, count/filter-only outputs, and mixed predicate
+//!   order.
+//! - `arrow_reader_projection_scan_focus`: projection-only scans that do not
+//!   construct a `RowFilter`.
+//! - `arrow_reader_row_filter_async_nested_post_filter_focus`: nested root output
+//!   with a separate predicate column.
 
-use arrow::array::{ArrayRef, BooleanArray, Float64Array, Int64Array, TimestampMillisecondArray};
-use arrow::compute::and;
-use arrow::compute::kernels::cmp::{eq, gt, lt, neq};
+use arrow::array::{
+    ArrayRef, BooleanArray, Float64Array, Int64Array, StructArray, TimestampMillisecondArray,
+};
+use arrow::compute::kernels::cmp::{eq, gt, lt, lt_eq, neq};
+use arrow::compute::{and, or};
 use arrow::datatypes::{DataType, Field, Schema, TimeUnit};
 use arrow::record_batch::RecordBatch;
 use arrow_array::StringViewArray;
 use arrow_array::builder::{ArrayBuilder, StringViewBuilder};
-use arrow_cast::pretty::pretty_format_batches;
 use bytes::Bytes;
-use criterion::{BenchmarkId, Criterion, criterion_group, criterion_main};
+use criterion::{
+    BenchmarkGroup, BenchmarkId, Criterion, criterion_group, criterion_main, measurement::WallTime,
+};
 use futures::future::BoxFuture;
 use futures::{FutureExt, StreamExt};
 use parquet::arrow::arrow_reader::{
     ArrowPredicateFn, ArrowReaderOptions, ParquetRecordBatchReaderBuilder, RowFilter,
+    RowSelectionPolicy,
 };
 use parquet::arrow::async_reader::AsyncFileReader;
 use parquet::arrow::{ArrowWriter, ParquetRecordBatchStreamBuilder, ProjectionMask};
@@ -76,6 +85,9 @@ use rand::{Rng, SeedableRng, rngs::StdRng};
 use std::ops::Range;
 use std::sync::Arc;
 
+const COLUMN_NAMES: [&str; 4] = ["int64", "float64", "utf8View", "ts"];
+const UTF8_VIEW_MISSING_VALUE: &str = "__arrow_rs_missing__";
+
 /// Generates a random string. Has a 50% chance to generate a short string (3–11 characters)
 /// or a long string (13–20 characters).
 fn random_string(rng: &mut StdRng) -> String {
@@ -108,6 +120,14 @@ fn create_float64_array(size: usize) -> ArrayRef {
     Arc::new(Float64Array::from(values)) as ArrayRef
 }
 
+fn append_utf8_view_value(builder: &mut StringViewBuilder, value: &str) {
+    if builder.len() % 1_000 == 0 {
+        builder.append_value(UTF8_VIEW_MISSING_VALUE);
+    } else {
+        builder.append_value(value);
+    }
+}
+
 /// Creates a utf8View array of a given size with random strings.
 ///
 /// This is modeled after the "SearchPhrase" column in the ClickBench benchmark.
@@ -139,11 +159,11 @@ fn create_utf8_view_array(size: usize) -> ArrayRef {
         let choice = rng.random_range(0..100);
         if choice < EMPTY_DENSITY {
             for _ in 0..run_length {
-                builder.append_value("");
+                append_utf8_view_value(&mut builder, "");
             }
         } else {
             for _ in 0..run_length {
-                builder.append_value(random_string(&mut rng));
+                append_utf8_view_value(&mut builder, &random_string(&mut rng));
             }
         }
     }
@@ -158,7 +178,7 @@ fn create_ts_array(size: usize) -> ArrayRef {
 }
 
 /// Creates a RecordBatch with 100K rows and 4 columns: int64, float64, utf8View, and ts.
-fn create_record_batch(size: usize) -> RecordBatch {
+pub(crate) fn create_record_batch(size: usize) -> RecordBatch {
     let fields = vec![
         Field::new("int64", DataType::Int64, false),
         Field::new("float64", DataType::Float64, false),
@@ -188,32 +208,77 @@ const ROW_GROUP_SIZE: usize = 100_000;
 
 /// Writes the RecordBatch to an in memory buffer, returning the buffer
 fn write_parquet_file() -> Vec<u8> {
-    let batch = create_record_batch(TOTAL_ROWS);
-    println!("Batch created with {TOTAL_ROWS} rows, row group size = {ROW_GROUP_SIZE}");
-    println!(
-        "First 100 rows:\n{}",
-        pretty_format_batches(&[batch.clone().slice(0, 100)]).unwrap()
-    );
+    write_parquet_file_with_rows(TOTAL_ROWS, ROW_GROUP_SIZE)
+}
+
+/// Writes a RecordBatch with a configurable shape to an in-memory buffer,
+/// returning the buffer.
+fn write_parquet_file_with_rows(total_rows: usize, row_group_size: usize) -> Vec<u8> {
+    let batch = create_record_batch(total_rows);
+    write_record_batch_to_parquet(&batch, row_group_size)
+}
+
+fn write_record_batch_to_parquet(batch: &RecordBatch, row_group_size: usize) -> Vec<u8> {
     let schema = batch.schema();
     let props = WriterProperties::builder()
         .set_compression(Compression::SNAPPY)
-        .set_max_row_group_row_count(Some(ROW_GROUP_SIZE))
+        .set_max_row_group_row_count(Some(row_group_size))
         .build();
     let mut buffer = vec![];
     {
         let mut writer = ArrowWriter::try_new(&mut buffer, schema.clone(), Some(props)).unwrap();
-        writer.write(&batch).unwrap();
+        writer.write(batch).unwrap();
         writer.close().unwrap();
     }
     buffer
 }
 
+fn create_nested_record_batch(size: usize) -> RecordBatch {
+    let tag = Arc::new(StringViewArray::from_iter_values(
+        (0..size).map(|idx| format!("tag_{}", idx % 7)),
+    )) as ArrayRef;
+    let payload = StructArray::from(vec![
+        (
+            Arc::new(Field::new("id", DataType::Int64, false)),
+            Arc::new(Int64Array::from_iter_values(
+                (0..size).map(|idx| idx as i64 + 1_000),
+            )) as ArrayRef,
+        ),
+        (
+            Arc::new(Field::new("label", DataType::Utf8View, false)),
+            Arc::new(StringViewArray::from_iter_values(
+                (0..size).map(|idx| format!("payload_{idx}")),
+            )) as ArrayRef,
+        ),
+    ]);
+    let payload = Arc::new(payload) as ArrayRef;
+    let value = Arc::new(Int64Array::from_iter_values(
+        (0..size).map(|idx| idx as i64 + 10_000),
+    )) as ArrayRef;
+
+    RecordBatch::try_from_iter(vec![("tag", tag), ("payload", payload), ("value", value)]).unwrap()
+}
+
+fn write_nested_parquet_file_with_rows(total_rows: usize, row_group_size: usize) -> Vec<u8> {
+    let batch = create_nested_record_batch(total_rows);
+    write_record_batch_to_parquet(&batch, row_group_size)
+}
+
 /// ProjectionCase defines the projection mode for the benchmark:
 /// either projecting all columns or excluding the column that is used for filtering.
-#[derive(Clone)]
+#[derive(Clone, Copy)]
 enum ProjectionCase {
     AllColumns,
     ExcludeFilterColumn,
+    FilterColumnsOnly,
+    CountOnly,
+    FixedColumns,
+    Float64AndTs,
+    Float64Only,
+    Int64AndFloat64,
+    Int64AndUtf8,
+    TsAndUtf8,
+    Utf8Only,
 }
 
 impl std::fmt::Display for ProjectionCase {
@@ -221,6 +286,53 @@ impl std::fmt::Display for ProjectionCase {
         match self {
             ProjectionCase::AllColumns => write!(f, "all_columns"),
             ProjectionCase::ExcludeFilterColumn => write!(f, "exclude_filter_column"),
+            ProjectionCase::FilterColumnsOnly => write!(f, "filter_columns_only"),
+            ProjectionCase::CountOnly => write!(f, "count_only"),
+            ProjectionCase::FixedColumns => write!(f, "fixed_columns"),
+            ProjectionCase::Float64AndTs => write!(f, "float64_and_ts"),
+            ProjectionCase::Float64Only => write!(f, "float64_only"),
+            ProjectionCase::Int64AndFloat64 => write!(f, "int64_and_float64"),
+            ProjectionCase::Int64AndUtf8 => write!(f, "int64_and_utf8"),
+            ProjectionCase::TsAndUtf8 => write!(f, "ts_and_utf8"),
+            ProjectionCase::Utf8Only => write!(f, "utf8_only"),
+        }
+    }
+}
+
+#[derive(Clone, Copy)]
+enum SyncStrategy {
+    FullPostFilter,
+    PushdownAuto,
+    PushdownSelectors,
+    PushdownMask,
+}
+
+impl std::fmt::Display for SyncStrategy {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        match self {
+            SyncStrategy::FullPostFilter => write!(f, "full_post_filter"),
+            SyncStrategy::PushdownAuto => write!(f, "pushdown_auto"),
+            SyncStrategy::PushdownSelectors => write!(f, "pushdown_selectors"),
+            SyncStrategy::PushdownMask => write!(f, "pushdown_mask"),
+        }
+    }
+}
+
+#[derive(Clone, Copy)]
+enum AsyncStrategy {
+    FullPostFilter,
+    PushdownAuto,
+    PushdownSelectors,
+    PushdownMask,
+}
+
+impl std::fmt::Display for AsyncStrategy {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        match self {
+            AsyncStrategy::FullPostFilter => write!(f, "full_post_filter"),
+            AsyncStrategy::PushdownAuto => write!(f, "pushdown_auto"),
+            AsyncStrategy::PushdownSelectors => write!(f, "pushdown_selectors"),
+            AsyncStrategy::PushdownMask => write!(f, "pushdown_mask"),
         }
     }
 }
@@ -228,7 +340,7 @@ impl std::fmt::Display for ProjectionCase {
 /// FilterType encapsulates the different filter comparisons.
 /// The variants correspond to the different filter patterns.
 #[derive(Clone, Copy, Debug)]
-enum FilterType {
+pub(crate) enum FilterType {
     /// "Point Lookup": selects a single row
     /// ```text
     /// ┌───────────────┐    ┌───────────────┐
@@ -334,6 +446,278 @@ enum FilterType {
     /// [ClickBench]: https://github.com/ClickHouse/ClickBench
     /// [Q21-Q27]: https://github.com/apache/datafusion/blob/b7177234e65cbbb2dcc04c252f6acd80bb026362/benchmarks/queries/clickbench/queries.sql#L22-L28
     Utf8ViewNonEmpty,
+
+    // Deferred-output shapes. Predicate columns are separate from the output,
+    // so rejected rows can skip output-column decoding.
+    /// Scalar-prefix shape derived from DataFusion ClickBench Q37:
+    ///
+    /// ```sql
+    /// WHERE CounterID = 62
+    ///   AND EventDate BETWEEN ...
+    ///   AND DontCountHits = 0
+    ///   AND IsRefresh = 0
+    ///   AND Title <> ''
+    /// ```
+    ///
+    /// DataFusion `Auto` does not push down the `Title <> ''` string predicate,
+    /// but it can push down the scalar prefix to defer decoding `Title`.
+    /// Fragmented ~0.9% selection: approx 4,500 selected rows in 500K.
+    ///
+    /// ```text
+    /// ┌───────────────┐    ┌───────────────┐
+    /// │               │    │               │
+    /// │      ...      │    │      ...      │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// │               │    │               │
+    /// │      ...      │    │      ...      │
+    /// │               │    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// └───────────────┘    └───────────────┘
+    /// ```
+    ScalarPrefixUtf8Output,
+    /// Sparse fragmented scalar predicates (~7%, approx 36,000 selected rows
+    /// in 500K) with a cheap fixed-width output projection, derived from a
+    /// ClickBench Q41-like shape.
+    ///
+    /// ```text
+    /// ┌───────────────┐    ┌───────────────┐
+    /// │               │    │               │
+    /// │      ...      │    │      ...      │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// │               │    │               │
+    /// │      ...      │    │      ...      │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// │               │    │               │
+    /// └───────────────┘    └───────────────┘
+    /// ```
+    SparseScalarFixedOutput,
+    /// Scalar range predicate derived from TPC-DS Q9 `ss_quantity BETWEEN ...`
+    /// subqueries. Matching rows are randomly scattered at moderate selectivity;
+    /// benchmark projections cover both count-only and numeric aggregate cases.
+    /// Fragmented ~20% selection: approx 100,000 selected rows in 500K.
+    ///
+    /// ```text
+    /// ┌───────────────┐    ┌───────────────┐
+    /// │               │    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// │      ...      │    │      ...      │
+    /// │               │    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// └───────────────┘    └───────────────┘
+    /// ```
+    QuantityRangePredicate,
+
+    // Multi-predicate shapes. These focus on predicate ordering and predicate
+    // evaluation cost independently of projection cost.
+    /// Predicate-order shape derived from DataFusion ClickBench extended Q6:
+    /// an early cheap fixed-width predicate can prune almost all rows before a
+    /// later unprojected variable-width predicate is decoded.
+    /// Point-lookup prefix: at most 1 row reaches the variable-width predicate.
+    ///
+    /// ```text
+    /// ┌───────────────┐    ┌───────────────┐
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │      ...      │
+    /// │               │    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │      ...      │    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │      ...      │
+    /// │               │    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │               │
+    /// └───────────────┘    └───────────────┘
+    /// ```
+    FixedThenVarWidthPredicates,
+    /// Same scalar + variable-width predicate columns as
+    /// [`Self::FixedThenVarWidthPredicates`], but with the variable-width
+    /// predicate evaluated first. This anchors the static post-filter gate
+    /// against predicate-order drift.
+    /// At most 1 row survives the final point lookup.
+    ///
+    /// ```text
+    /// ┌───────────────┐    ┌───────────────┐
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │      ...      │
+    /// │               │    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │      ...      │    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │      ...      │
+    /// │               │    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │               │
+    /// └───────────────┘    └───────────────┘
+    /// ```
+    VarWidthThenFixedPredicates,
+    /// Multiple cheap scalar predicates, very small output, and projected
+    /// predicate columns used later by grouping. Derived from ClickBench Q40.
+    /// Fragmented ~0.8% selection: approx 4,000 selected rows in 500K.
+    ///
+    /// ```text
+    /// ┌───────────────┐    ┌───────────────┐
+    /// │               │    │               │
+    /// │      ...      │    │      ...      │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// │               │    │               │
+    /// │      ...      │    │      ...      │
+    /// │               │    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// └───────────────┘    └───────────────┘
+    /// ```
+    MultiScalarProjectedKey,
+    /// Complex OR predicate over dictionary/string-like and scalar columns
+    /// where predicate evaluation dominates reader time. Derived from TPC-DS
+    /// Q41.
+    /// Mixed string/scalar OR branches select approx 1% of rows.
+    ///
+    /// ```text
+    /// ┌───────────────┐    ┌───────────────┐
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// │      ...      │    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │      ...      │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │               │
+    /// │               │    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │      ...      │    │               │
+    /// │               │    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │               │
+    /// └───────────────┘    └───────────────┘
+    /// ```
+    ComplexOrMixedPredicates,
+
+    // Projected-predicate shapes. At least one predicate column is also needed
+    // in the final projection.
+    /// Multiple fixed-width dynamic filters where predicate columns are also
+    /// projected. Derived from TPC-DS Q20 catalog_sales.
+    /// Fragmented ~11% selection: approx 54,000 selected rows in 500K.
+    ///
+    /// ```text
+    /// ┌───────────────┐    ┌───────────────┐
+    /// │               │    │               │
+    /// │      ...      │    │      ...      │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// │      ...      │    │      ...      │
+    /// │               │    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// └───────────────┘    └───────────────┘
+    /// ```
+    ProjectedDynamicFilters,
+    /// Shape of TPC-DS Q21 after dynamic-filter pruning: sparse fragmented
+    /// fixed-width predicates where the final projection still includes the
+    /// predicate columns. This protects against choosing selectors for columns
+    /// that were already decoded/cached by predicate evaluation.
+    /// Fragmented ~7% selection: approx 36,000 selected rows in 500K.
+    ///
+    /// ```text
+    /// ┌───────────────┐    ┌───────────────┐
+    /// │               │    │               │
+    /// │      ...      │    │      ...      │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// │               │    │               │
+    /// │      ...      │    │      ...      │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// │               │    │               │
+    /// └───────────────┘    └───────────────┘
+    /// ```
+    SparseProjectedPredicatesFixedOutput,
+    /// Projected-predicate shape derived from TPC-DS Q2 fact scans: the
+    /// dynamic filter applies to the date key, the same date key is projected,
+    /// and an additional fixed-width sales value can still be deferred by
+    /// predicate pushdown.
+    /// Selectivity ranges from 5% to 50%: approx 25K to 250K selected rows in
+    /// 500K.
+    ///
+    /// ```text
+    /// ┌───────────────┐    ┌───────────────┐
+    /// │               │    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │      ...      │    │      ...      │
+    /// │               │    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// │      ...      │    │      ...      │
+    /// └───────────────┘    └───────────────┘
+    /// ```
+    ProjectedPredicate5Pct,
+    ProjectedPredicate8Pct,
+    ProjectedPredicate10Pct,
+    ProjectedPredicate20Pct,
+    ProjectedPredicate30Pct,
+    ProjectedPredicate40Pct,
+    ProjectedPredicate50Pct,
+    /// Exact shape for the projected-predicate moderate-selectivity gate:
+    /// a clustered 8% or 20% timestamp predicate where the predicate column is
+    /// projected and the deferred output is variable-width.
+    /// Clustered 8% or 20% selection: 40,000 or 100,000 selected rows in 500K.
+    ///
+    /// ```text
+    /// ┌───────────────┐    ┌───────────────┐
+    /// │               │    │               │
+    /// │               │    │               │
+    /// │               │    │      ...      │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │      ...      │    │      ...      │
+    /// │               │    │               │
+    /// │               │    │               │
+    /// └───────────────┘    └───────────────┘
+    /// ```
+    ClusteredTs8PctProjectedPredicate,
+    ClusteredTs20PctProjectedPredicate,
+    /// Sparse variable-width predicate shaped like TPC-DS Q83 dynamic
+    /// `i_item_id` filters, where the predicate column is also projected.
+    /// Sparse 0.1% selection: 500 sentinel rows in 500K, one every 1,000 rows.
+    ///
+    /// ```text
+    /// ┌───────────────┐    ┌───────────────┐
+    /// │               │    │               │
+    /// │      ...      │    │      ...      │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// │               │    │               │
+    /// │      ...      │    │      ...      │
+    /// │               │    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// └───────────────┘    └───────────────┘
+    /// ```
+    Utf8ViewMissing,
+    /// Very sparse projected fixed-width scan shaped like TPC-DS fact-table
+    /// filters where the predicate column is also needed in the output projection.
+    /// Sparse 0.1% selection: 500 rows in 500K, one timestamp match every
+    /// 1,000 rows.
+    ///
+    /// ```text
+    /// ┌───────────────┐    ┌───────────────┐
+    /// │               │    │               │
+    /// │      ...      │    │      ...      │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// │               │    │               │
+    /// │               │    │               │
+    /// │      ...      │    │      ...      │
+    /// │               │    │               │
+    /// │               │    │               │
+    /// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+    /// └───────────────┘    └───────────────┘
+    /// ```
+    SparseProjectedFactScan,
 }
 
 impl std::fmt::Display for FilterType {
@@ -347,6 +731,46 @@ impl std::fmt::Display for FilterType {
             FilterType::UnselectiveClustered => "ts < 9000",
             FilterType::Composite => "float64 > 99.0 AND ts >= 9000",
             FilterType::Utf8ViewNonEmpty => "utf8View <> ''",
+            FilterType::Utf8ViewMissing => "utf8View == '<missing>'",
+            FilterType::ScalarPrefixUtf8Output => "int64 == 62 AND ts < 9000",
+            FilterType::FixedThenVarWidthPredicates => "int64 == 9999 AND utf8View <> ''",
+            FilterType::VarWidthThenFixedPredicates => "utf8View <> '' AND int64 == 9999",
+            FilterType::SparseScalarFixedOutput => "int64 < 8 AND ts < 9000",
+            FilterType::MultiScalarProjectedKey => "int64 == 62 AND float64 > 10.0 AND ts < 9000",
+            FilterType::ComplexOrMixedPredicates => {
+                "(utf8View <> '' AND int64 < 8) OR (ts < 100 AND float64 > 95.0)"
+            }
+            FilterType::ProjectedDynamicFilters => {
+                "int64 < 12 AND ts < 9000 projected dynamic filters"
+            }
+            FilterType::SparseProjectedPredicatesFixedOutput => {
+                "int64 < 8 AND ts < 9000 projected predicates"
+            }
+            FilterType::ProjectedPredicate10Pct => {
+                "int64 < 10 projected predicate with fixed output"
+            }
+            FilterType::ProjectedPredicate5Pct => "int64 < 5 projected predicate with fixed output",
+            FilterType::ProjectedPredicate8Pct => "int64 < 8 projected predicate with fixed output",
+            FilterType::ProjectedPredicate20Pct => {
+                "int64 < 20 projected predicate with fixed output"
+            }
+            FilterType::ProjectedPredicate30Pct => {
+                "int64 < 30 projected predicate with fixed output"
+            }
+            FilterType::ProjectedPredicate40Pct => {
+                "int64 < 40 projected predicate with fixed output"
+            }
+            FilterType::ProjectedPredicate50Pct => {
+                "int64 < 50 projected predicate with fixed output"
+            }
+            FilterType::QuantityRangePredicate => "int64 > 0 AND int64 < 21",
+            FilterType::ClusteredTs20PctProjectedPredicate => {
+                "ts < 2000 projected predicate with utf8 output"
+            }
+            FilterType::ClusteredTs8PctProjectedPredicate => {
+                "ts < 800 projected predicate with utf8 output"
+            }
+            FilterType::SparseProjectedFactScan => "ts % 1000 == 0",
         };
         write!(f, "{s}")
     }
@@ -354,7 +778,7 @@ impl std::fmt::Display for FilterType {
 
 impl FilterType {
     /// Applies the specified filter on the given RecordBatch and returns a BooleanArray mask.
-    fn filter_batch(&self, batch: &RecordBatch) -> arrow::error::Result<BooleanArray> {
+    pub(crate) fn filter_batch(&self, batch: &RecordBatch) -> arrow::error::Result<BooleanArray> {
         match self {
             // Point Lookup on int64 column
             FilterType::PointLookup => {
@@ -382,7 +806,7 @@ impl FilterType {
             // Unselective Unclustered on float64 column: NOT (float64 > 99.0)
             FilterType::UnselectiveUnclustered => {
                 let array = batch.column(batch.schema().index_of("float64")?);
-                gt(array, &Float64Array::new_scalar(99.0))
+                lt_eq(array, &Float64Array::new_scalar(99.0))
             }
             // Unselective Clustered on ts column: ts < 9000
             FilterType::UnselectiveClustered => {
@@ -401,6 +825,113 @@ impl FilterType {
                 let scalar = StringViewArray::new_scalar("");
                 neq(array, &scalar)
             }
+            FilterType::Utf8ViewMissing => {
+                let array = batch.column(batch.schema().index_of("utf8View")?);
+                let scalar = StringViewArray::new_scalar(UTF8_VIEW_MISSING_VALUE);
+                eq(array, &scalar)
+            }
+            // ScalarPrefixUtf8Output: a cheap fragmented scalar predicate
+            // evaluated before decoding a variable-width output column.
+            FilterType::ScalarPrefixUtf8Output => {
+                let int64 = batch.column(batch.schema().index_of("int64")?);
+                let ts = batch.column(batch.schema().index_of("ts")?);
+                let counter_match = eq(int64, &Int64Array::new_scalar(62))?;
+                let date_like_range = lt(ts, &TimestampMillisecondArray::new_scalar(9000))?;
+                and(&counter_match, &date_like_range)
+            }
+            FilterType::FixedThenVarWidthPredicates | FilterType::VarWidthThenFixedPredicates => {
+                let int64 = batch.column(batch.schema().index_of("int64")?);
+                let utf8 = batch.column(batch.schema().index_of("utf8View")?);
+                let cheap_prefix = eq(int64, &Int64Array::new_scalar(9999))?;
+                let string_suffix = neq(utf8, &StringViewArray::new_scalar(""))?;
+                and(&cheap_prefix, &string_suffix)
+            }
+            FilterType::SparseScalarFixedOutput
+            | FilterType::SparseProjectedPredicatesFixedOutput => {
+                let int64 = batch.column(batch.schema().index_of("int64")?);
+                let ts = batch.column(batch.schema().index_of("ts")?);
+                let counter_like = lt(int64, &Int64Array::new_scalar(8))?;
+                let date_like = lt(ts, &TimestampMillisecondArray::new_scalar(9000))?;
+                and(&counter_like, &date_like)
+            }
+            FilterType::MultiScalarProjectedKey => {
+                let int64 = batch.column(batch.schema().index_of("int64")?);
+                let float64 = batch.column(batch.schema().index_of("float64")?);
+                let ts = batch.column(batch.schema().index_of("ts")?);
+                let counter_match = eq(int64, &Int64Array::new_scalar(62))?;
+                let width_match = gt(float64, &Float64Array::new_scalar(10.0))?;
+                let date_like = lt(ts, &TimestampMillisecondArray::new_scalar(9000))?;
+                and(&and(&counter_match, &width_match)?, &date_like)
+            }
+            FilterType::ComplexOrMixedPredicates => {
+                let int64 = batch.column(batch.schema().index_of("int64")?);
+                let float64 = batch.column(batch.schema().index_of("float64")?);
+                let utf8 = batch.column(batch.schema().index_of("utf8View")?);
+                let ts = batch.column(batch.schema().index_of("ts")?);
+                let string_branch = and(
+                    &neq(utf8, &StringViewArray::new_scalar(""))?,
+                    &lt(int64, &Int64Array::new_scalar(8))?,
+                )?;
+                let scalar_branch = and(
+                    &lt(ts, &TimestampMillisecondArray::new_scalar(100))?,
+                    &gt(float64, &Float64Array::new_scalar(95.0))?,
+                )?;
+                or(&string_branch, &scalar_branch)
+            }
+            FilterType::ProjectedDynamicFilters => {
+                let int64 = batch.column(batch.schema().index_of("int64")?);
+                let ts = batch.column(batch.schema().index_of("ts")?);
+                let item_like = lt(int64, &Int64Array::new_scalar(12))?;
+                let date_like = lt(ts, &TimestampMillisecondArray::new_scalar(9000))?;
+                and(&item_like, &date_like)
+            }
+            FilterType::ProjectedPredicate5Pct
+            | FilterType::ProjectedPredicate8Pct
+            | FilterType::ProjectedPredicate10Pct
+            | FilterType::ProjectedPredicate20Pct
+            | FilterType::ProjectedPredicate30Pct
+            | FilterType::ProjectedPredicate40Pct
+            | FilterType::ProjectedPredicate50Pct => {
+                let int64 = batch.column(batch.schema().index_of("int64")?);
+                let threshold = match self {
+                    FilterType::ProjectedPredicate5Pct => 5,
+                    FilterType::ProjectedPredicate8Pct => 8,
+                    FilterType::ProjectedPredicate10Pct => 10,
+                    FilterType::ProjectedPredicate20Pct => 20,
+                    FilterType::ProjectedPredicate30Pct => 30,
+                    FilterType::ProjectedPredicate40Pct => 40,
+                    FilterType::ProjectedPredicate50Pct => 50,
+                    _ => unreachable!(),
+                };
+                lt(int64, &Int64Array::new_scalar(threshold))
+            }
+            FilterType::QuantityRangePredicate => {
+                let int64 = batch.column(batch.schema().index_of("int64")?);
+                let lower = gt(int64, &Int64Array::new_scalar(0))?;
+                let upper = lt(int64, &Int64Array::new_scalar(21))?;
+                and(&lower, &upper)
+            }
+            FilterType::ClusteredTs8PctProjectedPredicate => {
+                let ts = batch.column(batch.schema().index_of("ts")?);
+                lt(ts, &TimestampMillisecondArray::new_scalar(800))
+            }
+            FilterType::ClusteredTs20PctProjectedPredicate => {
+                let ts = batch.column(batch.schema().index_of("ts")?);
+                lt(ts, &TimestampMillisecondArray::new_scalar(2000))
+            }
+            FilterType::SparseProjectedFactScan => {
+                let ts = batch
+                    .column(batch.schema().index_of("ts")?)
+                    .as_any()
+                    .downcast_ref::<TimestampMillisecondArray>()
+                    .unwrap();
+                Ok(BooleanArray::from(
+                    ts.values()
+                        .iter()
+                        .map(|value| value % 1000 == 0)
+                        .collect::<Vec<_>>(),
+                ))
+            }
         }
     }
 
@@ -414,7 +945,27 @@ impl FilterType {
             FilterType::UnselectiveUnclustered => &[1],
             FilterType::UnselectiveClustered => &[3],
             FilterType::Composite => &[1, 3], // Use float64 column and ts column as representative for composite
-            FilterType::Utf8ViewNonEmpty => &[2],
+            FilterType::Utf8ViewNonEmpty | FilterType::Utf8ViewMissing => &[2],
+            FilterType::ScalarPrefixUtf8Output => &[0, 3],
+            FilterType::FixedThenVarWidthPredicates | FilterType::VarWidthThenFixedPredicates => {
+                &[0, 2]
+            }
+            FilterType::MultiScalarProjectedKey => &[0, 1, 3],
+            FilterType::SparseScalarFixedOutput
+            | FilterType::ProjectedDynamicFilters
+            | FilterType::SparseProjectedPredicatesFixedOutput => &[0, 3],
+            FilterType::ComplexOrMixedPredicates => &[0, 1, 2, 3],
+            FilterType::ProjectedPredicate5Pct
+            | FilterType::ProjectedPredicate8Pct
+            | FilterType::ProjectedPredicate10Pct
+            | FilterType::ProjectedPredicate20Pct
+            | FilterType::ProjectedPredicate30Pct
+            | FilterType::ProjectedPredicate40Pct
+            | FilterType::ProjectedPredicate50Pct => &[0],
+            FilterType::QuantityRangePredicate => &[0],
+            FilterType::ClusteredTs8PctProjectedPredicate
+            | FilterType::ClusteredTs20PctProjectedPredicate => &[3],
+            FilterType::SparseProjectedFactScan => &[3],
         }
     }
 }
@@ -449,17 +1000,8 @@ fn benchmark_filters_and_projections(c: &mut Criterion) {
 
     for filter_type in filter_types {
         for proj_case in &projection_cases {
-            // All indices corresponding to the 10 columns.
-            let all_indices = vec![0, 1, 2, 3];
             let filter_col = filter_type.filter_projection().to_vec();
-            // For the projection, either select all columns or exclude the filter column(s).
-            let output_projection: Vec<usize> = match proj_case {
-                ProjectionCase::AllColumns => all_indices.clone(),
-                ProjectionCase::ExcludeFilterColumn => all_indices
-                    .into_iter()
-                    .filter(|i| !filter_col.contains(i))
-                    .collect(),
-            };
+            let output_projection = output_projection_for(filter_type, proj_case);
 
             let reader = InMemoryReader::try_new(&parquet_file).unwrap();
             let metadata = Arc::clone(reader.metadata());
@@ -510,29 +1052,975 @@ fn benchmark_filters_and_projections(c: &mut Criterion) {
     }
 }
 
-/// Use async API
-async fn benchmark_async_reader(
-    reader: InMemoryReader,
-    projection_mask: ProjectionMask,
-    row_filter: RowFilter,
-) {
-    let mut stream = ParquetRecordBatchStreamBuilder::new(reader)
-        .await
-        .unwrap()
-        .with_batch_size(8192)
-        .with_projection(projection_mask)
-        .with_row_filter(row_filter)
-        .build()
-        .unwrap();
-    while let Some(b) = stream.next().await {
-        b.unwrap(); // consume the batches, no buffering
-    }
-}
+/// Compare full scan plus post-filtering against row-level pushdown strategies.
+///
+/// This group is intentionally sync-only and smaller than [`benchmark_filters_and_projections`]:
+/// four filter types x two projection cases x four strategies, registered under ids of the form
+/// `{filter_type}/{projection_case}` + strategy name. It tracks the cases most likely to inform a
+/// future default `Auto` policy: selective random filters, clustered filters, ClickBench-like
+/// string filters, and the forced selector strategy that originally motivated apache/arrow-rs#8565.
+fn benchmark_sync_strategy_matrix(c: &mut Criterion) {
+    let parquet_file = Bytes::from(write_parquet_file());
+    let filter_types = [
+        FilterType::SelectiveUnclustered,
+        FilterType::ModeratelySelectiveClustered,
+        FilterType::ModeratelySelectiveUnclustered,
+        FilterType::Utf8ViewNonEmpty,
+    ];
+    let strategies = [
+        SyncStrategy::FullPostFilter,
+        SyncStrategy::PushdownAuto,
+        SyncStrategy::PushdownSelectors,
+        SyncStrategy::PushdownMask,
+    ];
 
-/// Like [`benchmark_async_reader`] but also threads `with_limit(limit)` into
-/// the stream builder. Used by the `LIMIT` benchmark below.
-async fn benchmark_async_reader_with_limit(
-    reader: InMemoryReader,
+    let mut group = c.benchmark_group("arrow_reader_row_filter_strategy_matrix");
+
+    for filter_type in filter_types {
+        for projection_case in [
+            ProjectionCase::AllColumns,
+            ProjectionCase::ExcludeFilterColumn,
+        ] {
+            let reader = InMemoryReader::try_new(&parquet_file).unwrap();
+            let metadata = Arc::clone(reader.metadata());
+            let schema_descr = metadata.file_metadata().schema_descr();
+            let output_projection = output_projection_for(filter_type, &projection_case);
+            let read_projection = full_post_filter_read_projection(filter_type, &output_projection);
+            let output_column_names = projection_names(&output_projection);
+            let projection_mask = ProjectionMask::roots(schema_descr, output_projection);
+            let read_projection_mask = ProjectionMask::roots(schema_descr, read_projection);
+            let pred_mask = ProjectionMask::roots(
+                schema_descr,
+                filter_type.filter_projection().iter().copied(),
+            );
+
+            for strategy in strategies {
+                let bench_id = BenchmarkId::new(
+                    format!("{filter_type}/{projection_case}"),
+                    strategy.to_string(),
+                );
+
+                group.bench_function(bench_id, |b| {
+                    b.iter(|| {
+                        let reader = reader.clone();
+                        let pred_mask = pred_mask.clone();
+                        let projection_mask = projection_mask.clone();
+                        let read_projection_mask = read_projection_mask.clone();
+                        let output_column_names = output_column_names.clone();
+
+                        match strategy {
+                            SyncStrategy::FullPostFilter => benchmark_sync_reader_post_filter(
+                                reader,
+                                read_projection_mask,
+                                output_column_names,
+                                filter_type,
+                            ),
+                            SyncStrategy::PushdownAuto => {
+                                let row_filter = row_filter_for(filter_type, pred_mask);
+                                benchmark_sync_reader_with_policy(
+                                    reader,
+                                    projection_mask,
+                                    row_filter,
+                                    RowSelectionPolicy::default(),
+                                )
+                            }
+                            SyncStrategy::PushdownSelectors => {
+                                let row_filter = row_filter_for(filter_type, pred_mask);
+                                benchmark_sync_reader_with_policy(
+                                    reader,
+                                    projection_mask,
+                                    row_filter,
+                                    RowSelectionPolicy::Selectors,
+                                )
+                            }
+                            SyncStrategy::PushdownMask => {
+                                let row_filter = row_filter_for(filter_type, pred_mask);
+                                benchmark_sync_reader_with_policy(
+                                    reader,
+                                    projection_mask,
+                                    row_filter,
+                                    RowSelectionPolicy::Mask,
+                                )
+                            }
+                        }
+                    });
+                });
+            }
+        }
+    }
+}
+
+/// Compare async full scan plus post-filtering against async row-level pushdown strategies on the
+/// [`benchmark_sync_strategy_matrix`] grid. This is the matrix that exercises the current reader
+/// `Auto` policy through the async stream backed by the push decoder row-group pipeline.
+fn benchmark_async_strategy_matrix(c: &mut Criterion) {
+    let parquet_file = Bytes::from(write_parquet_file());
+    let filter_types = [
+        FilterType::SelectiveUnclustered,
+        FilterType::ModeratelySelectiveClustered,
+        FilterType::ModeratelySelectiveUnclustered,
+        FilterType::Utf8ViewNonEmpty,
+    ];
+    let strategies = [
+        AsyncStrategy::FullPostFilter,
+        AsyncStrategy::PushdownAuto,
+        AsyncStrategy::PushdownSelectors,
+        AsyncStrategy::PushdownMask,
+    ];
+
+    let rt = tokio::runtime::Builder::new_multi_thread()
+        .enable_all()
+        .build()
+        .unwrap();
+
+    let mut group = c.benchmark_group("arrow_reader_row_filter_async_strategy_matrix");
+
+    for filter_type in filter_types {
+        for projection_case in [
+            ProjectionCase::AllColumns,
+            ProjectionCase::ExcludeFilterColumn,
+        ] {
+            let reader = InMemoryReader::try_new(&parquet_file).unwrap();
+            let metadata = Arc::clone(reader.metadata());
+            let schema_descr = metadata.file_metadata().schema_descr();
+            let output_projection = output_projection_for(filter_type, &projection_case);
+            let read_projection = full_post_filter_read_projection(filter_type, &output_projection);
+            let output_column_names = projection_names(&output_projection);
+            let projection_mask = ProjectionMask::roots(schema_descr, output_projection);
+            let read_projection_mask = ProjectionMask::roots(schema_descr, read_projection);
+            let pred_mask = ProjectionMask::roots(
+                schema_descr,
+                filter_type.filter_projection().iter().copied(),
+            );
+
+            for strategy in strategies {
+                let bench_id = BenchmarkId::new(
+                    format!("{filter_type}/{projection_case}"),
+                    strategy.to_string(),
+                );
+                let rt_captured = rt.handle().clone();
+
+                group.bench_function(bench_id, |b| {
+                    b.iter(|| {
+                        let reader = reader.clone();
+                        let pred_mask = pred_mask.clone();
+                        let projection_mask = projection_mask.clone();
+                        let read_projection_mask = read_projection_mask.clone();
+                        let output_column_names = output_column_names.clone();
+
+                        rt_captured.block_on(async {
+                            match strategy {
+                                AsyncStrategy::FullPostFilter => {
+                                    benchmark_async_reader_post_filter(
+                                        reader,
+                                        read_projection_mask,
+                                        output_column_names,
+                                        filter_type,
+                                    )
+                                    .await
+                                }
+                                AsyncStrategy::PushdownAuto => {
+                                    let row_filter = row_filter_for(filter_type, pred_mask);
+                                    benchmark_async_reader_with_policy(
+                                        reader,
+                                        projection_mask,
+                                        row_filter,
+                                        RowSelectionPolicy::default(),
+                                    )
+                                    .await
+                                }
+                                AsyncStrategy::PushdownSelectors => {
+                                    let row_filter = row_filter_for(filter_type, pred_mask);
+                                    benchmark_async_reader_with_policy(
+                                        reader,
+                                        projection_mask,
+                                        row_filter,
+                                        RowSelectionPolicy::Selectors,
+                                    )
+                                    .await
+                                }
+                                AsyncStrategy::PushdownMask => {
+                                    let row_filter = row_filter_for(filter_type, pred_mask);
+                                    benchmark_async_reader_with_policy(
+                                        reader,
+                                        projection_mask,
+                                        row_filter,
+                                        RowSelectionPolicy::Mask,
+                                    )
+                                    .await
+                                }
+                            }
+                        })
+                    });
+                });
+            }
+        }
+    }
+}
+
+/// A focused async-only matrix that isolates the cases most relevant to the
+/// row-filter Auto policy. This is intentionally narrower than
+/// [`benchmark_async_strategy_matrix`]: it keeps the benchmark output focused
+/// on cases where later PRs may teach `Auto` to switch execution modes or
+/// explicitly keep predicate pushdown.
+///
+/// The cases use structure-oriented names. Comments on [`FilterType`] keep the
+/// ClickBench and TPC-DS provenance, but these are synthetic reader shapes, not
+/// end-to-end query benchmarks.
+///
+/// Individual [`FilterType`] variants include shaded-row diagrams for the
+/// representative selection shapes.
+fn benchmark_async_auto_policy_focus(c: &mut Criterion) {
+    const SMALL_TOTAL_ROWS: usize = 20_000;
+    const SMALL_ROW_GROUP_SIZE: usize = 5_000;
+
+    let parquet_file = Bytes::from(write_parquet_file());
+    let small_parquet_file = Bytes::from(write_parquet_file_with_rows(
+        SMALL_TOTAL_ROWS,
+        SMALL_ROW_GROUP_SIZE,
+    ));
+    let cases = [
+        // Baseline selectivity shapes.
+        AsyncFocusCase::new(
+            "utf8_non_empty",
+            parquet_file.clone(),
+            FilterType::Utf8ViewNonEmpty,
+            ProjectionCase::ExcludeFilterColumn,
+        ),
+        AsyncFocusCase::new(
+            "utf8_non_empty", // NOTE(review): duplicate of the name above; confirm ids stay unique
+            parquet_file.clone(),
+            FilterType::Utf8ViewNonEmpty,
+            ProjectionCase::AllColumns,
+        ),
+        AsyncFocusCase::new(
+            "high_selectivity_float64",
+            parquet_file.clone(),
+            FilterType::UnselectiveUnclustered,
+            ProjectionCase::ExcludeFilterColumn,
+        ),
+        AsyncFocusCase::new(
+            "high_selectivity_ts_clustered",
+            parquet_file.clone(),
+            FilterType::UnselectiveClustered,
+            ProjectionCase::ExcludeFilterColumn,
+        ),
+        AsyncFocusCase::new(
+            "fragmented_int64_10pct",
+            parquet_file.clone(),
+            FilterType::ModeratelySelectiveUnclustered,
+            ProjectionCase::ExcludeFilterColumn,
+        ),
+        AsyncFocusCase::new(
+            "selective_float64_1pct",
+            parquet_file.clone(),
+            FilterType::SelectiveUnclustered,
+            ProjectionCase::ExcludeFilterColumn,
+        ),
+        // Filter-only and count-only shapes. These guard the cases where there
+        // is no deferred output column to amortize the cost of row selection.
+        AsyncFocusCase::new(
+            "point_lookup_filter_only",
+            parquet_file.clone(),
+            FilterType::PointLookup,
+            ProjectionCase::FilterColumnsOnly,
+        ),
+        AsyncFocusCase::new(
+            "projected_predicate_8pct_filter_only",
+            parquet_file.clone(),
+            FilterType::ProjectedPredicate8Pct,
+            ProjectionCase::FilterColumnsOnly,
+        ),
+        AsyncFocusCase::new(
+            "sparse_scalar_count_only",
+            parquet_file.clone(),
+            FilterType::SparseScalarFixedOutput,
+            ProjectionCase::CountOnly,
+        ),
+        AsyncFocusCase::new(
+            "small_fragmented_scalar_filter_only",
+            small_parquet_file.clone(),
+            FilterType::ModeratelySelectiveUnclustered,
+            ProjectionCase::FilterColumnsOnly,
+        ),
+        AsyncFocusCase::new(
+            "quantity_range_filter_columns_only",
+            parquet_file.clone(),
+            FilterType::QuantityRangePredicate,
+            ProjectionCase::FilterColumnsOnly,
+        ),
+        // Deferred-output shapes. Predicate columns are not part of the output,
+        // so pushdown can skip decoding projected columns for rejected rows.
+        AsyncFocusCase::new(
+            "scalar_prefix_utf8_output",
+            parquet_file.clone(),
+            FilterType::ScalarPrefixUtf8Output,
+            ProjectionCase::Utf8Only,
+        ),
+        AsyncFocusCase::new(
+            "small_scalar_prefix_utf8_output",
+            small_parquet_file.clone(),
+            FilterType::ScalarPrefixUtf8Output,
+            ProjectionCase::Utf8Only,
+        ),
+        AsyncFocusCase::new(
+            "point_lookup_deferred_fixed_output",
+            parquet_file.clone(),
+            FilterType::PointLookup,
+            ProjectionCase::Float64Only,
+        ),
+        AsyncFocusCase::new(
+            "sparse_scalar_fixed_output",
+            parquet_file.clone(),
+            FilterType::SparseScalarFixedOutput,
+            ProjectionCase::Float64Only,
+        ),
+        AsyncFocusCase::new(
+            "quantity_range_numeric_output",
+            parquet_file.clone(),
+            FilterType::QuantityRangePredicate,
+            ProjectionCase::Float64Only,
+        ),
+        // Multi-predicate shapes. These make predicate order and predicate
+        // evaluation cost visible separately from projection cost.
+        AsyncFocusCase::new(
+            "fixed_then_varwidth_predicates",
+            parquet_file.clone(),
+            FilterType::FixedThenVarWidthPredicates,
+            ProjectionCase::Float64Only,
+        ),
+        AsyncFocusCase::new(
+            "varwidth_then_fixed_predicates",
+            parquet_file.clone(),
+            FilterType::VarWidthThenFixedPredicates,
+            ProjectionCase::Float64Only,
+        ),
+        AsyncFocusCase::new(
+            "multi_scalar_projected_key",
+            parquet_file.clone(),
+            FilterType::MultiScalarProjectedKey,
+            ProjectionCase::Float64AndTs,
+        ),
+        AsyncFocusCase::new(
+            "complex_or_mixed_predicates",
+            parquet_file.clone(),
+            FilterType::ComplexOrMixedPredicates,
+            ProjectionCase::Float64Only,
+        ),
+        // Projected-predicate shapes. The predicate column is also projected,
+        // so pushdown must not assume the predicate decode is purely overhead.
+        AsyncFocusCase::new(
+            "projected_dynamic_filters",
+            parquet_file.clone(),
+            FilterType::ProjectedDynamicFilters,
+            ProjectionCase::FixedColumns,
+        ),
+        AsyncFocusCase::new(
+            "sparse_projected_predicates_fixed_output",
+            parquet_file.clone(),
+            FilterType::SparseProjectedPredicatesFixedOutput,
+            ProjectionCase::FixedColumns,
+        ),
+        AsyncFocusCase::new(
+            "projected_predicate_5pct_fixed_output",
+            parquet_file.clone(),
+            FilterType::ProjectedPredicate5Pct,
+            ProjectionCase::Int64AndFloat64,
+        ),
+        AsyncFocusCase::new(
+            "projected_predicate_8pct_fixed_output",
+            parquet_file.clone(),
+            FilterType::ProjectedPredicate8Pct,
+            ProjectionCase::Int64AndFloat64,
+        ),
+        AsyncFocusCase::new(
+            "projected_predicate_8pct_varwidth_output",
+            parquet_file.clone(),
+            FilterType::ProjectedPredicate8Pct,
+            ProjectionCase::Int64AndUtf8,
+        ),
+        AsyncFocusCase::new(
+            "projected_predicate_10pct_fixed_output",
+            parquet_file.clone(),
+            FilterType::ProjectedPredicate10Pct,
+            ProjectionCase::Int64AndFloat64,
+        ),
+        AsyncFocusCase::new(
+            "projected_predicate_20pct_fixed_output",
+            parquet_file.clone(),
+            FilterType::ProjectedPredicate20Pct,
+            ProjectionCase::Int64AndFloat64,
+        ),
+        AsyncFocusCase::new(
+            "projected_predicate_20pct_varwidth_output",
+            parquet_file.clone(),
+            FilterType::ProjectedPredicate20Pct,
+            ProjectionCase::Int64AndUtf8,
+        ),
+        AsyncFocusCase::new(
+            "projected_predicate_30pct_fixed_output",
+            parquet_file.clone(),
+            FilterType::ProjectedPredicate30Pct,
+            ProjectionCase::Int64AndFloat64,
+        ),
+        AsyncFocusCase::new(
+            "projected_predicate_40pct_fixed_output",
+            parquet_file.clone(),
+            FilterType::ProjectedPredicate40Pct,
+            ProjectionCase::Int64AndFloat64,
+        ),
+        AsyncFocusCase::new(
+            "projected_predicate_50pct_fixed_output",
+            parquet_file.clone(),
+            FilterType::ProjectedPredicate50Pct,
+            ProjectionCase::Int64AndFloat64,
+        ),
+        AsyncFocusCase::new(
+            "clustered_ts_8pct_fixed_output",
+            parquet_file.clone(),
+            FilterType::ClusteredTs8PctProjectedPredicate,
+            ProjectionCase::Float64AndTs,
+        ),
+        AsyncFocusCase::new(
+            "clustered_ts_8pct_varwidth_output",
+            parquet_file.clone(),
+            FilterType::ClusteredTs8PctProjectedPredicate,
+            ProjectionCase::TsAndUtf8,
+        ),
+        AsyncFocusCase::new(
+            "clustered_ts_20pct_fixed_output",
+            parquet_file.clone(),
+            FilterType::ClusteredTs20PctProjectedPredicate,
+            ProjectionCase::Float64AndTs,
+        ),
+        AsyncFocusCase::new(
+            "clustered_ts_20pct_varwidth_output",
+            parquet_file.clone(),
+            FilterType::ClusteredTs20PctProjectedPredicate,
+            ProjectionCase::TsAndUtf8,
+        ),
+        AsyncFocusCase::new(
+            "sparse_projected_fact_scan",
+            parquet_file.clone(),
+            FilterType::SparseProjectedFactScan,
+            ProjectionCase::FixedColumns,
+        ),
+        AsyncFocusCase::new(
+            "sparse_utf8_projected_predicate",
+            parquet_file.clone(),
+            FilterType::Utf8ViewMissing,
+            ProjectionCase::AllColumns,
+        ),
+    ];
+    let strategies = [
+        AsyncStrategy::FullPostFilter,
+        AsyncStrategy::PushdownAuto,
+        AsyncStrategy::PushdownMask,
+        AsyncStrategy::PushdownSelectors,
+    ];
+
+    let rt = tokio::runtime::Builder::new_multi_thread()
+        .enable_all()
+        .build()
+        .unwrap();
+
+    let mut group = c.benchmark_group("arrow_reader_row_filter_async_auto_policy_focus");
+
+    for case in cases {
+        benchmark_async_focus_case(&mut group, &rt, case, &strategies);
+    }
+}
+
+/// Isolate projected scans that do not construct a [`RowFilter`].
+///
+/// This tracks the reader-level shape seen in TPC-DS Q83 return-table scans:
+/// a narrow primitive projection where row-level pushdown metrics are zero.
+/// It deliberately lives outside the adaptive-materialization matrix because there is no filter
+/// strategy to choose. Columns 0, 1 and 3 are scanned through both an async and a sync helper.
+///
+/// ```text
+/// no RowFilter             projected primitive columns
+/// ┌───────────────┐    ┌───────────────┐
+/// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+/// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+/// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+/// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+/// │      ...      │    │      ...      │
+/// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+/// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+/// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+/// │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│    │▒▒▒▒▒▒▒▒▒▒▒▒▒▒▒│
+/// └───────────────┘    └───────────────┘
+/// ```
+fn benchmark_projection_scan_focus(c: &mut Criterion) {
+    let parquet_file = Bytes::from(write_parquet_file());
+    let rt = tokio::runtime::Builder::new_multi_thread()
+        .enable_all()
+        .build()
+        .unwrap();
+
+    let mut group = c.benchmark_group("arrow_reader_projection_scan_focus");
+
+    let case_name = "primitive_projection_only";
+    let projection = vec![0, 1, 3];
+    let reader = InMemoryReader::try_new(&parquet_file).unwrap();
+    let metadata = Arc::clone(reader.metadata());
+    let schema_descr = metadata.file_metadata().schema_descr();
+    let projection_mask = ProjectionMask::roots(schema_descr, projection);
+
+    let bench_id = BenchmarkId::new(case_name, "async");
+    let rt_captured = rt.handle().clone();
+    group.bench_function(bench_id, |b| {
+        b.iter(|| {
+            let reader = reader.clone();
+            let projection_mask = projection_mask.clone();
+            rt_captured.block_on(benchmark_async_reader_projected(reader, projection_mask));
+        });
+    });
+
+    let bench_id = BenchmarkId::new(case_name, "sync");
+    group.bench_function(bench_id, |b| {
+        b.iter(|| {
+            let reader = reader.clone();
+            let projection_mask = projection_mask.clone();
+            benchmark_sync_reader_projected(reader, projection_mask);
+        });
+    });
+}
+
+/// Inputs describing one case of the async focus benchmarks.
+struct AsyncFocusCase {
+    /// Label used as the first component of the Criterion benchmark id.
+    case_name: &'static str,
+    /// Encoded Parquet file the case reads from.
+    parquet_file: Bytes,
+    /// Predicate applied either as a pushed-down row filter or after decoding.
+    filter_type: FilterType,
+    /// Which columns the case outputs; resolved by `output_projection_for`.
+    projection_case: ProjectionCase,
+}
+
+impl AsyncFocusCase {
+    /// Bundles the four case inputs without any validation.
+    fn new(
+        case_name: &'static str,
+        parquet_file: Bytes,
+        filter_type: FilterType,
+        projection_case: ProjectionCase,
+    ) -> Self {
+        AsyncFocusCase {
+            case_name,
+            parquet_file,
+            filter_type,
+            projection_case,
+        }
+    }
+}
+
+/// Registers one Criterion benchmark per entry in `strategies` for `case`.
+///
+/// The reader and all projection masks are built once, outside the timed
+/// closure. Every iteration clones them and drives the chosen strategy to
+/// completion on `rt`: `FullPostFilter` decodes the output columns plus the
+/// filter columns and filters afterwards, while the `Pushdown*` strategies
+/// build a `RowFilter` and differ only in the `RowSelectionPolicy` passed on.
+fn benchmark_async_focus_case(
+    group: &mut BenchmarkGroup<'_, WallTime>,
+    rt: &tokio::runtime::Runtime,
+    case: AsyncFocusCase,
+    strategies: &[AsyncStrategy],
+) {
+    let AsyncFocusCase {
+        case_name,
+        parquet_file,
+        filter_type,
+        projection_case,
+    } = case;
+
+    let reader = InMemoryReader::try_new(&parquet_file).unwrap();
+    let metadata = Arc::clone(reader.metadata());
+    let schema_descr = metadata.file_metadata().schema_descr();
+
+    // Output columns, and the superset the post-filter path has to decode.
+    let output_projection = output_projection_for(filter_type, &projection_case);
+    let read_projection = full_post_filter_read_projection(filter_type, &output_projection);
+    let output_column_names = projection_names(&output_projection);
+    let projection_mask = ProjectionMask::roots(schema_descr, output_projection);
+    let read_projection_mask = ProjectionMask::roots(schema_descr, read_projection);
+
+    // Predicate masks handed to `row_filter_for_focus_case`.
+    let pred_mask = ProjectionMask::roots(
+        schema_descr,
+        filter_type.filter_projection().iter().copied(),
+    );
+    let fixed_pred_mask = ProjectionMask::roots(schema_descr, [0]);
+    let varwidth_pred_mask = ProjectionMask::roots(schema_descr, [2]);
+    let sparse_int64_pred_mask = ProjectionMask::roots(schema_descr, [0]);
+    let sparse_ts_pred_mask = ProjectionMask::roots(schema_descr, [3]);
+    let scalar_float64_pred_mask = ProjectionMask::roots(schema_descr, [1]);
+
+    let handle = rt.handle().clone();
+    let case_label = format!("{case_name}/{projection_case}");
+
+    for &strategy in strategies {
+        let bench_id = BenchmarkId::new(case_label.clone(), strategy.to_string());
+
+        group.bench_function(bench_id, |b| {
+            b.iter(|| {
+                // Every input is cloned on each iteration, whichever strategy runs.
+                let reader = reader.clone();
+                let pred_mask = pred_mask.clone();
+                let fixed_pred_mask = fixed_pred_mask.clone();
+                let varwidth_pred_mask = varwidth_pred_mask.clone();
+                let sparse_int64_pred_mask = sparse_int64_pred_mask.clone();
+                let sparse_ts_pred_mask = sparse_ts_pred_mask.clone();
+                let scalar_float64_pred_mask = scalar_float64_pred_mask.clone();
+                let projection_mask = projection_mask.clone();
+                let read_projection_mask = read_projection_mask.clone();
+                let output_column_names = output_column_names.clone();
+
+                handle.block_on(async {
+                    // The post-filter strategy finishes here; the pushdown
+                    // strategies only pick the selection policy.
+                    let policy = match strategy {
+                        AsyncStrategy::FullPostFilter => {
+                            return benchmark_async_reader_post_filter(
+                                reader,
+                                read_projection_mask,
+                                output_column_names,
+                                filter_type,
+                            )
+                            .await;
+                        }
+                        AsyncStrategy::PushdownAuto => RowSelectionPolicy::default(),
+                        AsyncStrategy::PushdownSelectors => RowSelectionPolicy::Selectors,
+                        AsyncStrategy::PushdownMask => RowSelectionPolicy::Mask,
+                    };
+
+                    let row_filter = row_filter_for_focus_case(
+                        filter_type,
+                        pred_mask,
+                        fixed_pred_mask,
+                        varwidth_pred_mask,
+                        sparse_int64_pred_mask,
+                        sparse_ts_pred_mask,
+                        scalar_float64_pred_mask,
+                    );
+                    benchmark_async_reader_with_policy(reader, projection_mask, row_filter, policy)
+                        .await
+                })
+            });
+        });
+    }
+}
+
+/// Returns the root column indices produced as output for `projection_case`.
+///
+/// `AllColumns` yields every index of `COLUMN_NAMES`, `ExcludeFilterColumn`
+/// yields the same set minus the columns read by `filter_type`, and
+/// `FilterColumnsOnly` yields exactly those filter columns. `CountOnly` is
+/// empty; the remaining cases map to fixed index lists.
+fn output_projection_for(filter_type: FilterType, projection_case: &ProjectionCase) -> Vec<usize> {
+    let filter_columns = filter_type.filter_projection();
+    match projection_case {
+        // Separate arms avoid re-matching the case for every column index.
+        ProjectionCase::AllColumns => (0..COLUMN_NAMES.len()).collect(),
+        ProjectionCase::ExcludeFilterColumn => (0..COLUMN_NAMES.len())
+            .filter(|idx| !filter_columns.contains(idx))
+            .collect(),
+        ProjectionCase::FilterColumnsOnly => filter_columns.to_vec(),
+        ProjectionCase::CountOnly => vec![],
+        ProjectionCase::FixedColumns => vec![0, 1, 3],
+        ProjectionCase::Float64AndTs => vec![1, 3],
+        ProjectionCase::Float64Only => vec![1],
+        ProjectionCase::Int64AndFloat64 => vec![0, 1],
+        ProjectionCase::Int64AndUtf8 => vec![0, 2],
+        ProjectionCase::TsAndUtf8 => vec![2, 3],
+        ProjectionCase::Utf8Only => vec![2],
+    }
+}
+
+/// Returns the columns the post-filter path must decode: `output_projection`
+/// plus any column read by `filter_type` that is not already present, in
+/// ascending order.
+fn full_post_filter_read_projection(
+    filter_type: FilterType,
+    output_projection: &[usize],
+) -> Vec<usize> {
+    let filter_columns = filter_type.filter_projection();
+    let mut columns = Vec::with_capacity(output_projection.len() + filter_columns.len());
+    columns.extend_from_slice(output_projection);
+    for &column in filter_columns {
+        // Checked against the growing list, so a repeated filter column is added once.
+        if !columns.contains(&column) {
+            columns.push(column);
+        }
+    }
+    columns.sort_unstable();
+    columns
+}
+
+/// Maps column indices to their names in `COLUMN_NAMES`.
+///
+/// Panics if an index is out of range for `COLUMN_NAMES`.
+fn projection_names(projection: &[usize]) -> Vec<&'static str> {
+    projection.iter().map(|&idx| COLUMN_NAMES[idx]).collect()
+}
+
+/// Projects `batch` down to `output_column_names` and keeps only the rows
+/// selected by `filter`.
+///
+/// Projection happens before filtering, so only the output columns are
+/// filtered.
+///
+/// # Errors
+///
+/// Returns an error if a name is not found in the batch schema, or if the
+/// projection or the filter kernel fails.
+pub(crate) fn filter_projected_record_batch(
+    batch: &RecordBatch,
+    filter: &BooleanArray,
+    output_column_names: &[&str],
+) -> arrow::error::Result<RecordBatch> {
+    // Fetch the schema handle once rather than once per column name.
+    let schema = batch.schema();
+    let output_projection = output_column_names
+        .iter()
+        .map(|name| schema.index_of(name))
+        .collect::<arrow::error::Result<Vec<_>>>()?;
+    let output = batch.project(&output_projection)?;
+    arrow_select::filter::filter_record_batch(&output, filter)
+}
+
+/// Returns how many rows of `batch` survive `filter` for the given output
+/// columns.
+///
+/// With no output columns the count comes straight from the filter's true
+/// count; otherwise the projected batch is filtered and its row count is
+/// returned.
+pub(crate) fn post_filter_projected_num_rows(
+    batch: &RecordBatch,
+    filter: &BooleanArray,
+    output_column_names: &[&str],
+) -> arrow::error::Result<usize> {
+    if !output_column_names.is_empty() {
+        return filter_projected_record_batch(batch, filter, output_column_names)
+            .map(|output| output.num_rows());
+    }
+
+    Ok(filter.true_count())
+}
+
+/// Wraps `filter_type` in a single-predicate `RowFilter` evaluated against
+/// the columns selected by `pred_mask`.
+fn row_filter_for(filter_type: FilterType, pred_mask: ProjectionMask) -> RowFilter {
+    RowFilter::new(vec![Box::new(ArrowPredicateFn::new(
+        pred_mask,
+        move |batch| filter_type.filter_batch(&batch),
+    ))])
+}
+
+/// Builds the pushed-down `RowFilter` for a focus case.
+///
+/// Filter types with a dedicated predicate chain get one predicate per column,
+/// each evaluated against its own mask; every other filter type falls back to
+/// the single-predicate filter from `row_filter_for` using `pred_mask`.
+/// Masks that the selected chain does not need are dropped unused.
+fn row_filter_for_focus_case(
+    filter_type: FilterType,
+    pred_mask: ProjectionMask,
+    fixed_pred_mask: ProjectionMask,
+    varwidth_pred_mask: ProjectionMask,
+    sparse_int64_pred_mask: ProjectionMask,
+    sparse_ts_pred_mask: ProjectionMask,
+    scalar_float64_pred_mask: ProjectionMask,
+) -> RowFilter {
+    match filter_type {
+        FilterType::FixedThenVarWidthPredicates | FilterType::VarWidthThenFixedPredicates => {
+            let int64_filter = ArrowPredicateFn::new(fixed_pred_mask, move |batch: RecordBatch| {
+                let int64 = batch.column(batch.schema().index_of("int64")?);
+                eq(int64, &Int64Array::new_scalar(9999))
+            });
+            let utf8_filter =
+                ArrowPredicateFn::new(varwidth_pred_mask, move |batch: RecordBatch| {
+                    let utf8 = batch.column(batch.schema().index_of("utf8View")?);
+                    neq(utf8, &StringViewArray::new_scalar(""))
+                });
+
+            // Same two predicates; only the evaluation order differs.
+            if matches!(filter_type, FilterType::FixedThenVarWidthPredicates) {
+                RowFilter::new(vec![Box::new(int64_filter), Box::new(utf8_filter)])
+            } else {
+                RowFilter::new(vec![Box::new(utf8_filter), Box::new(int64_filter)])
+            }
+        }
+        FilterType::MultiScalarProjectedKey => {
+            let int64_filter =
+                ArrowPredicateFn::new(sparse_int64_pred_mask, move |batch: RecordBatch| {
+                    let int64 = batch.column(batch.schema().index_of("int64")?);
+                    eq(int64, &Int64Array::new_scalar(62))
+                });
+            let float64_filter =
+                ArrowPredicateFn::new(scalar_float64_pred_mask, move |batch: RecordBatch| {
+                    let float64 = batch.column(batch.schema().index_of("float64")?);
+                    gt(float64, &Float64Array::new_scalar(10.0))
+                });
+            let ts_filter =
+                ArrowPredicateFn::new(sparse_ts_pred_mask, move |batch: RecordBatch| {
+                    let ts = batch.column(batch.schema().index_of("ts")?);
+                    lt(ts, &TimestampMillisecondArray::new_scalar(9000))
+                });
+
+            RowFilter::new(vec![
+                Box::new(int64_filter),
+                Box::new(float64_filter),
+                Box::new(ts_filter),
+            ])
+        }
+        FilterType::SparseScalarFixedOutput
+        | FilterType::ProjectedDynamicFilters
+        | FilterType::SparseProjectedPredicatesFixedOutput => {
+            // The bound depends only on the filter type, so pick it once here
+            // instead of on every batch inside the predicate.
+            let int64_upper_bound: i64 =
+                if matches!(filter_type, FilterType::ProjectedDynamicFilters) {
+                    12
+                } else {
+                    8
+                };
+            let int64_filter =
+                ArrowPredicateFn::new(sparse_int64_pred_mask, move |batch: RecordBatch| {
+                    let int64 = batch.column(batch.schema().index_of("int64")?);
+                    lt(int64, &Int64Array::new_scalar(int64_upper_bound))
+                });
+            let ts_filter =
+                ArrowPredicateFn::new(sparse_ts_pred_mask, move |batch: RecordBatch| {
+                    let ts = batch.column(batch.schema().index_of("ts")?);
+                    lt(ts, &TimestampMillisecondArray::new_scalar(9000))
+                });
+
+            RowFilter::new(vec![Box::new(int64_filter), Box::new(ts_filter)])
+        }
+        _ => row_filter_for(filter_type, pred_mask),
+    }
+}
+
+/// Predicates available to the nested-output benchmark.
+#[derive(Clone, Copy)]
+enum NestedFilterType {
+    /// Keeps every row without inspecting any column.
+    AlwaysTrueTag,
+    /// Keeps rows whose `tag` column differs from `"tag_0"`.
+    TagNotZero,
+}
+
+impl std::fmt::Display for NestedFilterType {
+    /// Writes the snake_case label of the variant.
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        f.write_str(match self {
+            Self::AlwaysTrueTag => "always_true_tag",
+            Self::TagNotZero => "tag_not_zero",
+        })
+    }
+}
+
+impl NestedFilterType {
+    /// Evaluates the predicate against `batch`, yielding one boolean per row.
+    ///
+    /// `TagNotZero` returns an error if `batch` has no column named `tag`.
+    fn filter_batch(self, batch: &RecordBatch) -> arrow::error::Result<BooleanArray> {
+        match self {
+            Self::AlwaysTrueTag => Ok(BooleanArray::from(vec![true; batch.num_rows()])),
+            Self::TagNotZero => {
+                let tag_idx = batch.schema().index_of("tag")?;
+                neq(
+                    batch.column(tag_idx),
+                    &StringViewArray::new_scalar("tag_0"),
+                )
+            }
+        }
+    }
+}
+
+/// Wraps a nested-benchmark predicate in a single-predicate `RowFilter`
+/// evaluated against the columns selected by `pred_mask`.
+fn nested_row_filter_for(filter_type: NestedFilterType, pred_mask: ProjectionMask) -> RowFilter {
+    RowFilter::new(vec![Box::new(ArrowPredicateFn::new(
+        pred_mask,
+        move |batch| filter_type.filter_batch(&batch),
+    ))])
+}
+
+/// Reads `reader` through the async stream API with `row_filter` pushed down.
+///
+/// Batches are requested with a batch size of 8192 and dropped as soon as
+/// they are produced; any build or read error panics.
+async fn benchmark_async_reader(
+    reader: InMemoryReader,
+    projection_mask: ProjectionMask,
+    row_filter: RowFilter,
+) {
+    let builder = ParquetRecordBatchStreamBuilder::new(reader)
+        .await
+        .unwrap()
+        .with_batch_size(8192)
+        .with_projection(projection_mask)
+        .with_row_filter(row_filter);
+    let mut stream = builder.build().unwrap();
+    while let Some(batch) = stream.next().await {
+        batch.unwrap(); // consume the batches, no buffering
+    }
+}
+
+/// Reads `reader` through the async stream API with `row_filter` pushed down
+/// and an explicit `row_selection_policy`.
+///
+/// Batches are requested with a batch size of 8192 and dropped as soon as
+/// they are produced; any build or read error panics.
+async fn benchmark_async_reader_with_policy(
+    reader: InMemoryReader,
+    projection_mask: ProjectionMask,
+    row_filter: RowFilter,
+    row_selection_policy: RowSelectionPolicy,
+) {
+    let builder = ParquetRecordBatchStreamBuilder::new(reader)
+        .await
+        .unwrap()
+        .with_batch_size(8192)
+        .with_projection(projection_mask)
+        .with_row_filter(row_filter)
+        .with_row_selection_policy(row_selection_policy);
+    let mut stream = builder.build().unwrap();
+    while let Some(batch) = stream.next().await {
+        batch.unwrap(); // consume the batches, no buffering
+    }
+}
+
+/// Async baseline without pushdown: decodes `read_projection`, evaluates
+/// `filter_type` on each decoded batch, and counts the surviving rows for
+/// `output_column_names`.
+///
+/// The per-batch count is passed through `black_box` so the work is not
+/// optimized away; any error panics.
+async fn benchmark_async_reader_post_filter(
+    reader: InMemoryReader,
+    read_projection: ProjectionMask,
+    output_column_names: Vec<&'static str>,
+    filter_type: FilterType,
+) {
+    let builder = ParquetRecordBatchStreamBuilder::new(reader)
+        .await
+        .unwrap()
+        .with_batch_size(8192)
+        .with_projection(read_projection);
+    let mut stream = builder.build().unwrap();
+
+    while let Some(next) = stream.next().await {
+        let batch = next.unwrap();
+        let keep = filter_type.filter_batch(&batch).unwrap();
+        let surviving_rows =
+            post_filter_projected_num_rows(&batch, &keep, &output_column_names).unwrap();
+        std::hint::black_box(surviving_rows);
+    }
+}
+
+/// Async baseline without pushdown for the nested benchmark: decodes
+/// `read_projection`, evaluates the nested predicate on each decoded batch,
+/// and counts the surviving rows for `output_column_names`.
+///
+/// The per-batch count is passed through `black_box`; any error panics.
+async fn benchmark_async_reader_post_filter_nested(
+    reader: InMemoryReader,
+    read_projection: ProjectionMask,
+    output_column_names: &[&str],
+    filter_type: NestedFilterType,
+) {
+    let builder = ParquetRecordBatchStreamBuilder::new(reader)
+        .await
+        .unwrap()
+        .with_batch_size(8192)
+        .with_projection(read_projection);
+    let mut stream = builder.build().unwrap();
+
+    while let Some(next) = stream.next().await {
+        let batch = next.unwrap();
+        let keep = filter_type.filter_batch(&batch).unwrap();
+        let surviving_rows =
+            post_filter_projected_num_rows(&batch, &keep, output_column_names).unwrap();
+        std::hint::black_box(surviving_rows);
+    }
+}
+
+/// Reads `reader` through the async stream API with a projection and no row
+/// filter, passing each batch's row count through `black_box`.
+async fn benchmark_async_reader_projected(reader: InMemoryReader, projection_mask: ProjectionMask) {
+    let builder = ParquetRecordBatchStreamBuilder::new(reader)
+        .await
+        .unwrap()
+        .with_batch_size(8192)
+        .with_projection(projection_mask);
+    let mut stream = builder.build().unwrap();
+    while let Some(next) = stream.next().await {
+        let row_count = next.unwrap().num_rows();
+        std::hint::black_box(row_count);
+    }
+}
+
+/// Like [`benchmark_async_reader`] but also threads `with_limit(limit)` into
+/// the stream builder. Used by the `LIMIT` benchmark below.
+async fn benchmark_async_reader_with_limit(
+    reader: InMemoryReader,
     projection_mask: ProjectionMask,
     row_filter: RowFilter,
     limit: usize,
@@ -569,6 +2057,61 @@ fn benchmark_sync_reader(
     }
 }
 
+/// Reads `reader` through the blocking reader API with `row_filter` pushed
+/// down and an explicit `row_selection_policy`.
+///
+/// Batches are requested with a batch size of 8192 and dropped as soon as
+/// they are produced; any build or read error panics.
+fn benchmark_sync_reader_with_policy(
+    reader: InMemoryReader,
+    projection_mask: ProjectionMask,
+    row_filter: RowFilter,
+    row_selection_policy: RowSelectionPolicy,
+) {
+    let builder = ParquetRecordBatchReaderBuilder::try_new(reader.into_inner())
+        .unwrap()
+        .with_batch_size(8192)
+        .with_projection(projection_mask)
+        .with_row_filter(row_filter)
+        .with_row_selection_policy(row_selection_policy);
+    let batches = builder.build().unwrap();
+    for batch in batches {
+        batch.unwrap(); // consume the batches, no buffering
+    }
+}
+
+/// Blocking baseline without pushdown: decodes `read_projection`, evaluates
+/// `filter_type` on each decoded batch, and counts the surviving rows for
+/// `output_column_names`.
+///
+/// The per-batch count is passed through `black_box`; any error panics.
+fn benchmark_sync_reader_post_filter(
+    reader: InMemoryReader,
+    read_projection: ProjectionMask,
+    output_column_names: Vec<&'static str>,
+    filter_type: FilterType,
+) {
+    let builder = ParquetRecordBatchReaderBuilder::try_new(reader.into_inner())
+        .unwrap()
+        .with_batch_size(8192)
+        .with_projection(read_projection);
+    let batches = builder.build().unwrap();
+
+    for next in batches {
+        let batch = next.unwrap();
+        let keep = filter_type.filter_batch(&batch).unwrap();
+        let surviving_rows =
+            post_filter_projected_num_rows(&batch, &keep, &output_column_names).unwrap();
+        std::hint::black_box(surviving_rows);
+    }
+}
+
+/// Reads `reader` through the blocking reader API with a projection and no
+/// row filter, passing each batch's row count through `black_box`.
+fn benchmark_sync_reader_projected(reader: InMemoryReader, projection_mask: ProjectionMask) {
+    let builder = ParquetRecordBatchReaderBuilder::try_new(reader.into_inner())
+        .unwrap()
+        .with_batch_size(8192)
+        .with_projection(projection_mask);
+    let batches = builder.build().unwrap();
+
+    for next in batches {
+        let row_count = next.unwrap().num_rows();
+        std::hint::black_box(row_count);
+    }
+}
+
 /// Adapter to read asynchronously from in memory bytes and always loads the
 /// metadata with page indexes.
 #[derive(Debug, Clone)]
@@ -636,7 +2179,6 @@ fn benchmark_filters_with_limit(c: &mut Criterion) {
         ProjectionCase::AllColumns,
         ProjectionCase::ExcludeFilterColumn,
     ];
-    let all_indices = vec![0, 1, 2, 3];
 
     let rt = tokio::runtime::Builder::new_multi_thread()
         .enable_all()
@@ -648,14 +2190,7 @@ fn benchmark_filters_with_limit(c: &mut Criterion) {
     for filter_type in filter_types {
         for proj_case in &projection_cases {
             let filter_col = filter_type.filter_projection().to_vec();
-            let output_projection: Vec<usize> = match proj_case {
-                ProjectionCase::AllColumns => all_indices.clone(),
-                ProjectionCase::ExcludeFilterColumn => all_indices
-                    .iter()
-                    .copied()
-                    .filter(|i| !filter_col.contains(i))
-                    .collect(),
-            };
+            let output_projection = output_projection_for(filter_type, proj_case);
 
             let reader = InMemoryReader::try_new(&parquet_file).unwrap();
             let metadata = Arc::clone(reader.metadata());
@@ -693,9 +2228,109 @@ fn benchmark_filters_with_limit(c: &mut Criterion) {
     }
 }
 
+/// Focused nested-output benchmark that compares manual post-filtering with
+/// the row-filter pushdown policies.
+///
+/// The predicate column (`tag`) is an unprojected variable-width scalar
+/// column, and the output (`payload`) is a whole nested `Struct` root. This
+/// isolates the reader case enabled by root-aware post-filter projection
+/// without requiring recursive nested-child projection.
+///
+/// Every strategy is benchmarked once per `NestedFilterType`.
+fn benchmark_async_nested_post_filter_focus(c: &mut Criterion) {
+    let parquet_file = Bytes::from(write_nested_parquet_file_with_rows(
+        TOTAL_ROWS,
+        ROW_GROUP_SIZE,
+    ));
+
+    let rt = tokio::runtime::Builder::new_multi_thread()
+        .enable_all()
+        .build()
+        .unwrap();
+    let handle = rt.handle().clone();
+
+    let mut group = c.benchmark_group("arrow_reader_row_filter_async_nested_post_filter_focus");
+
+    // The reader and the masks are built once; the timed closure only clones them.
+    let reader = InMemoryReader::try_new(&parquet_file).unwrap();
+    let metadata = Arc::clone(reader.metadata());
+    let schema_descr = metadata.file_metadata().schema_descr();
+    let output_projection = ProjectionMask::columns(schema_descr, ["payload"]);
+    let read_projection = ProjectionMask::columns(schema_descr, ["tag", "payload"]);
+    let pred_mask = ProjectionMask::columns(schema_descr, ["tag"]);
+
+    let strategies = [
+        AsyncStrategy::FullPostFilter,
+        AsyncStrategy::PushdownAuto,
+        AsyncStrategy::PushdownMask,
+        AsyncStrategy::PushdownSelectors,
+    ];
+    let filter_cases = [
+        NestedFilterType::AlwaysTrueTag,
+        NestedFilterType::TagNotZero,
+    ];
+
+    for filter_case in filter_cases {
+        let case_label = format!("whole_struct_output/{filter_case}");
+        for strategy in strategies {
+            let bench_id = BenchmarkId::new(case_label.clone(), strategy.to_string());
+            group.bench_function(bench_id, |b| {
+                b.iter(|| {
+                    let reader = reader.clone();
+                    let pred_mask = pred_mask.clone();
+                    let output_projection = output_projection.clone();
+                    let read_projection = read_projection.clone();
+                    handle.block_on(async {
+                        // The post-filter strategy finishes here; the pushdown
+                        // strategies only pick the selection policy.
+                        let policy = match strategy {
+                            AsyncStrategy::FullPostFilter => {
+                                return benchmark_async_reader_post_filter_nested(
+                                    reader,
+                                    read_projection,
+                                    &["payload"],
+                                    filter_case,
+                                )
+                                .await;
+                            }
+                            AsyncStrategy::PushdownAuto => RowSelectionPolicy::default(),
+                            AsyncStrategy::PushdownSelectors => RowSelectionPolicy::Selectors,
+                            AsyncStrategy::PushdownMask => RowSelectionPolicy::Mask,
+                        };
+
+                        benchmark_async_reader_with_policy(
+                            reader,
+                            output_projection,
+                            nested_row_filter_for(filter_case, pred_mask),
+                            policy,
+                        )
+                        .await
+                    })
+                });
+            });
+        }
+    }
+}
+
 criterion_group!(
     benches,
     benchmark_filters_and_projections,
+    benchmark_sync_strategy_matrix,
+    benchmark_async_strategy_matrix,
+    benchmark_async_auto_policy_focus,
+    benchmark_projection_scan_focus,
     benchmark_filters_with_limit,
+    benchmark_async_nested_post_filter_focus,
 );
 criterion_main!(benches);
diff --git a/parquet/benches/row_selection_cursor.rs b/parquet/benches/row_selection_cursor.rs
index 49c9e6d68acf..c458f5c12a52 100644
--- a/parquet/benches/row_selection_cursor.rs
+++ b/parquet/benches/row_selection_cursor.rs
@@ -15,6 +15,15 @@
 // specific language governing permissions and limitations
 // under the License.
 
+//! Benchmarks the cost of applying `RowSelection` as selector queues versus
+//! boolean masks.
+//!
+//! The broad sweep varies selector length, selection density, run-length
+//! distribution, data type, projected column count, and `Utf8View` payload size.
+//! The shape-focus suite keeps the data shape narrower and varies the maximum
+//! selected-run length (`maxrun`) so the results can show where
+//! `RowSelectionPolicy::Auto` should prefer `Selectors` or `Mask`.
+
 use std::hint;
 use std::sync::Arc;
 
@@ -34,9 +43,39 @@ const TOTAL_ROWS: usize = 1 << 20;
 const BATCH_SIZE: usize = 1 << 10;
 const BASE_SEED: u64 = 0xA55AA55A;
 const AVG_SELECTOR_LENGTHS: &[usize] = &[4, 8, 12, 16, 20, 24, 28, 32, 36, 40];
+/// Requested maximum selected-run lengths swept by the shape-focus scenarios.
+const SHAPE_FOCUS_SELECTED_RUN_LENGTHS: &[usize] = &[1, 2, 4, 8, 32];
+// At 80% selectivity, maxrun1 and maxrun2 cannot be represented without
+// zero-length skip runs, so the dense-focused cases start at maxrun4.
+const DENSE_SHAPE_FOCUS_SELECTED_RUN_LENGTHS: &[usize] = &[4, 8, 32];
 const COLUMN_WIDTHS: &[usize] = &[2, 4, 8, 16, 32];
 const UTF8VIEW_LENS: &[usize] = &[4, 8, 16, 32, 64, 128, 256];
 const BENCH_MODES: &[BenchMode] = &[BenchMode::ReadSelector, BenchMode::ReadMask];
+/// Selectivity scenarios exercised by `bench_shape_focus`.
+///
+/// Only `dense80` starts each run with a select and uses the dense
+/// run-length list; the other scenarios start with a skip.
+const SHAPE_FOCUS_SCENARIOS: &[ShapeFocusScenario] = &[
+    ShapeFocusScenario {
+        name: "sparse10",
+        select_ratio: 0.1,
+        start_with_select: false,
+        selected_run_lengths: SHAPE_FOCUS_SELECTED_RUN_LENGTHS,
+    },
+    ShapeFocusScenario {
+        name: "sparse20",
+        select_ratio: 0.2,
+        start_with_select: false,
+        selected_run_lengths: SHAPE_FOCUS_SELECTED_RUN_LENGTHS,
+    },
+    ShapeFocusScenario {
+        name: "moderate40",
+        select_ratio: 0.4,
+        start_with_select: false,
+        selected_run_lengths: SHAPE_FOCUS_SELECTED_RUN_LENGTHS,
+    },
+    ShapeFocusScenario {
+        name: "dense80",
+        select_ratio: 0.8,
+        start_with_select: true,
+        selected_run_lengths: DENSE_SHAPE_FOCUS_SELECTED_RUN_LENGTHS,
+    },
+];
 
 struct DataProfile {
     name: &'static str,
@@ -203,6 +242,66 @@ fn criterion_benchmark(c: &mut Criterion) {
             BASE_SEED ^ ((offset as u64) << 40),
         );
     }
+
+    bench_shape_focus(c);
+}
+
+/// Focused selector-shape matrix comparing `Selectors` with `Mask`.
+///
+/// The input profile is fixed to `int32` and `utf8view`; the sweep varies
+/// selectivity and the requested maximum selected-run length. The benchmark
+/// suffix reports this as `maxrunNN` because the final selected run may be
+/// shorter than the requested maximum.
+///
+/// Panics if a scenario and run length combination yields no selectors.
+fn bench_shape_focus(c: &mut Criterion) {
+    let profiles = [
+        DataProfile {
+            name: "int32",
+            build_batch: build_int32_batch,
+        },
+        DataProfile {
+            name: "utf8view",
+            build_batch: build_utf8view_batch,
+        },
+    ];
+
+    for profile in profiles {
+        // One encoded file per profile, cloned into every benchmark input below.
+        let parquet_data = build_parquet_data(TOTAL_ROWS, profile.build_batch);
+        for scenario in shape_focus_scenarios() {
+            for &max_run in scenario.selected_run_lengths {
+                let selectors = generate_shape_focus_selectors(max_run, TOTAL_ROWS, scenario);
+                assert!(
+                    !selectors.is_empty(),
+                    "invalid shape focus case {} maxrun {}",
+                    scenario.name,
+                    max_run
+                );
+
+                // The suffix is derived from the selectors before they are consumed.
+                let suffix = shape_focus_suffix(scenario, profile.name, max_run, &selectors);
+                let bench_input = BenchInput {
+                    parquet_data: parquet_data.clone(),
+                    selection: RowSelection::from(selectors),
+                };
+
+                for mode in BENCH_MODES.iter().copied() {
+                    c.bench_with_input(
+                        BenchmarkId::new(mode.label(), &suffix),
+                        &bench_input,
+                        |b, input| {
+                            b.iter(|| {
+                                let total =
+                                    run_read(&input.parquet_data, &input.selection, mode.policy());
+                                hint::black_box(total);
+                            });
+                        },
+                    );
+                }
+            }
+        }
+    }
 }
 
 fn bench_over_lengths(
@@ -349,6 +448,13 @@ struct Scenario {
     distribution: RunDistribution,
 }
 
+/// One selectivity scenario of the shape-focus benchmark suite.
+pub(crate) struct ShapeFocusScenario {
+    /// Scenario label; it appears in the panic message for invalid cases.
+    pub(crate) name: &'static str,
+    /// Fraction of rows to select; the selector generator asserts it is in `[0, 1]`.
+    select_ratio: f64,
+    /// When true, each generated run emits its select before its skip.
+    start_with_select: bool,
+    /// Requested maximum selected-run lengths benchmarked for this scenario.
+    pub(crate) selected_run_lengths: &'static [usize],
+}
+
 #[derive(Clone)]
 enum RunDistribution {
     Constant,
@@ -409,6 +515,87 @@ fn generate_selectors(
     selection.into()
 }
 
+/// Returns the static table of shape-focus scenarios (`SHAPE_FOCUS_SCENARIOS`).
+pub(crate) fn shape_focus_scenarios() -> &'static [ShapeFocusScenario] {
+    SHAPE_FOCUS_SCENARIOS
+}
+
+/// Builds the row selectors for one shape-focus benchmark case.
+///
+/// `total_rows` is processed in cycles of at most 1,000 rows. Within a cycle,
+/// `scenario.select_ratio` of the rows (rounded to the nearest row) are selected,
+/// split into runs of at most `selected_run_len` rows, and the rows left over are
+/// spread across one skip per run as evenly as possible. `scenario.start_with_select`
+/// decides whether each pair is emitted as select-then-skip or skip-then-select.
+/// A cycle whose rounded selection is zero rows, or all of its rows, becomes a
+/// single skip or a single select.
+///
+/// Returns an empty `Vec` when a cycle has fewer skipped rows than selected runs,
+/// i.e. the runs could not each be paired with a non-empty skip.
+///
+/// # Panics
+///
+/// Panics if `selected_run_len` is zero or `scenario.select_ratio` is outside `[0, 1]`.
+pub(crate) fn generate_shape_focus_selectors(
+    selected_run_len: usize,
+    total_rows: usize,
+    scenario: &ShapeFocusScenario,
+) -> Vec<RowSelector> {
+    const CYCLE_ROWS: usize = 1_000;
+
+    assert!(selected_run_len > 0);
+    assert!(
+        (0.0..=1.0).contains(&scenario.select_ratio),
+        "select_ratio must be in [0, 1]"
+    );
+
+    let mut out = Vec::new();
+    let mut cycle_start = 0;
+
+    while cycle_start < total_rows {
+        // The final cycle may be shorter than CYCLE_ROWS.
+        let window = (total_rows - cycle_start).min(CYCLE_ROWS);
+        cycle_start += window;
+
+        let picked = (window as f64 * scenario.select_ratio).round() as usize;
+        if picked == 0 {
+            out.push(RowSelector::skip(window));
+            continue;
+        }
+        if picked >= window {
+            out.push(RowSelector::select(window));
+            continue;
+        }
+
+        let run_count = picked.div_ceil(selected_run_len);
+        let gap_rows = window - picked;
+        if gap_rows < run_count {
+            // Not enough skipped rows to separate every run: report an invalid case.
+            return Vec::new();
+        }
+
+        // The first `wider_gaps` skips absorb the remainder, one extra row each.
+        let (gap_base, wider_gaps) = (gap_rows / run_count, gap_rows % run_count);
+        let mut unplaced = picked;
+
+        for idx in 0..run_count {
+            let gap = gap_base + usize::from(idx < wider_gaps);
+            // Only the last run of a cycle can be shorter than `selected_run_len`.
+            let run = unplaced.min(selected_run_len);
+            unplaced -= run;
+
+            let pair = if scenario.start_with_select {
+                [RowSelector::select(run), RowSelector::skip(gap)]
+            } else {
+                [RowSelector::skip(gap), RowSelector::select(run)]
+            };
+            out.extend(pair);
+        }
+    }
+
+    // Round-trip through `RowSelection` so callers get the selector list in the form
+    // that type produces. NOTE(review): believed to merge adjacent same-kind
+    // selectors; confirm against `RowSelection`'s `From<Vec<RowSelector>>` impl.
+    RowSelection::from(out).into()
+}
+
+/// Formats the benchmark id suffix for one shape-focus case.
+///
+/// The suffix has the form
+/// `shape-focus-<scenario>-<profile>-maxrun<NN>-avg<X.Y>-sel<NN>`, where `maxrun`
+/// is `selected_run_len` zero-padded to two digits, `avg` is the
+/// `average_selector_len` reported by `SelectorStats` with one decimal place, and
+/// `sel` is the `select_ratio` reported by `SelectorStats` as a percentage rounded
+/// to the nearest integer.
+pub(crate) fn shape_focus_suffix(
+    scenario: &ShapeFocusScenario,
+    profile_name: &str,
+    selected_run_len: usize,
+    selectors: &[RowSelector],
+) -> String {
+    let stats = SelectorStats::new(selectors);
+    let selected_percent = (stats.select_ratio * 100.0).round() as u32;
+
+    format!(
+        "shape-focus-{}-{}-maxrun{:02}-avg{:.1}-sel{:02}",
+        scenario.name,
+        profile_name,
+        selected_run_len,
+        stats.average_selector_len,
+        selected_percent
+    )
+}
+
 fn sample_length(mean: f64, distribution: &RunDistribution, rng: &mut StdRng) -> usize {
     match distribution {
         RunDistribution::Constant => mean.round().max(1.0) as usize,